Training in progress, step 696
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:431790197d033ed83a237d50da74065654ba8b057580a76fcdb350483865d374
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb4b8611b2b8e2d72516004247d307272e227f6aa6000c7b10f96848b75bdd5c
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6dd873d8f2b78cc8ce909638e9a3698da4d7f193d671d0112e075b9af620ed98
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e36916674c1e7bde773b02c861c6ca1c1d09241990ebc523ca5286dff166db17
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -603,3 +603,95 @@
|
|
603 |
{"current_steps": 603, "total_steps": 696, "loss": 0.3484, "lr": 5.347602368086563e-07, "epoch": 2.5954088952654235, "percentage": 86.64, "elapsed_time": "3:23:07", "remaining_time": "0:31:19"}
|
604 |
{"current_steps": 604, "total_steps": 696, "loss": 0.3596, "lr": 5.235258128979676e-07, "epoch": 2.599713055954089, "percentage": 86.78, "elapsed_time": "3:23:26", "remaining_time": "0:30:59"}
|
605 |
{"current_steps": 605, "total_steps": 696, "loss": 0.3605, "lr": 5.124041311215544e-07, "epoch": 2.6040172166427547, "percentage": 86.93, "elapsed_time": "3:23:47", "remaining_time": "0:30:39"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
603 |
{"current_steps": 603, "total_steps": 696, "loss": 0.3484, "lr": 5.347602368086563e-07, "epoch": 2.5954088952654235, "percentage": 86.64, "elapsed_time": "3:23:07", "remaining_time": "0:31:19"}
|
604 |
{"current_steps": 604, "total_steps": 696, "loss": 0.3596, "lr": 5.235258128979676e-07, "epoch": 2.599713055954089, "percentage": 86.78, "elapsed_time": "3:23:26", "remaining_time": "0:30:59"}
|
605 |
{"current_steps": 605, "total_steps": 696, "loss": 0.3605, "lr": 5.124041311215544e-07, "epoch": 2.6040172166427547, "percentage": 86.93, "elapsed_time": "3:23:47", "remaining_time": "0:30:39"}
|
606 |
+
{"current_steps": 606, "total_steps": 696, "loss": 0.4133, "lr": 5.0139547158427e-07, "epoch": 2.6083213773314204, "percentage": 87.07, "elapsed_time": "3:24:08", "remaining_time": "0:30:19"}
|
607 |
+
{"current_steps": 607, "total_steps": 696, "loss": 0.3752, "lr": 4.905001115444475e-07, "epoch": 2.6126255380200862, "percentage": 87.21, "elapsed_time": "3:24:28", "remaining_time": "0:29:58"}
|
608 |
+
{"current_steps": 608, "total_steps": 696, "loss": 0.3829, "lr": 4.797183254069176e-07, "epoch": 2.616929698708752, "percentage": 87.36, "elapsed_time": "3:24:45", "remaining_time": "0:29:38"}
|
609 |
+
{"current_steps": 609, "total_steps": 696, "loss": 0.4159, "lr": 4.690503847160982e-07, "epoch": 2.6212338593974174, "percentage": 87.5, "elapsed_time": "3:25:07", "remaining_time": "0:29:18"}
|
610 |
+
{"current_steps": 610, "total_steps": 696, "loss": 0.3548, "lr": 4.5849655814915683e-07, "epoch": 2.625538020086083, "percentage": 87.64, "elapsed_time": "3:25:23", "remaining_time": "0:28:57"}
|
611 |
+
{"current_steps": 611, "total_steps": 696, "loss": 0.3677, "lr": 4.4805711150924304e-07, "epoch": 2.629842180774749, "percentage": 87.79, "elapsed_time": "3:25:43", "remaining_time": "0:28:37"}
|
612 |
+
{"current_steps": 612, "total_steps": 696, "loss": 0.4144, "lr": 4.3773230771879004e-07, "epoch": 2.6341463414634148, "percentage": 87.93, "elapsed_time": "3:26:05", "remaining_time": "0:28:17"}
|
613 |
+
{"current_steps": 613, "total_steps": 696, "loss": 0.3533, "lr": 4.2752240681290027e-07, "epoch": 2.6384505021520805, "percentage": 88.07, "elapsed_time": "3:26:23", "remaining_time": "0:27:56"}
|
614 |
+
{"current_steps": 614, "total_steps": 696, "loss": 0.3949, "lr": 4.1742766593278974e-07, "epoch": 2.642754662840746, "percentage": 88.22, "elapsed_time": "3:26:44", "remaining_time": "0:27:36"}
|
615 |
+
{"current_steps": 615, "total_steps": 696, "loss": 0.3824, "lr": 4.074483393193135e-07, "epoch": 2.6470588235294117, "percentage": 88.36, "elapsed_time": "3:27:04", "remaining_time": "0:27:16"}
|
616 |
+
{"current_steps": 616, "total_steps": 696, "loss": 0.3311, "lr": 3.9758467830656623e-07, "epoch": 2.6513629842180775, "percentage": 88.51, "elapsed_time": "3:27:24", "remaining_time": "0:26:56"}
|
617 |
+
{"current_steps": 617, "total_steps": 696, "loss": 0.3832, "lr": 3.8783693131554836e-07, "epoch": 2.6556671449067433, "percentage": 88.65, "elapsed_time": "3:27:44", "remaining_time": "0:26:35"}
|
618 |
+
{"current_steps": 618, "total_steps": 696, "loss": 0.3637, "lr": 3.782053438479094e-07, "epoch": 2.659971305595409, "percentage": 88.79, "elapsed_time": "3:28:01", "remaining_time": "0:26:15"}
|
619 |
+
{"current_steps": 619, "total_steps": 696, "loss": 0.3638, "lr": 3.686901584797675e-07, "epoch": 2.6642754662840744, "percentage": 88.94, "elapsed_time": "3:28:17", "remaining_time": "0:25:54"}
|
620 |
+
{"current_steps": 620, "total_steps": 696, "loss": 0.376, "lr": 3.5929161485559694e-07, "epoch": 2.66857962697274, "percentage": 89.08, "elapsed_time": "3:28:37", "remaining_time": "0:25:34"}
|
621 |
+
{"current_steps": 621, "total_steps": 696, "loss": 0.372, "lr": 3.5000994968219406e-07, "epoch": 2.672883787661406, "percentage": 89.22, "elapsed_time": "3:28:57", "remaining_time": "0:25:14"}
|
622 |
+
{"current_steps": 622, "total_steps": 696, "loss": 0.361, "lr": 3.4084539672271764e-07, "epoch": 2.677187948350072, "percentage": 89.37, "elapsed_time": "3:29:18", "remaining_time": "0:24:54"}
|
623 |
+
{"current_steps": 623, "total_steps": 696, "loss": 0.3799, "lr": 3.3179818679079936e-07, "epoch": 2.6814921090387376, "percentage": 89.51, "elapsed_time": "3:29:40", "remaining_time": "0:24:34"}
|
624 |
+
{"current_steps": 624, "total_steps": 696, "loss": 0.3515, "lr": 3.228685477447291e-07, "epoch": 2.685796269727403, "percentage": 89.66, "elapsed_time": "3:30:01", "remaining_time": "0:24:14"}
|
625 |
+
{"current_steps": 625, "total_steps": 696, "loss": 0.383, "lr": 3.140567044817172e-07, "epoch": 2.6901004304160687, "percentage": 89.8, "elapsed_time": "3:30:19", "remaining_time": "0:23:53"}
|
626 |
+
{"current_steps": 626, "total_steps": 696, "loss": 0.3733, "lr": 3.0536287893223603e-07, "epoch": 2.6944045911047345, "percentage": 89.94, "elapsed_time": "3:30:36", "remaining_time": "0:23:33"}
|
627 |
+
{"current_steps": 627, "total_steps": 696, "loss": 0.3751, "lr": 2.967872900544194e-07, "epoch": 2.6987087517934003, "percentage": 90.09, "elapsed_time": "3:30:56", "remaining_time": "0:23:12"}
|
628 |
+
{"current_steps": 628, "total_steps": 696, "loss": 0.3578, "lr": 2.883301538285582e-07, "epoch": 2.703012912482066, "percentage": 90.23, "elapsed_time": "3:31:17", "remaining_time": "0:22:52"}
|
629 |
+
{"current_steps": 629, "total_steps": 696, "loss": 0.4041, "lr": 2.799916832516575e-07, "epoch": 2.7073170731707314, "percentage": 90.37, "elapsed_time": "3:31:38", "remaining_time": "0:22:32"}
|
630 |
+
{"current_steps": 630, "total_steps": 696, "loss": 0.3779, "lr": 2.717720883320685e-07, "epoch": 2.7116212338593977, "percentage": 90.52, "elapsed_time": "3:31:56", "remaining_time": "0:22:12"}
|
631 |
+
{"current_steps": 631, "total_steps": 696, "loss": 0.3444, "lr": 2.6367157608420347e-07, "epoch": 2.715925394548063, "percentage": 90.66, "elapsed_time": "3:32:17", "remaining_time": "0:21:52"}
|
632 |
+
{"current_steps": 632, "total_steps": 696, "loss": 0.3881, "lr": 2.556903505233216e-07, "epoch": 2.720229555236729, "percentage": 90.8, "elapsed_time": "3:32:37", "remaining_time": "0:21:31"}
|
633 |
+
{"current_steps": 633, "total_steps": 696, "loss": 0.3657, "lr": 2.4782861266038904e-07, "epoch": 2.7245337159253946, "percentage": 90.95, "elapsed_time": "3:32:57", "remaining_time": "0:21:11"}
|
634 |
+
{"current_steps": 634, "total_steps": 696, "loss": 0.3845, "lr": 2.4008656049701875e-07, "epoch": 2.7288378766140604, "percentage": 91.09, "elapsed_time": "3:33:13", "remaining_time": "0:20:51"}
|
635 |
+
{"current_steps": 635, "total_steps": 696, "loss": 0.3815, "lr": 2.3246438902048196e-07, "epoch": 2.733142037302726, "percentage": 91.24, "elapsed_time": "3:33:35", "remaining_time": "0:20:31"}
|
636 |
+
{"current_steps": 636, "total_steps": 696, "loss": 0.3297, "lr": 2.2496229019879635e-07, "epoch": 2.7374461979913915, "percentage": 91.38, "elapsed_time": "3:33:56", "remaining_time": "0:20:10"}
|
637 |
+
{"current_steps": 637, "total_steps": 696, "loss": 0.3956, "lr": 2.175804529758929e-07, "epoch": 2.7417503586800573, "percentage": 91.52, "elapsed_time": "3:34:17", "remaining_time": "0:19:50"}
|
638 |
+
{"current_steps": 638, "total_steps": 696, "loss": 0.3644, "lr": 2.1031906326685946e-07, "epoch": 2.746054519368723, "percentage": 91.67, "elapsed_time": "3:34:36", "remaining_time": "0:19:30"}
|
639 |
+
{"current_steps": 639, "total_steps": 696, "loss": 0.4271, "lr": 2.0317830395325255e-07, "epoch": 2.750358680057389, "percentage": 91.81, "elapsed_time": "3:34:57", "remaining_time": "0:19:10"}
|
640 |
+
{"current_steps": 640, "total_steps": 696, "loss": 0.3978, "lr": 1.9615835487849677e-07, "epoch": 2.7546628407460547, "percentage": 91.95, "elapsed_time": "3:35:16", "remaining_time": "0:18:50"}
|
641 |
+
{"current_steps": 641, "total_steps": 696, "loss": 0.4061, "lr": 1.8925939284335225e-07, "epoch": 2.75896700143472, "percentage": 92.1, "elapsed_time": "3:35:38", "remaining_time": "0:18:30"}
|
642 |
+
{"current_steps": 642, "total_steps": 696, "loss": 0.3499, "lr": 1.824815916014644e-07, "epoch": 2.763271162123386, "percentage": 92.24, "elapsed_time": "3:36:00", "remaining_time": "0:18:10"}
|
643 |
+
{"current_steps": 643, "total_steps": 696, "loss": 0.3588, "lr": 1.7582512185498446e-07, "epoch": 2.7675753228120517, "percentage": 92.39, "elapsed_time": "3:36:21", "remaining_time": "0:17:49"}
|
644 |
+
{"current_steps": 644, "total_steps": 696, "loss": 0.3768, "lr": 1.6929015125027314e-07, "epoch": 2.7718794835007174, "percentage": 92.53, "elapsed_time": "3:36:44", "remaining_time": "0:17:30"}
|
645 |
+
{"current_steps": 645, "total_steps": 696, "loss": 0.3517, "lr": 1.6287684437367724e-07, "epoch": 2.7761836441893832, "percentage": 92.67, "elapsed_time": "3:37:03", "remaining_time": "0:17:09"}
|
646 |
+
{"current_steps": 646, "total_steps": 696, "loss": 0.3764, "lr": 1.5658536274738623e-07, "epoch": 2.7804878048780486, "percentage": 92.82, "elapsed_time": "3:37:20", "remaining_time": "0:16:49"}
|
647 |
+
{"current_steps": 647, "total_steps": 696, "loss": 0.3823, "lr": 1.504158648253584e-07, "epoch": 2.7847919655667144, "percentage": 92.96, "elapsed_time": "3:37:40", "remaining_time": "0:16:29"}
|
648 |
+
{"current_steps": 648, "total_steps": 696, "loss": 0.3456, "lr": 1.443685059893396e-07, "epoch": 2.78909612625538, "percentage": 93.1, "elapsed_time": "3:38:02", "remaining_time": "0:16:09"}
|
649 |
+
{"current_steps": 649, "total_steps": 696, "loss": 0.3695, "lr": 1.3844343854494123e-07, "epoch": 2.793400286944046, "percentage": 93.25, "elapsed_time": "3:38:21", "remaining_time": "0:15:48"}
|
650 |
+
{"current_steps": 650, "total_steps": 696, "loss": 0.3661, "lr": 1.3264081171780797e-07, "epoch": 2.7977044476327118, "percentage": 93.39, "elapsed_time": "3:38:41", "remaining_time": "0:15:28"}
|
651 |
+
{"current_steps": 651, "total_steps": 696, "loss": 0.3741, "lr": 1.2696077164986e-07, "epoch": 2.802008608321377, "percentage": 93.53, "elapsed_time": "3:39:03", "remaining_time": "0:15:08"}
|
652 |
+
{"current_steps": 652, "total_steps": 696, "loss": 0.3896, "lr": 1.2140346139561277e-07, "epoch": 2.806312769010043, "percentage": 93.68, "elapsed_time": "3:39:23", "remaining_time": "0:14:48"}
|
653 |
+
{"current_steps": 653, "total_steps": 696, "loss": 0.3667, "lr": 1.1596902091857043e-07, "epoch": 2.8106169296987087, "percentage": 93.82, "elapsed_time": "3:39:41", "remaining_time": "0:14:27"}
|
654 |
+
{"current_steps": 654, "total_steps": 696, "loss": 0.3591, "lr": 1.1065758708770468e-07, "epoch": 2.8149210903873745, "percentage": 93.97, "elapsed_time": "3:40:02", "remaining_time": "0:14:07"}
|
655 |
+
{"current_steps": 655, "total_steps": 696, "loss": 0.3288, "lr": 1.0546929367400705e-07, "epoch": 2.8192252510760403, "percentage": 94.11, "elapsed_time": "3:40:19", "remaining_time": "0:13:47"}
|
656 |
+
{"current_steps": 656, "total_steps": 696, "loss": 0.393, "lr": 1.004042713471165e-07, "epoch": 2.8235294117647056, "percentage": 94.25, "elapsed_time": "3:40:40", "remaining_time": "0:13:27"}
|
657 |
+
{"current_steps": 657, "total_steps": 696, "loss": 0.3538, "lr": 9.546264767203328e-08, "epoch": 2.827833572453372, "percentage": 94.4, "elapsed_time": "3:41:01", "remaining_time": "0:13:07"}
|
658 |
+
{"current_steps": 658, "total_steps": 696, "loss": 0.3927, "lr": 9.064454710590253e-08, "epoch": 2.832137733142037, "percentage": 94.54, "elapsed_time": "3:41:18", "remaining_time": "0:12:46"}
|
659 |
+
{"current_steps": 659, "total_steps": 696, "loss": 0.377, "lr": 8.595009099488238e-08, "epoch": 2.836441893830703, "percentage": 94.68, "elapsed_time": "3:41:39", "remaining_time": "0:12:26"}
|
660 |
+
{"current_steps": 660, "total_steps": 696, "loss": 0.3939, "lr": 8.137939757108526e-08, "epoch": 2.840746054519369, "percentage": 94.83, "elapsed_time": "3:41:58", "remaining_time": "0:12:06"}
|
661 |
+
{"current_steps": 661, "total_steps": 696, "loss": 0.3562, "lr": 7.693258194960252e-08, "epoch": 2.8450502152080346, "percentage": 94.97, "elapsed_time": "3:42:15", "remaining_time": "0:11:46"}
|
662 |
+
{"current_steps": 662, "total_steps": 696, "loss": 0.3841, "lr": 7.260975612560173e-08, "epoch": 2.8493543758967004, "percentage": 95.11, "elapsed_time": "3:42:33", "remaining_time": "0:11:25"}
|
663 |
+
{"current_steps": 663, "total_steps": 696, "loss": 0.3377, "lr": 6.84110289715112e-08, "epoch": 2.8536585365853657, "percentage": 95.26, "elapsed_time": "3:42:52", "remaining_time": "0:11:05"}
|
664 |
+
{"current_steps": 664, "total_steps": 696, "loss": 0.4037, "lr": 6.433650623427379e-08, "epoch": 2.8579626972740315, "percentage": 95.4, "elapsed_time": "3:43:12", "remaining_time": "0:10:45"}
|
665 |
+
{"current_steps": 665, "total_steps": 696, "loss": 0.3728, "lr": 6.038629053268464e-08, "epoch": 2.8622668579626973, "percentage": 95.55, "elapsed_time": "3:43:33", "remaining_time": "0:10:25"}
|
666 |
+
{"current_steps": 666, "total_steps": 696, "loss": 0.356, "lr": 5.6560481354807625e-08, "epoch": 2.866571018651363, "percentage": 95.69, "elapsed_time": "3:43:54", "remaining_time": "0:10:05"}
|
667 |
+
{"current_steps": 667, "total_steps": 696, "loss": 0.3998, "lr": 5.285917505546967e-08, "epoch": 2.870875179340029, "percentage": 95.83, "elapsed_time": "3:44:16", "remaining_time": "0:09:45"}
|
668 |
+
{"current_steps": 668, "total_steps": 696, "loss": 0.3753, "lr": 4.928246485383148e-08, "epoch": 2.8751793400286942, "percentage": 95.98, "elapsed_time": "3:44:34", "remaining_time": "0:09:24"}
|
669 |
+
{"current_steps": 669, "total_steps": 696, "loss": 0.393, "lr": 4.583044083104282e-08, "epoch": 2.87948350071736, "percentage": 96.12, "elapsed_time": "3:44:55", "remaining_time": "0:09:04"}
|
670 |
+
{"current_steps": 670, "total_steps": 696, "loss": 0.3897, "lr": 4.250318992797375e-08, "epoch": 2.883787661406026, "percentage": 96.26, "elapsed_time": "3:45:15", "remaining_time": "0:08:44"}
|
671 |
+
{"current_steps": 671, "total_steps": 696, "loss": 0.3355, "lr": 3.9300795943021943e-08, "epoch": 2.8880918220946916, "percentage": 96.41, "elapsed_time": "3:45:32", "remaining_time": "0:08:24"}
|
672 |
+
{"current_steps": 672, "total_steps": 696, "loss": 0.379, "lr": 3.622333953000601e-08, "epoch": 2.8923959827833574, "percentage": 96.55, "elapsed_time": "3:45:54", "remaining_time": "0:08:04"}
|
673 |
+
{"current_steps": 673, "total_steps": 696, "loss": 0.3706, "lr": 3.3270898196129944e-08, "epoch": 2.8967001434720228, "percentage": 96.7, "elapsed_time": "3:46:14", "remaining_time": "0:07:43"}
|
674 |
+
{"current_steps": 674, "total_steps": 696, "loss": 0.3586, "lr": 3.0443546300035764e-08, "epoch": 2.9010043041606886, "percentage": 96.84, "elapsed_time": "3:46:33", "remaining_time": "0:07:23"}
|
675 |
+
{"current_steps": 675, "total_steps": 696, "loss": 0.4084, "lr": 2.77413550499267e-08, "epoch": 2.9053084648493543, "percentage": 96.98, "elapsed_time": "3:46:54", "remaining_time": "0:07:03"}
|
676 |
+
{"current_steps": 676, "total_steps": 696, "loss": 0.3481, "lr": 2.516439250177749e-08, "epoch": 2.90961262553802, "percentage": 97.13, "elapsed_time": "3:47:15", "remaining_time": "0:06:43"}
|
677 |
+
{"current_steps": 677, "total_steps": 696, "loss": 0.378, "lr": 2.2712723557616335e-08, "epoch": 2.913916786226686, "percentage": 97.27, "elapsed_time": "3:47:37", "remaining_time": "0:06:23"}
|
678 |
+
{"current_steps": 678, "total_steps": 696, "loss": 0.3678, "lr": 2.038640996389285e-08, "epoch": 2.9182209469153513, "percentage": 97.41, "elapsed_time": "3:47:56", "remaining_time": "0:06:03"}
|
679 |
+
{"current_steps": 679, "total_steps": 696, "loss": 0.3775, "lr": 1.818551030992377e-08, "epoch": 2.922525107604017, "percentage": 97.56, "elapsed_time": "3:48:18", "remaining_time": "0:05:42"}
|
680 |
+
{"current_steps": 680, "total_steps": 696, "loss": 0.3711, "lr": 1.6110080026414123e-08, "epoch": 2.926829268292683, "percentage": 97.7, "elapsed_time": "3:48:35", "remaining_time": "0:05:22"}
|
681 |
+
{"current_steps": 681, "total_steps": 696, "loss": 0.3636, "lr": 1.4160171384064447e-08, "epoch": 2.9311334289813487, "percentage": 97.84, "elapsed_time": "3:48:56", "remaining_time": "0:05:02"}
|
682 |
+
{"current_steps": 682, "total_steps": 696, "loss": 0.3957, "lr": 1.2335833492252425e-08, "epoch": 2.9354375896700144, "percentage": 97.99, "elapsed_time": "3:49:16", "remaining_time": "0:04:42"}
|
683 |
+
{"current_steps": 683, "total_steps": 696, "loss": 0.382, "lr": 1.063711229779718e-08, "epoch": 2.93974175035868, "percentage": 98.13, "elapsed_time": "3:49:35", "remaining_time": "0:04:22"}
|
684 |
+
{"current_steps": 684, "total_steps": 696, "loss": 0.3698, "lr": 9.06405058380022e-09, "epoch": 2.944045911047346, "percentage": 98.28, "elapsed_time": "3:49:56", "remaining_time": "0:04:02"}
|
685 |
+
{"current_steps": 685, "total_steps": 696, "loss": 0.3711, "lr": 7.61668796857018e-09, "epoch": 2.9483500717360114, "percentage": 98.42, "elapsed_time": "3:50:18", "remaining_time": "0:03:41"}
|
686 |
+
{"current_steps": 686, "total_steps": 696, "loss": 0.3881, "lr": 6.295060904623618e-09, "epoch": 2.952654232424677, "percentage": 98.56, "elapsed_time": "3:50:38", "remaining_time": "0:03:21"}
|
687 |
+
{"current_steps": 687, "total_steps": 696, "loss": 0.4193, "lr": 5.099202677767978e-09, "epoch": 2.956958393113343, "percentage": 98.71, "elapsed_time": "3:50:57", "remaining_time": "0:03:01"}
|
688 |
+
{"current_steps": 688, "total_steps": 696, "loss": 0.3409, "lr": 4.02914340626226e-09, "epoch": 2.9612625538020088, "percentage": 98.85, "elapsed_time": "3:51:16", "remaining_time": "0:02:41"}
|
689 |
+
{"current_steps": 689, "total_steps": 696, "loss": 0.336, "lr": 3.0849100400587307e-09, "epoch": 2.9655667144906745, "percentage": 98.99, "elapsed_time": "3:51:34", "remaining_time": "0:02:21"}
|
690 |
+
{"current_steps": 690, "total_steps": 696, "loss": 0.3638, "lr": 2.2665263601240328e-09, "epoch": 2.96987087517934, "percentage": 99.14, "elapsed_time": "3:51:52", "remaining_time": "0:02:00"}
|
691 |
+
{"current_steps": 691, "total_steps": 696, "loss": 0.3601, "lr": 1.5740129778413215e-09, "epoch": 2.9741750358680057, "percentage": 99.28, "elapsed_time": "3:52:12", "remaining_time": "0:01:40"}
|
692 |
+
{"current_steps": 692, "total_steps": 696, "loss": 0.4064, "lr": 1.0073873344895735e-09, "epoch": 2.9784791965566715, "percentage": 99.43, "elapsed_time": "3:52:33", "remaining_time": "0:01:20"}
|
693 |
+
{"current_steps": 693, "total_steps": 696, "loss": 0.3881, "lr": 5.666637008061582e-10, "epoch": 2.9827833572453373, "percentage": 99.57, "elapsed_time": "3:52:52", "remaining_time": "0:01:00"}
|
694 |
+
{"current_steps": 694, "total_steps": 696, "loss": 0.358, "lr": 2.5185317662490547e-10, "epoch": 2.987087517934003, "percentage": 99.71, "elapsed_time": "3:53:12", "remaining_time": "0:00:40"}
|
695 |
+
{"current_steps": 695, "total_steps": 696, "loss": 0.3728, "lr": 6.296369059854978e-11, "epoch": 2.9913916786226684, "percentage": 99.86, "elapsed_time": "3:53:33", "remaining_time": "0:00:20"}
|
696 |
+
{"current_steps": 696, "total_steps": 696, "loss": 0.3634, "lr": 0.0, "epoch": 2.995695839311334, "percentage": 100.0, "elapsed_time": "3:53:51", "remaining_time": "0:00:00"}
|
697 |
+
{"current_steps": 696, "total_steps": 696, "epoch": 2.995695839311334, "percentage": 100.0, "elapsed_time": "3:54:44", "remaining_time": "0:00:00"}
|