Training in progress, step 236854
Browse files- model.safetensors +1 -1
- trainer_log.jsonl +26 -0
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1260367448
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69c547368365ab99e2bd66f9dc55956a0c2cca956e82d51236bb6e64fef15ef0
|
3 |
size 1260367448
|
trainer_log.jsonl
CHANGED
@@ -23661,3 +23661,29 @@
|
|
23661 |
{"current_steps": 236580, "total_steps": 236854, "loss": 0.0065, "lr": 4.0765828065447713e-11, "epoch": 1.9976779042029933, "percentage": 99.88, "elapsed_time": "1 day, 2:42:39", "remaining_time": "0:01:51"}
|
23662 |
{"current_steps": 236590, "total_steps": 236854, "loss": 0.0028, "lr": 3.7844523276264756e-11, "epoch": 1.9977623440501573, "percentage": 99.89, "elapsed_time": "1 day, 2:42:43", "remaining_time": "0:01:47"}
|
23663 |
{"current_steps": 236600, "total_steps": 236854, "loss": 0.0069, "lr": 3.503181664088473e-11, "epoch": 1.9978467838973213, "percentage": 99.89, "elapsed_time": "1 day, 2:42:47", "remaining_time": "0:01:43"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
23661 |
{"current_steps": 236580, "total_steps": 236854, "loss": 0.0065, "lr": 4.0765828065447713e-11, "epoch": 1.9976779042029933, "percentage": 99.88, "elapsed_time": "1 day, 2:42:39", "remaining_time": "0:01:51"}
|
23662 |
{"current_steps": 236590, "total_steps": 236854, "loss": 0.0028, "lr": 3.7844523276264756e-11, "epoch": 1.9977623440501573, "percentage": 99.89, "elapsed_time": "1 day, 2:42:43", "remaining_time": "0:01:47"}
|
23663 |
{"current_steps": 236600, "total_steps": 236854, "loss": 0.0069, "lr": 3.503181664088473e-11, "epoch": 1.9978467838973213, "percentage": 99.89, "elapsed_time": "1 day, 2:42:47", "remaining_time": "0:01:43"}
|
23664 |
+
{"current_steps": 236610, "total_steps": 236854, "loss": 0.0064, "lr": 3.23277082203699e-11, "epoch": 1.997931223744485, "percentage": 99.9, "elapsed_time": "1 day, 2:42:52", "remaining_time": "0:01:39"}
|
23665 |
+
{"current_steps": 236620, "total_steps": 236854, "loss": 0.0061, "lr": 2.973219807245187e-11, "epoch": 1.9980156635916488, "percentage": 99.9, "elapsed_time": "1 day, 2:42:55", "remaining_time": "0:01:35"}
|
23666 |
+
{"current_steps": 236630, "total_steps": 236854, "loss": 0.0071, "lr": 2.7245286254862223e-11, "epoch": 1.9981001034388126, "percentage": 99.91, "elapsed_time": "1 day, 2:42:59", "remaining_time": "0:01:31"}
|
23667 |
+
{"current_steps": 236640, "total_steps": 236854, "loss": 0.0061, "lr": 2.4866972820336566e-11, "epoch": 1.9981845432859766, "percentage": 99.91, "elapsed_time": "1 day, 2:43:03", "remaining_time": "0:01:26"}
|
23668 |
+
{"current_steps": 236650, "total_steps": 236854, "loss": 0.005, "lr": 2.2597257821610486e-11, "epoch": 1.9982689831331406, "percentage": 99.91, "elapsed_time": "1 day, 2:43:06", "remaining_time": "0:01:22"}
|
23669 |
+
{"current_steps": 236660, "total_steps": 236854, "loss": 0.0068, "lr": 2.0436141306978685e-11, "epoch": 1.9983534229803044, "percentage": 99.92, "elapsed_time": "1 day, 2:43:10", "remaining_time": "0:01:18"}
|
23670 |
+
{"current_steps": 236670, "total_steps": 236854, "loss": 0.0032, "lr": 1.8383623324180754e-11, "epoch": 1.9984378628274682, "percentage": 99.92, "elapsed_time": "1 day, 2:43:14", "remaining_time": "0:01:14"}
|
23671 |
+
{"current_steps": 236680, "total_steps": 236854, "loss": 0.0045, "lr": 1.6439703917625617e-11, "epoch": 1.9985223026746322, "percentage": 99.93, "elapsed_time": "1 day, 2:43:17", "remaining_time": "0:01:10"}
|
23672 |
+
{"current_steps": 236690, "total_steps": 236854, "loss": 0.0057, "lr": 1.460438312894663e-11, "epoch": 1.9986067425217962, "percentage": 99.93, "elapsed_time": "1 day, 2:43:21", "remaining_time": "0:01:06"}
|
23673 |
+
{"current_steps": 236700, "total_steps": 236854, "loss": 0.0058, "lr": 1.287766099866694e-11, "epoch": 1.99869118236896, "percentage": 99.93, "elapsed_time": "1 day, 2:43:25", "remaining_time": "0:01:02"}
|
23674 |
+
{"current_steps": 236710, "total_steps": 236854, "loss": 0.0053, "lr": 1.1259537563979018e-11, "epoch": 1.9987756222161237, "percentage": 99.94, "elapsed_time": "1 day, 2:43:29", "remaining_time": "0:00:58"}
|
23675 |
+
{"current_steps": 236720, "total_steps": 236854, "loss": 0.0027, "lr": 9.750012860409997e-12, "epoch": 1.9988600620632877, "percentage": 99.94, "elapsed_time": "1 day, 2:43:33", "remaining_time": "0:00:54"}
|
23676 |
+
{"current_steps": 236730, "total_steps": 236854, "loss": 0.005, "lr": 8.349086920711457e-12, "epoch": 1.9989445019104517, "percentage": 99.95, "elapsed_time": "1 day, 2:43:36", "remaining_time": "0:00:50"}
|
23677 |
+
{"current_steps": 236740, "total_steps": 236854, "loss": 0.0063, "lr": 7.056759774304312e-12, "epoch": 1.9990289417576155, "percentage": 99.95, "elapsed_time": "1 day, 2:43:39", "remaining_time": "0:00:46"}
|
23678 |
+
{"current_steps": 236750, "total_steps": 236854, "loss": 0.0073, "lr": 5.8730314506094674e-12, "epoch": 1.9991133816047792, "percentage": 99.96, "elapsed_time": "1 day, 2:43:43", "remaining_time": "0:00:42"}
|
23679 |
+
{"current_steps": 236760, "total_steps": 236854, "loss": 0.0039, "lr": 4.797901974606944e-12, "epoch": 1.999197821451943, "percentage": 99.96, "elapsed_time": "1 day, 2:43:46", "remaining_time": "0:00:38"}
|
23680 |
+
{"current_steps": 236770, "total_steps": 236854, "loss": 0.0081, "lr": 3.831371369611425e-12, "epoch": 1.999282261299107, "percentage": 99.96, "elapsed_time": "1 day, 2:43:50", "remaining_time": "0:00:34"}
|
23681 |
+
{"current_steps": 236780, "total_steps": 236854, "loss": 0.0038, "lr": 2.973439657272259e-12, "epoch": 1.999366701146271, "percentage": 99.97, "elapsed_time": "1 day, 2:43:53", "remaining_time": "0:00:30"}
|
23682 |
+
{"current_steps": 236790, "total_steps": 236854, "loss": 0.0057, "lr": 2.2241068553530142e-12, "epoch": 1.9994511409934348, "percentage": 99.97, "elapsed_time": "1 day, 2:43:56", "remaining_time": "0:00:26"}
|
23683 |
+
{"current_steps": 236800, "total_steps": 236854, "loss": 0.0095, "lr": 1.5833729805070364e-12, "epoch": 1.9995355808405986, "percentage": 99.98, "elapsed_time": "1 day, 2:44:00", "remaining_time": "0:00:21"}
|
23684 |
+
{"current_steps": 236810, "total_steps": 236854, "loss": 0.0093, "lr": 1.0512380471672246e-12, "epoch": 1.9996200206877626, "percentage": 99.98, "elapsed_time": "1 day, 2:44:04", "remaining_time": "0:00:17"}
|
23685 |
+
{"current_steps": 236820, "total_steps": 236854, "loss": 0.0033, "lr": 6.277020658806976e-13, "epoch": 1.9997044605349266, "percentage": 99.99, "elapsed_time": "1 day, 2:44:08", "remaining_time": "0:00:13"}
|
23686 |
+
{"current_steps": 236830, "total_steps": 236854, "loss": 0.0087, "lr": 3.127650466394627e-13, "epoch": 1.9997889003820903, "percentage": 99.99, "elapsed_time": "1 day, 2:44:12", "remaining_time": "0:00:09"}
|
23687 |
+
{"current_steps": 236840, "total_steps": 236854, "loss": 0.0053, "lr": 1.0642699554974656e-13, "epoch": 1.9998733402292541, "percentage": 99.99, "elapsed_time": "1 day, 2:44:15", "remaining_time": "0:00:05"}
|
23688 |
+
{"current_steps": 236850, "total_steps": 236854, "loss": 0.0069, "lr": 8.687918162664232e-15, "epoch": 1.9999577800764181, "percentage": 100.0, "elapsed_time": "1 day, 2:44:18", "remaining_time": "0:00:01"}
|
23689 |
+
{"current_steps": 236854, "total_steps": 236854, "epoch": 1.9999915560152837, "percentage": 100.0, "elapsed_time": "1 day, 2:44:27", "remaining_time": "0:00:00"}
|