Training in progress, epoch 83
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84847fb95014540053e95f581a7b42d0009b5bace46b87fb1556163ba03e63fd
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:871c0efa7ea9196a5c0aca96af832dd221e293d558aa23f342ca2eedcb3f2ac3
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61bc6ea99d8b695343d57c8eeb0d4cf358dcbaa67d6339cca6cc333058950f1b
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9bc8f95aaf7674ef8d1129a18c8e5f17c02f384e1a3f057457a0be0efdfc0121
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -472,3 +472,9 @@
|
|
472 |
{"current_steps": 3900, "total_steps": 4183, "loss": 0.0034, "lr": 5e-06, "epoch": 82.75862068965517, "percentage": 93.23, "elapsed_time": "1 day, 13:30:53", "remaining_time": "2:43:20"}
|
473 |
{"current_steps": 3910, "total_steps": 4183, "loss": 0.0034, "lr": 5e-06, "epoch": 82.9708222811671, "percentage": 93.47, "elapsed_time": "1 day, 13:36:14", "remaining_time": "2:37:31"}
|
474 |
{"current_steps": 3911, "total_steps": 4183, "eval_loss": 2.1120784282684326, "epoch": 82.9920424403183, "percentage": 93.5, "elapsed_time": "1 day, 13:37:27", "remaining_time": "2:37:00"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
472 |
{"current_steps": 3900, "total_steps": 4183, "loss": 0.0034, "lr": 5e-06, "epoch": 82.75862068965517, "percentage": 93.23, "elapsed_time": "1 day, 13:30:53", "remaining_time": "2:43:20"}
|
473 |
{"current_steps": 3910, "total_steps": 4183, "loss": 0.0034, "lr": 5e-06, "epoch": 82.9708222811671, "percentage": 93.47, "elapsed_time": "1 day, 13:36:14", "remaining_time": "2:37:31"}
|
474 |
{"current_steps": 3911, "total_steps": 4183, "eval_loss": 2.1120784282684326, "epoch": 82.9920424403183, "percentage": 93.5, "elapsed_time": "1 day, 13:37:27", "remaining_time": "2:37:00"}
|
475 |
+
{"current_steps": 3920, "total_steps": 4183, "loss": 0.0032, "lr": 5e-06, "epoch": 83.18302387267904, "percentage": 93.71, "elapsed_time": "1 day, 13:43:29", "remaining_time": "2:31:51"}
|
476 |
+
{"current_steps": 3930, "total_steps": 4183, "loss": 0.0034, "lr": 5e-06, "epoch": 83.39522546419099, "percentage": 93.95, "elapsed_time": "1 day, 13:48:48", "remaining_time": "2:26:03"}
|
477 |
+
{"current_steps": 3940, "total_steps": 4183, "loss": 0.0033, "lr": 5e-06, "epoch": 83.60742705570291, "percentage": 94.19, "elapsed_time": "1 day, 13:54:08", "remaining_time": "2:20:15"}
|
478 |
+
{"current_steps": 3950, "total_steps": 4183, "loss": 0.0033, "lr": 5e-06, "epoch": 83.81962864721486, "percentage": 94.43, "elapsed_time": "1 day, 13:59:28", "remaining_time": "2:14:27"}
|
479 |
+
{"current_steps": 3958, "total_steps": 4183, "eval_loss": 2.0832369327545166, "epoch": 83.9893899204244, "percentage": 94.62, "elapsed_time": "1 day, 14:04:28", "remaining_time": "2:09:51"}
|
480 |
+
{"current_steps": 3960, "total_steps": 4183, "loss": 0.0035, "lr": 5e-06, "epoch": 84.03183023872678, "percentage": 94.67, "elapsed_time": "1 day, 14:06:49", "remaining_time": "2:08:46"}
|