Training in progress, epoch 73
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e8b20eed09adcdc4d206f016a96b023ba2b86cd0b9b00acc9f1d1bda3ff9d60
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08433f4401ac84bf3b6e57ddeed334395c9ff6c9714fe7346cba053d194a0add
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cec2ad74ab0fc97b474753fce50ded6922323fef44eb1b1d1aa13e49d2147b88
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22c4430dce037f9a378f74aab81da62ced2686bb5f78df372ce2d870c2c3ce22
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -415,3 +415,9 @@
|
|
415 |
{"current_steps": 3430, "total_steps": 4183, "loss": 0.0036, "lr": 5e-06, "epoch": 72.78514588859416, "percentage": 82.0, "elapsed_time": "1 day, 8:57:18", "remaining_time": "7:14:05"}
|
416 |
{"current_steps": 3440, "total_steps": 4183, "loss": 0.0036, "lr": 5e-06, "epoch": 72.9973474801061, "percentage": 82.24, "elapsed_time": "1 day, 9:02:37", "remaining_time": "7:08:13"}
|
417 |
{"current_steps": 3440, "total_steps": 4183, "eval_loss": 2.140444278717041, "epoch": 72.9973474801061, "percentage": 82.24, "elapsed_time": "1 day, 9:03:12", "remaining_time": "7:08:20"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
415 |
{"current_steps": 3430, "total_steps": 4183, "loss": 0.0036, "lr": 5e-06, "epoch": 72.78514588859416, "percentage": 82.0, "elapsed_time": "1 day, 8:57:18", "remaining_time": "7:14:05"}
|
416 |
{"current_steps": 3440, "total_steps": 4183, "loss": 0.0036, "lr": 5e-06, "epoch": 72.9973474801061, "percentage": 82.24, "elapsed_time": "1 day, 9:02:37", "remaining_time": "7:08:13"}
|
417 |
{"current_steps": 3440, "total_steps": 4183, "eval_loss": 2.140444278717041, "epoch": 72.9973474801061, "percentage": 82.24, "elapsed_time": "1 day, 9:03:12", "remaining_time": "7:08:20"}
|
418 |
+
{"current_steps": 3450, "total_steps": 4183, "loss": 0.0035, "lr": 5e-06, "epoch": 73.20954907161804, "percentage": 82.48, "elapsed_time": "1 day, 9:09:48", "remaining_time": "7:02:45"}
|
419 |
+
{"current_steps": 3460, "total_steps": 4183, "loss": 0.0037, "lr": 5e-06, "epoch": 73.42175066312997, "percentage": 82.72, "elapsed_time": "1 day, 9:15:07", "remaining_time": "6:56:53"}
|
420 |
+
{"current_steps": 3470, "total_steps": 4183, "loss": 0.0035, "lr": 5e-06, "epoch": 73.63395225464191, "percentage": 82.95, "elapsed_time": "1 day, 9:20:26", "remaining_time": "6:51:02"}
|
421 |
+
{"current_steps": 3480, "total_steps": 4183, "loss": 0.0036, "lr": 5e-06, "epoch": 73.84615384615384, "percentage": 83.19, "elapsed_time": "1 day, 9:25:45", "remaining_time": "6:45:11"}
|
422 |
+
{"current_steps": 3487, "total_steps": 4183, "eval_loss": 2.0650992393493652, "epoch": 73.9946949602122, "percentage": 83.36, "elapsed_time": "1 day, 9:30:06", "remaining_time": "6:41:12"}
|
423 |
+
{"current_steps": 3490, "total_steps": 4183, "loss": 0.0035, "lr": 5e-06, "epoch": 74.05835543766578, "percentage": 83.43, "elapsed_time": "1 day, 9:32:59", "remaining_time": "6:39:42"}
|