Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78fd94ad3968700809ca0e962ef45325ebb374cf76999877fcf72fc99231789f
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a28c7b7aa51e100c8798ccb28a9aa3fe9af3829bd52ed19bab34bb353f4c0cd
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:366f6f0412276de2cba9064f23c048c520697b19c3f7b80ea2b08d1b9f51db33
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ef2051c3e4487831ff26c72af7cb550d3ac2433d172fcefc1845b6236bd64e8
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -5,3 +5,10 @@
|
|
5 |
{"current_steps": 50, "total_steps": 177, "loss": 0.7147, "lr": 5e-06, "epoch": 0.8385744234800838, "percentage": 28.25, "elapsed_time": "0:48:07", "remaining_time": "2:02:15"}
|
6 |
{"current_steps": 59, "total_steps": 177, "eval_loss": 0.6969855427742004, "epoch": 0.989517819706499, "percentage": 33.33, "elapsed_time": "0:58:20", "remaining_time": "1:56:41"}
|
7 |
{"current_steps": 60, "total_steps": 177, "loss": 0.7324, "lr": 5e-06, "epoch": 1.0083857442348008, "percentage": 33.9, "elapsed_time": "1:00:02", "remaining_time": "1:57:04"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
5 |
{"current_steps": 50, "total_steps": 177, "loss": 0.7147, "lr": 5e-06, "epoch": 0.8385744234800838, "percentage": 28.25, "elapsed_time": "0:48:07", "remaining_time": "2:02:15"}
|
6 |
{"current_steps": 59, "total_steps": 177, "eval_loss": 0.6969855427742004, "epoch": 0.989517819706499, "percentage": 33.33, "elapsed_time": "0:58:20", "remaining_time": "1:56:41"}
|
7 |
{"current_steps": 60, "total_steps": 177, "loss": 0.7324, "lr": 5e-06, "epoch": 1.0083857442348008, "percentage": 33.9, "elapsed_time": "1:00:02", "remaining_time": "1:57:04"}
|
8 |
+
{"current_steps": 70, "total_steps": 177, "loss": 0.6726, "lr": 5e-06, "epoch": 1.1761006289308176, "percentage": 39.55, "elapsed_time": "1:09:40", "remaining_time": "1:46:30"}
|
9 |
+
{"current_steps": 80, "total_steps": 177, "loss": 0.6595, "lr": 5e-06, "epoch": 1.3438155136268344, "percentage": 45.2, "elapsed_time": "1:19:18", "remaining_time": "1:36:09"}
|
10 |
+
{"current_steps": 90, "total_steps": 177, "loss": 0.6558, "lr": 5e-06, "epoch": 1.5115303983228512, "percentage": 50.85, "elapsed_time": "1:28:54", "remaining_time": "1:25:56"}
|
11 |
+
{"current_steps": 100, "total_steps": 177, "loss": 0.6525, "lr": 5e-06, "epoch": 1.6792452830188678, "percentage": 56.5, "elapsed_time": "1:38:31", "remaining_time": "1:15:51"}
|
12 |
+
{"current_steps": 110, "total_steps": 177, "loss": 0.6543, "lr": 5e-06, "epoch": 1.8469601677148848, "percentage": 62.15, "elapsed_time": "1:48:08", "remaining_time": "1:05:52"}
|
13 |
+
{"current_steps": 119, "total_steps": 177, "eval_loss": 0.6759442090988159, "epoch": 1.9979035639412999, "percentage": 67.23, "elapsed_time": "1:57:51", "remaining_time": "0:57:26"}
|
14 |
+
{"current_steps": 120, "total_steps": 177, "loss": 0.6821, "lr": 5e-06, "epoch": 2.0167714884696015, "percentage": 67.8, "elapsed_time": "2:00:03", "remaining_time": "0:57:01"}
|