Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3102b5a01fd87c966a244fe6073c0c893f922763205b49a25654b8e92649d703
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2c8215ff60c35e87335338fdda5ba83096de631e1ebc3a5f789549a266d8908
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58848a8f1d1cb5dbfe21e4ae4b9ad0e9c8efef18a41dd483f1f60c13e8954324
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b886b263cb0adbe4013f3e9074e22689182c2925a8ed127f0339d5f5a9e18675
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -21,3 +21,24 @@
|
|
21 |
{"current_steps": 21, "total_steps": 60, "loss": 1.1651, "lr": 8.213938048432697e-06, "epoch": 1.024390243902439, "percentage": 35.0, "elapsed_time": "0:19:07", "remaining_time": "0:35:30"}
|
22 |
{"current_steps": 22, "total_steps": 60, "loss": 0.7399, "lr": 7.985792958513932e-06, "epoch": 1.0731707317073171, "percentage": 36.67, "elapsed_time": "0:20:02", "remaining_time": "0:34:36"}
|
23 |
{"current_steps": 23, "total_steps": 60, "loss": 0.8688, "lr": 7.747544890354031e-06, "epoch": 1.1219512195121952, "percentage": 38.33, "elapsed_time": "0:20:57", "remaining_time": "0:33:43"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
21 |
{"current_steps": 21, "total_steps": 60, "loss": 1.1651, "lr": 8.213938048432697e-06, "epoch": 1.024390243902439, "percentage": 35.0, "elapsed_time": "0:19:07", "remaining_time": "0:35:30"}
|
22 |
{"current_steps": 22, "total_steps": 60, "loss": 0.7399, "lr": 7.985792958513932e-06, "epoch": 1.0731707317073171, "percentage": 36.67, "elapsed_time": "0:20:02", "remaining_time": "0:34:36"}
|
23 |
{"current_steps": 23, "total_steps": 60, "loss": 0.8688, "lr": 7.747544890354031e-06, "epoch": 1.1219512195121952, "percentage": 38.33, "elapsed_time": "0:20:57", "remaining_time": "0:33:43"}
|
24 |
+
{"current_steps": 24, "total_steps": 60, "loss": 0.7049, "lr": 7.500000000000001e-06, "epoch": 1.170731707317073, "percentage": 40.0, "elapsed_time": "0:21:44", "remaining_time": "0:32:36"}
|
25 |
+
{"current_steps": 25, "total_steps": 60, "loss": 0.92, "lr": 7.243995901002312e-06, "epoch": 1.2195121951219512, "percentage": 41.67, "elapsed_time": "0:22:48", "remaining_time": "0:31:55"}
|
26 |
+
{"current_steps": 26, "total_steps": 60, "loss": 0.6655, "lr": 6.980398830195785e-06, "epoch": 1.2682926829268293, "percentage": 43.33, "elapsed_time": "0:23:30", "remaining_time": "0:30:44"}
|
27 |
+
{"current_steps": 27, "total_steps": 60, "loss": 0.7905, "lr": 6.710100716628345e-06, "epoch": 1.3170731707317074, "percentage": 45.0, "elapsed_time": "0:24:15", "remaining_time": "0:29:39"}
|
28 |
+
{"current_steps": 28, "total_steps": 60, "loss": 0.8514, "lr": 6.434016163555452e-06, "epoch": 1.3658536585365852, "percentage": 46.67, "elapsed_time": "0:25:09", "remaining_time": "0:28:45"}
|
29 |
+
{"current_steps": 29, "total_steps": 60, "loss": 0.88, "lr": 6.153079353712201e-06, "epoch": 1.4146341463414633, "percentage": 48.33, "elapsed_time": "0:26:02", "remaining_time": "0:27:50"}
|
30 |
+
{"current_steps": 30, "total_steps": 60, "loss": 0.6719, "lr": 5.8682408883346535e-06, "epoch": 1.4634146341463414, "percentage": 50.0, "elapsed_time": "0:26:47", "remaining_time": "0:26:47"}
|
31 |
+
{"current_steps": 31, "total_steps": 60, "loss": 0.9152, "lr": 5.5804645706261515e-06, "epoch": 1.5121951219512195, "percentage": 51.67, "elapsed_time": "0:27:42", "remaining_time": "0:25:54"}
|
32 |
+
{"current_steps": 32, "total_steps": 60, "loss": 0.6975, "lr": 5.290724144552379e-06, "epoch": 1.5609756097560976, "percentage": 53.33, "elapsed_time": "0:28:25", "remaining_time": "0:24:52"}
|
33 |
+
{"current_steps": 33, "total_steps": 60, "loss": 0.8428, "lr": 5e-06, "epoch": 1.6097560975609757, "percentage": 55.0, "elapsed_time": "0:29:19", "remaining_time": "0:23:59"}
|
34 |
+
{"current_steps": 34, "total_steps": 60, "loss": 0.7701, "lr": 4.7092758554476215e-06, "epoch": 1.6585365853658538, "percentage": 56.67, "elapsed_time": "0:30:07", "remaining_time": "0:23:02"}
|
35 |
+
{"current_steps": 35, "total_steps": 60, "loss": 0.684, "lr": 4.4195354293738484e-06, "epoch": 1.7073170731707317, "percentage": 58.33, "elapsed_time": "0:30:57", "remaining_time": "0:22:06"}
|
36 |
+
{"current_steps": 36, "total_steps": 60, "loss": 0.811, "lr": 4.131759111665349e-06, "epoch": 1.7560975609756098, "percentage": 60.0, "elapsed_time": "0:31:44", "remaining_time": "0:21:09"}
|
37 |
+
{"current_steps": 37, "total_steps": 60, "loss": 0.8534, "lr": 3.8469206462878e-06, "epoch": 1.8048780487804879, "percentage": 61.67, "elapsed_time": "0:32:34", "remaining_time": "0:20:14"}
|
38 |
+
{"current_steps": 38, "total_steps": 60, "loss": 0.7364, "lr": 3.5659838364445505e-06, "epoch": 1.8536585365853657, "percentage": 63.33, "elapsed_time": "0:33:27", "remaining_time": "0:19:22"}
|
39 |
+
{"current_steps": 39, "total_steps": 60, "loss": 0.7937, "lr": 3.289899283371657e-06, "epoch": 1.9024390243902438, "percentage": 65.0, "elapsed_time": "0:34:19", "remaining_time": "0:18:29"}
|
40 |
+
{"current_steps": 40, "total_steps": 60, "loss": 0.7559, "lr": 3.019601169804216e-06, "epoch": 1.951219512195122, "percentage": 66.67, "elapsed_time": "0:35:16", "remaining_time": "0:17:38"}
|
41 |
+
{"current_steps": 41, "total_steps": 60, "loss": 1.254, "lr": 2.7560040989976894e-06, "epoch": 2.0, "percentage": 68.33, "elapsed_time": "0:36:08", "remaining_time": "0:16:45"}
|
42 |
+
{"current_steps": 42, "total_steps": 60, "loss": 0.7906, "lr": 2.5000000000000015e-06, "epoch": 2.048780487804878, "percentage": 70.0, "elapsed_time": "0:38:14", "remaining_time": "0:16:23"}
|
43 |
+
{"current_steps": 43, "total_steps": 60, "loss": 0.7495, "lr": 2.2524551096459703e-06, "epoch": 2.097560975609756, "percentage": 71.67, "elapsed_time": "0:39:04", "remaining_time": "0:15:26"}
|
44 |
+
{"current_steps": 44, "total_steps": 60, "loss": 0.7846, "lr": 2.0142070414860704e-06, "epoch": 2.1463414634146343, "percentage": 73.33, "elapsed_time": "0:39:53", "remaining_time": "0:14:30"}
|