Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ab5a5a19d615d9dc236ab67bc14e9d16ee7b2b1bb7ff420fec62c4bce5b93a7
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b5db5d532ad2f260aa22d89047c1ed1ab95e83c27719ebc310801554ed905f3
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c701987f23639c8ecc334adcb1c1b49bf25dc8eb2944e73598cff99e08e1f267
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a9f2a284a7ad966274091ad834ea17c595bf8ef901c609787cb06b2ce198c9b
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -42,3 +42,20 @@
|
|
42 |
{"current_steps": 42, "total_steps": 60, "loss": 0.7906, "lr": 2.5000000000000015e-06, "epoch": 2.048780487804878, "percentage": 70.0, "elapsed_time": "0:38:14", "remaining_time": "0:16:23"}
|
43 |
{"current_steps": 43, "total_steps": 60, "loss": 0.7495, "lr": 2.2524551096459703e-06, "epoch": 2.097560975609756, "percentage": 71.67, "elapsed_time": "0:39:04", "remaining_time": "0:15:26"}
|
44 |
{"current_steps": 44, "total_steps": 60, "loss": 0.7846, "lr": 2.0142070414860704e-06, "epoch": 2.1463414634146343, "percentage": 73.33, "elapsed_time": "0:39:53", "remaining_time": "0:14:30"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
42 |
{"current_steps": 42, "total_steps": 60, "loss": 0.7906, "lr": 2.5000000000000015e-06, "epoch": 2.048780487804878, "percentage": 70.0, "elapsed_time": "0:38:14", "remaining_time": "0:16:23"}
|
43 |
{"current_steps": 43, "total_steps": 60, "loss": 0.7495, "lr": 2.2524551096459703e-06, "epoch": 2.097560975609756, "percentage": 71.67, "elapsed_time": "0:39:04", "remaining_time": "0:15:26"}
|
44 |
{"current_steps": 44, "total_steps": 60, "loss": 0.7846, "lr": 2.0142070414860704e-06, "epoch": 2.1463414634146343, "percentage": 73.33, "elapsed_time": "0:39:53", "remaining_time": "0:14:30"}
|
45 |
+
{"current_steps": 45, "total_steps": 60, "loss": 0.7664, "lr": 1.7860619515673034e-06, "epoch": 2.1951219512195124, "percentage": 75.0, "elapsed_time": "0:40:38", "remaining_time": "0:13:32"}
|
46 |
+
{"current_steps": 46, "total_steps": 60, "loss": 0.7178, "lr": 1.5687918106563326e-06, "epoch": 2.2439024390243905, "percentage": 76.67, "elapsed_time": "0:41:30", "remaining_time": "0:12:38"}
|
47 |
+
{"current_steps": 47, "total_steps": 60, "loss": 0.7867, "lr": 1.3631317921347564e-06, "epoch": 2.292682926829268, "percentage": 78.33, "elapsed_time": "0:42:29", "remaining_time": "0:11:45"}
|
48 |
+
{"current_steps": 48, "total_steps": 60, "loss": 0.7419, "lr": 1.1697777844051105e-06, "epoch": 2.341463414634146, "percentage": 80.0, "elapsed_time": "0:43:29", "remaining_time": "0:10:52"}
|
49 |
+
{"current_steps": 49, "total_steps": 60, "loss": 0.7224, "lr": 9.893840362247809e-07, "epoch": 2.3902439024390243, "percentage": 81.67, "elapsed_time": "0:44:20", "remaining_time": "0:09:57"}
|
50 |
+
{"current_steps": 50, "total_steps": 60, "loss": 0.7914, "lr": 8.225609429353187e-07, "epoch": 2.4390243902439024, "percentage": 83.33, "elapsed_time": "0:45:11", "remaining_time": "0:09:02"}
|
51 |
+
{"current_steps": 51, "total_steps": 60, "loss": 0.7448, "lr": 6.698729810778065e-07, "epoch": 2.4878048780487805, "percentage": 85.0, "elapsed_time": "0:45:56", "remaining_time": "0:08:06"}
|
52 |
+
{"current_steps": 52, "total_steps": 60, "loss": 0.7486, "lr": 5.318367983829393e-07, "epoch": 2.5365853658536586, "percentage": 86.67, "elapsed_time": "0:46:50", "remaining_time": "0:07:12"}
|
53 |
+
{"current_steps": 53, "total_steps": 60, "loss": 0.7421, "lr": 4.089194655986306e-07, "epoch": 2.5853658536585367, "percentage": 88.33, "elapsed_time": "0:47:33", "remaining_time": "0:06:16"}
|
54 |
+
{"current_steps": 54, "total_steps": 60, "loss": 0.8132, "lr": 3.015368960704584e-07, "epoch": 2.6341463414634148, "percentage": 90.0, "elapsed_time": "0:48:29", "remaining_time": "0:05:23"}
|
55 |
+
{"current_steps": 55, "total_steps": 60, "loss": 0.7491, "lr": 2.1005243842255552e-07, "epoch": 2.682926829268293, "percentage": 91.67, "elapsed_time": "0:49:24", "remaining_time": "0:04:29"}
|
56 |
+
{"current_steps": 56, "total_steps": 60, "loss": 0.7919, "lr": 1.3477564710088097e-07, "epoch": 2.7317073170731705, "percentage": 93.33, "elapsed_time": "0:50:30", "remaining_time": "0:03:36"}
|
57 |
+
{"current_steps": 57, "total_steps": 60, "loss": 0.7485, "lr": 7.59612349389599e-08, "epoch": 2.7804878048780486, "percentage": 95.0, "elapsed_time": "0:51:24", "remaining_time": "0:02:42"}
|
58 |
+
{"current_steps": 58, "total_steps": 60, "loss": 0.734, "lr": 3.3808211290284886e-08, "epoch": 2.8292682926829267, "percentage": 96.67, "elapsed_time": "0:52:17", "remaining_time": "0:01:48"}
|
59 |
+
{"current_steps": 59, "total_steps": 60, "loss": 0.7751, "lr": 8.459208643659122e-09, "epoch": 2.8780487804878048, "percentage": 98.33, "elapsed_time": "0:53:02", "remaining_time": "0:00:53"}
|
60 |
+
{"current_steps": 60, "total_steps": 60, "loss": 0.7135, "lr": 0.0, "epoch": 2.926829268292683, "percentage": 100.0, "elapsed_time": "0:53:43", "remaining_time": "0:00:00"}
|
61 |
+
{"current_steps": 60, "total_steps": 60, "epoch": 2.926829268292683, "percentage": 100.0, "elapsed_time": "0:55:52", "remaining_time": "0:00:00"}
|