prosecalign
/

phi3m0128-cds-0.5-kendall-onof-ofif-corr-max-2-simpo-max1500-default

Transformers

Safetensors

Generated from Trainer

llama-factory

Model card Files Files and versions Community

ziansu committed on Jan 31

Commit

14c15b6

verified ·

1 Parent(s): ef73d08

Training in progress, step 1350

Browse files

Files changed (2) hide show

adapter_model.safetensors +1 -1
trainer_log.jsonl +6 -0

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9b2c668e4517cc458ef314c0afc30551e48c3e398573caa7706e25ed810c2beb
 size 25200088

 version https://git-lfs.github.com/spec/v1
+oid sha256:347ee966d6ee1e2a39042a2d03d2c638cb1f113d7e076ea73733f5062a849630
 size 25200088

trainer_log.jsonl CHANGED Viewed

@@ -154,3 +154,9 @@
 {"current_steps": 1290, "total_steps": 1500, "loss": 0.2538, "accuracy": 0.9624999761581421, "learning_rate": 2.3793236883495164e-07, "epoch": 1.375266524520256, "percentage": 86.0, "elapsed_time": "2:55:27", "remaining_time": "0:28:33", "throughput": "0.00", "total_tokens": 0}
 {"current_steps": 1300, "total_steps": 1500, "loss": 0.2363, "accuracy": 0.949999988079071, "learning_rate": 2.1613635589349756e-07, "epoch": 1.3859275053304905, "percentage": 86.67, "elapsed_time": "2:56:43", "remaining_time": "0:27:11", "throughput": "0.00", "total_tokens": 0}
 {"current_steps": 1300, "total_steps": 1500, "eval_loss": 0.2328612357378006, "epoch": 1.3859275053304905, "percentage": 86.67, "elapsed_time": "2:57:04", "remaining_time": "0:27:14", "throughput": "0.00", "total_tokens": 0}

 {"current_steps": 1290, "total_steps": 1500, "loss": 0.2538, "accuracy": 0.9624999761581421, "learning_rate": 2.3793236883495164e-07, "epoch": 1.375266524520256, "percentage": 86.0, "elapsed_time": "2:55:27", "remaining_time": "0:28:33", "throughput": "0.00", "total_tokens": 0}
 {"current_steps": 1300, "total_steps": 1500, "loss": 0.2363, "accuracy": 0.949999988079071, "learning_rate": 2.1613635589349756e-07, "epoch": 1.3859275053304905, "percentage": 86.67, "elapsed_time": "2:56:43", "remaining_time": "0:27:11", "throughput": "0.00", "total_tokens": 0}
 {"current_steps": 1300, "total_steps": 1500, "eval_loss": 0.2328612357378006, "epoch": 1.3859275053304905, "percentage": 86.67, "elapsed_time": "2:57:04", "remaining_time": "0:27:14", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1310, "total_steps": 1500, "loss": 0.2443, "accuracy": 0.862500011920929, "learning_rate": 1.95342121028749e-07, "epoch": 1.396588486140725, "percentage": 87.33, "elapsed_time": "2:58:24", "remaining_time": "0:25:52", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1320, "total_steps": 1500, "loss": 0.1976, "accuracy": 0.949999988079071, "learning_rate": 1.7555878527937164e-07, "epoch": 1.4072494669509594, "percentage": 88.0, "elapsed_time": "2:59:37", "remaining_time": "0:24:29", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1330, "total_steps": 1500, "loss": 0.2462, "accuracy": 0.949999988079071, "learning_rate": 1.567950262702714e-07, "epoch": 1.417910447761194, "percentage": 88.67, "elapsed_time": "3:00:51", "remaining_time": "0:23:07", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1340, "total_steps": 1500, "loss": 0.2305, "accuracy": 0.8999999761581421, "learning_rate": 1.3905907440629752e-07, "epoch": 1.4285714285714286, "percentage": 89.33, "elapsed_time": "3:02:04", "remaining_time": "0:21:44", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1350, "total_steps": 1500, "loss": 0.2559, "accuracy": 0.887499988079071, "learning_rate": 1.223587092621162e-07, "epoch": 1.439232409381663, "percentage": 90.0, "elapsed_time": "3:03:24", "remaining_time": "0:20:22", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1350, "total_steps": 1500, "eval_loss": 0.2323991060256958, "epoch": 1.439232409381663, "percentage": 90.0, "elapsed_time": "3:03:45", "remaining_time": "0:20:25", "throughput": "0.00", "total_tokens": 0}