tttx
/

ttt-problem10-32b-021025-sl25000

alignment-handbook

Generated from Trainer

Model card | Files and versions | Community

aadityap committed on Feb 11

Commit

83cf367

·

verified ·

1 Parent(s): fdaa848

Model save

Files changed (3) hide show

README.md +1 -6
all_results.json +6 -6
train_results.json +6 -6

README.md CHANGED Viewed

@@ -3,14 +3,9 @@ library_name: peft
 license: mit
 base_model: deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
 tags:
-- alignment-handbook
 - trl
 - sft
 - generated_from_trainer
-datasets:
-- tttx/star-run-step1-master
-- tttx/ttt-problem-10-continue-step1-master
-- tttx/ttt-problem-10-continue-step2-master
 model-index:
 - name: ttt-problem10-32b-021025-sl25000
   results: []
@@ -21,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
 # ttt-problem10-32b-021025-sl25000
-This model is a fine-tuned version of [tttx/sft-32b-020925-19k-5ep](https://huggingface.co/tttx/sft-32b-020925-19k-5ep) on the tttx/star-run-step1-master, the tttx/ttt-problem-10-continue-step1-master and the tttx/ttt-problem-10-continue-step2-master datasets.
 ## Model description

 license: mit
 base_model: deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
 tags:
 - trl
 - sft
 - generated_from_trainer
 model-index:
 - name: ttt-problem10-32b-021025-sl25000
   results: []
 # ttt-problem10-32b-021025-sl25000
+This model is a fine-tuned version of [deepseek-ai/DeepSeek-R1-Distill-Qwen-32B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B) on an unknown dataset.
 ## Model description

all_results.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
     "epoch": 2.0,
-    "total_flos": 1704342039035904.0,
-    "train_loss": 0.08834147482282585,
-    "train_runtime": 2715.1649,
-    "train_samples": 715,
-    "train_samples_per_second": 0.527,
-    "train_steps_per_second": 0.033
 }

 {
     "epoch": 2.0,
+    "total_flos": 490074470875136.0,
+    "train_loss": 0.058849748490112166,
+    "train_runtime": 478.1215,
+    "train_samples": 216,
+    "train_samples_per_second": 0.904,
+    "train_steps_per_second": 0.059
 }

train_results.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
     "epoch": 2.0,
-    "total_flos": 1704342039035904.0,
-    "train_loss": 0.08834147482282585,
-    "train_runtime": 2715.1649,
-    "train_samples": 715,
-    "train_samples_per_second": 0.527,
-    "train_steps_per_second": 0.033
 }

 {
     "epoch": 2.0,
+    "total_flos": 490074470875136.0,
+    "train_loss": 0.058849748490112166,
+    "train_runtime": 478.1215,
+    "train_samples": 216,
+    "train_samples_per_second": 0.904,
+    "train_steps_per_second": 0.059
 }