tuanna08go committed on
Commit
619acd6
·
verified ·
1 Parent(s): 1a218a5

Training in progress, step 16, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:918b1cab71ebba90a428579a7564e639298e83e6761374483f49644704075e7f
3
  size 41581360
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2376eaccda4d880910e5930a99fa7a7b290c7cc289ccf3a0abde38ccebef511
3
  size 41581360
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2d5ef7870af310ef229829711dae4b6f79456d9e6f9e1492bbe28b604211baa4
3
  size 21505540
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71ea54e312f14bb4fd0b487cc196798a40bd997888fab2103109e536ce82603d
3
  size 21505540
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5e05343cded05c60740d6de4c4834260b4a342f6ca5ef008d7c59110070d517c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7df23e03f3c3533698e583560c479b817273cd5ed4163a9984c58ecc560a679c
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21e2b5d9560191cd8cd454fd2be1d438284aac8617273afc89cbf21659e669ae
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8eeea5c208aac12ca1d7588ccb40479c9754522c5504911db2e6c3df2af3627
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.7710843373493976,
5
  "eval_steps": 4,
6
- "global_step": 12,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -46,6 +46,14 @@
46
  "eval_samples_per_second": 32.006,
47
  "eval_steps_per_second": 4.268,
48
  "step": 12
 
 
 
 
 
 
 
 
49
  }
50
  ],
51
  "logging_steps": 10,
@@ -60,12 +68,12 @@
60
  "should_evaluate": false,
61
  "should_log": false,
62
  "should_save": true,
63
- "should_training_stop": false
64
  },
65
  "attributes": {}
66
  }
67
  },
68
- "total_flos": 9601868749602816.0,
69
  "train_batch_size": 8,
70
  "trial_name": null,
71
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.0602409638554218,
5
  "eval_steps": 4,
6
+ "global_step": 16,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
46
  "eval_samples_per_second": 32.006,
47
  "eval_steps_per_second": 4.268,
48
  "step": 12
49
+ },
50
+ {
51
+ "epoch": 1.0602409638554218,
52
+ "eval_loss": 1.1985491514205933,
53
+ "eval_runtime": 3.2919,
54
+ "eval_samples_per_second": 31.897,
55
+ "eval_steps_per_second": 4.253,
56
+ "step": 16
57
  }
58
  ],
59
  "logging_steps": 10,
 
68
  "should_evaluate": false,
69
  "should_log": false,
70
  "should_save": true,
71
+ "should_training_stop": true
72
  },
73
  "attributes": {}
74
  }
75
  },
76
+ "total_flos": 1.2802491666137088e+16,
77
  "train_batch_size": 8,
78
  "trial_name": null,
79
  "trial_params": null