umairrkhn committed on
Commit
db0eb22
·
verified ·
1 Parent(s): 1841026

End of training

Browse files
Files changed (5) hide show
  1. README.md +3 -3
  2. all_results.json +11 -11
  3. eval_results.json +6 -6
  4. train_results.json +6 -6
  5. trainer_state.json +30 -78
README.md CHANGED
@@ -23,7 +23,7 @@ model-index:
23
  metrics:
24
  - name: Accuracy
25
  type: accuracy
26
- value: 1.0
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -33,8 +33,8 @@ should probably proofread and complete it, then remove this comment. -->
33
 
34
  This model is a fine-tuned version of [Marqo/nsfw-image-detection-384](https://huggingface.co/Marqo/nsfw-image-detection-384) on the imagefolder dataset.
35
  It achieves the following results on the evaluation set:
36
- - Loss: 0.0003
37
- - Accuracy: 1.0
38
 
39
  ## Model description
40
 
 
23
  metrics:
24
  - name: Accuracy
25
  type: accuracy
26
+ value: 0.999
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
33
 
34
  This model is a fine-tuned version of [Marqo/nsfw-image-detection-384](https://huggingface.co/Marqo/nsfw-image-detection-384) on the imagefolder dataset.
35
  It achieves the following results on the evaluation set:
36
+ - Loss: 0.0041
37
+ - Accuracy: 0.999
38
 
39
  ## Model description
40
 
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_accuracy": 0.996,
4
- "eval_loss": 0.0253806933760643,
5
- "eval_runtime": 28.4966,
6
- "eval_samples_per_second": 35.092,
7
- "eval_steps_per_second": 4.386,
8
- "total_flos": 7.036273897136456e+17,
9
- "train_loss": 0.009760016079127729,
10
- "train_runtime": 1762.5795,
11
- "train_samples_per_second": 26.869,
12
- "train_steps_per_second": 1.68
13
  }
 
1
  {
2
+ "epoch": 1.5005065856129685,
3
+ "eval_accuracy": 0.999,
4
+ "eval_loss": 0.004140933509916067,
5
+ "eval_runtime": 28.4475,
6
+ "eval_samples_per_second": 35.152,
7
+ "eval_steps_per_second": 2.215,
8
+ "total_flos": 3.5197712872833024e+17,
9
+ "train_loss": 0.002488548292009352,
10
+ "train_runtime": 874.5228,
11
+ "train_samples_per_second": 27.076,
12
+ "train_steps_per_second": 1.693
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_accuracy": 0.996,
4
- "eval_loss": 0.0253806933760643,
5
- "eval_runtime": 28.4966,
6
- "eval_samples_per_second": 35.092,
7
- "eval_steps_per_second": 4.386
8
  }
 
1
  {
2
+ "epoch": 1.5005065856129685,
3
+ "eval_accuracy": 0.999,
4
+ "eval_loss": 0.004140933509916067,
5
+ "eval_runtime": 28.4475,
6
+ "eval_samples_per_second": 35.152,
7
+ "eval_steps_per_second": 2.215
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "total_flos": 7.036273897136456e+17,
4
- "train_loss": 0.009760016079127729,
5
- "train_runtime": 1762.5795,
6
- "train_samples_per_second": 26.869,
7
- "train_steps_per_second": 1.68
8
  }
 
1
  {
2
+ "epoch": 1.5005065856129685,
3
+ "total_flos": 3.5197712872833024e+17,
4
+ "train_loss": 0.002488548292009352,
5
+ "train_runtime": 874.5228,
6
+ "train_samples_per_second": 27.076,
7
+ "train_steps_per_second": 1.693
8
  }
trainer_state.json CHANGED
@@ -1,108 +1,60 @@
1
  {
2
- "best_metric": 1.5119968338694889e-05,
3
- "best_model_checkpoint": "./nsfw-fine-tuned-timm/checkpoint-2000",
4
- "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 2961,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.5065856129685917,
13
- "grad_norm": 0.025366274639964104,
14
- "learning_rate": 4.1556906450523474e-05,
15
- "loss": 0.0375,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.5065856129685917,
20
- "eval_accuracy": 0.998,
21
- "eval_loss": 0.0066848029382526875,
22
- "eval_runtime": 27.7412,
23
- "eval_samples_per_second": 36.047,
24
- "eval_steps_per_second": 4.506,
25
  "step": 500
26
  },
27
  {
28
  "epoch": 1.0131712259371835,
29
- "grad_norm": 0.008881847374141216,
30
- "learning_rate": 3.3113812901046945e-05,
31
- "loss": 0.0138,
32
  "step": 1000
33
  },
34
  {
35
  "epoch": 1.0131712259371835,
36
  "eval_accuracy": 1.0,
37
- "eval_loss": 0.00014481571270152926,
38
- "eval_runtime": 27.3526,
39
- "eval_samples_per_second": 36.56,
40
- "eval_steps_per_second": 4.57,
41
  "step": 1000
42
  },
43
  {
44
- "epoch": 1.5197568389057752,
45
- "grad_norm": 0.004049438983201981,
46
- "learning_rate": 2.4670719351570416e-05,
47
- "loss": 0.0028,
48
- "step": 1500
49
- },
50
- {
51
- "epoch": 1.5197568389057752,
52
- "eval_accuracy": 1.0,
53
- "eval_loss": 9.533474803902209e-05,
54
- "eval_runtime": 27.4005,
55
- "eval_samples_per_second": 36.496,
56
- "eval_steps_per_second": 4.562,
57
- "step": 1500
58
- },
59
- {
60
- "epoch": 2.026342451874367,
61
- "grad_norm": 0.0020459946244955063,
62
- "learning_rate": 1.6227625802093887e-05,
63
- "loss": 0.002,
64
- "step": 2000
65
- },
66
- {
67
- "epoch": 2.026342451874367,
68
- "eval_accuracy": 1.0,
69
- "eval_loss": 1.5119968338694889e-05,
70
- "eval_runtime": 27.7767,
71
- "eval_samples_per_second": 36.001,
72
- "eval_steps_per_second": 4.5,
73
- "step": 2000
74
- },
75
- {
76
- "epoch": 2.5329280648429586,
77
- "grad_norm": 0.025027019903063774,
78
- "learning_rate": 7.784532252617359e-06,
79
- "loss": 0.0013,
80
- "step": 2500
81
- },
82
- {
83
- "epoch": 2.5329280648429586,
84
- "eval_accuracy": 1.0,
85
- "eval_loss": 2.4935185138019733e-05,
86
- "eval_runtime": 27.3766,
87
- "eval_samples_per_second": 36.528,
88
- "eval_steps_per_second": 4.566,
89
- "step": 2500
90
- },
91
- {
92
- "epoch": 3.0,
93
- "step": 2961,
94
- "total_flos": 7.036273897136456e+17,
95
- "train_loss": 0.009760016079127729,
96
- "train_runtime": 1762.5795,
97
- "train_samples_per_second": 26.869,
98
- "train_steps_per_second": 1.68
99
  }
100
  ],
101
  "logging_steps": 500,
102
- "max_steps": 2961,
103
  "num_input_tokens_seen": 0,
104
- "num_train_epochs": 3,
105
- "save_steps": 1000,
106
  "stateful_callbacks": {
107
  "TrainerControl": {
108
  "args": {
@@ -115,7 +67,7 @@
115
  "attributes": {}
116
  }
117
  },
118
- "total_flos": 7.036273897136456e+17,
119
  "train_batch_size": 16,
120
  "trial_name": null,
121
  "trial_params": null
 
1
  {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 1.5005065856129685,
5
  "eval_steps": 500,
6
+ "global_step": 1481,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.5065856129685917,
13
+ "grad_norm": 0.000192928608157672,
14
+ "learning_rate": 1.676459191498087e-05,
15
+ "loss": 0.0041,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.5065856129685917,
20
+ "eval_accuracy": 0.996,
21
+ "eval_loss": 0.014655331149697304,
22
+ "eval_runtime": 27.4552,
23
+ "eval_samples_per_second": 36.423,
24
+ "eval_steps_per_second": 2.295,
25
  "step": 500
26
  },
27
  {
28
  "epoch": 1.0131712259371835,
29
+ "grad_norm": 0.00017229605873581022,
30
+ "learning_rate": 5.773817382593008e-06,
31
+ "loss": 0.0023,
32
  "step": 1000
33
  },
34
  {
35
  "epoch": 1.0131712259371835,
36
  "eval_accuracy": 1.0,
37
+ "eval_loss": 0.00030512735247612,
38
+ "eval_runtime": 27.4106,
39
+ "eval_samples_per_second": 36.482,
40
+ "eval_steps_per_second": 2.298,
41
  "step": 1000
42
  },
43
  {
44
+ "epoch": 1.5005065856129685,
45
+ "step": 1481,
46
+ "total_flos": 3.5197712872833024e+17,
47
+ "train_loss": 0.002488548292009352,
48
+ "train_runtime": 874.5228,
49
+ "train_samples_per_second": 27.076,
50
+ "train_steps_per_second": 1.693
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
51
  }
52
  ],
53
  "logging_steps": 500,
54
+ "max_steps": 1481,
55
  "num_input_tokens_seen": 0,
56
+ "num_train_epochs": 2,
57
+ "save_steps": 500,
58
  "stateful_callbacks": {
59
  "TrainerControl": {
60
  "args": {
 
67
  "attributes": {}
68
  }
69
  },
70
+ "total_flos": 3.5197712872833024e+17,
71
  "train_batch_size": 16,
72
  "trial_name": null,
73
  "trial_params": null