andro-flock committed on
Commit
7c0fe75
·
verified ·
1 Parent(s): 641b5b0

Model save

Browse files
README.md CHANGED
@@ -2,8 +2,6 @@
2
  library_name: transformers
3
  base_model: andro-flock/b2-classification
4
  tags:
5
- - image-segmentation
6
- - vision
7
  - generated_from_trainer
8
  model-index:
9
  - name: b2-segmentation
@@ -15,7 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # b2-segmentation
17
 
18
- This model is a fine-tuned version of [andro-flock/b2-classification](https://huggingface.co/andro-flock/b2-classification) on the andro-flock/semantic-segment dataset.
19
 
20
  ## Model description
21
 
@@ -35,11 +33,9 @@ More information needed
35
 
36
  The following hyperparameters were used during training:
37
  - learning_rate: 6e-05
38
- - train_batch_size: 4
39
  - eval_batch_size: 8
40
  - seed: 1337
41
- - gradient_accumulation_steps: 2
42
- - total_train_batch_size: 8
43
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
44
  - lr_scheduler_type: polynomial
45
  - training_steps: 500
 
2
  library_name: transformers
3
  base_model: andro-flock/b2-classification
4
  tags:
 
 
5
  - generated_from_trainer
6
  model-index:
7
  - name: b2-segmentation
 
13
 
14
  # b2-segmentation
15
 
16
+ This model is a fine-tuned version of [andro-flock/b2-classification](https://huggingface.co/andro-flock/b2-classification) on an unknown dataset.
17
 
18
  ## Model description
19
 
 
33
 
34
  The following hyperparameters were used during training:
35
  - learning_rate: 6e-05
36
+ - train_batch_size: 8
37
  - eval_batch_size: 8
38
  - seed: 1337
 
 
39
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
40
  - lr_scheduler_type: polynomial
41
  - training_steps: 500
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 125.0,
3
- "total_flos": 4.67800620466176e+17,
4
- "train_loss": 0.1090870885848999,
5
- "train_runtime": 959.3782,
6
- "train_samples_per_second": 4.169,
7
- "train_steps_per_second": 0.521
8
  }
 
1
  {
2
+ "epoch": 500.0,
3
+ "total_flos": 7.8886713950208e+16,
4
+ "train_loss": 0.1895984401702881,
5
+ "train_runtime": 397.1334,
6
+ "train_samples_per_second": 20.144,
7
+ "train_steps_per_second": 2.518
8
  }
config.json CHANGED
@@ -29,15 +29,17 @@
29
  ],
30
  "id2label": {
31
  "0": "background",
32
- "1": "head",
33
- "2": "body"
 
34
  },
35
  "image_size": 224,
36
  "initializer_range": 0.02,
37
  "label2id": {
38
  "background": "0",
39
- "body": "2",
40
- "head": "1"
 
41
  },
42
  "layer_norm_eps": 1e-06,
43
  "mlp_ratios": [
 
29
  ],
30
  "id2label": {
31
  "0": "background",
32
+ "1": "hair",
33
+ "2": "skin",
34
+ "3": "cloths"
35
  },
36
  "image_size": 224,
37
  "initializer_range": 0.02,
38
  "label2id": {
39
  "background": "0",
40
+ "cloths": "3",
41
+ "hair": "1",
42
+ "skin": "2"
43
  },
44
  "layer_norm_eps": 1e-06,
45
  "mlp_ratios": [
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14842d4a49c211fcec3cd7a79d0a8bcf4f92ee43da4d1e3f6d88c089891de57d
3
- size 109447092
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3529b865cae264a86f42ccef78802036c949e12444f78c61e7854fdf7b666b73
3
+ size 109450168
runs/Mar07_01-57-13_183eb2dda0db/events.out.tfevents.1741312639.183eb2dda0db.2407.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:874d28aa52d2a3c3cb546be0b17ba5ebab5cc9e5a8a81d0e4aa0ade293332e56
3
+ size 5662
runs/Mar07_02-03-50_183eb2dda0db/events.out.tfevents.1741313034.183eb2dda0db.4118.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:070a33ecc508c8bd126b1c16beba7cb843dc34fc6e031adb61d3f25a7b05b178
3
+ size 6649
runs/Mar07_02-12-31_183eb2dda0db/events.out.tfevents.1741313556.183eb2dda0db.6286.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8760feb8ba6a2009e6e9b958b43b0ee1e7ea7c43830859fd9e075764934533f2
3
+ size 7072
runs/Mar07_02-24-11_183eb2dda0db/events.out.tfevents.1741314258.183eb2dda0db.9202.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b80efeff04198213316d3b79e80557ba0d91de1c96d0bd3a50ddc370dfea0536
3
+ size 6455
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 125.0,
3
- "total_flos": 4.67800620466176e+17,
4
- "train_loss": 0.1090870885848999,
5
- "train_runtime": 959.3782,
6
- "train_samples_per_second": 4.169,
7
- "train_steps_per_second": 0.521
8
  }
 
1
  {
2
+ "epoch": 500.0,
3
+ "total_flos": 7.8886713950208e+16,
4
+ "train_loss": 0.1895984401702881,
5
+ "train_runtime": 397.1334,
6
+ "train_samples_per_second": 20.144,
7
+ "train_steps_per_second": 2.518
8
  }
trainer_state.json CHANGED
@@ -1,97 +1,62 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 125.0,
5
  "eval_steps": 500,
6
- "global_step": 500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 12.5,
13
- "grad_norm": 3.6458182334899902,
14
- "learning_rate": 5.401e-05,
15
- "loss": 0.3174,
16
- "step": 50
17
- },
18
- {
19
- "epoch": 25.0,
20
- "grad_norm": 2.206636905670166,
21
  "learning_rate": 4.8020000000000004e-05,
22
- "loss": 0.1611,
23
- "step": 100
24
- },
25
- {
26
- "epoch": 37.5,
27
- "grad_norm": 0.8555470705032349,
28
- "learning_rate": 4.203e-05,
29
- "loss": 0.1319,
30
- "step": 150
31
- },
32
- {
33
- "epoch": 50.0,
34
- "grad_norm": 0.6757478713989258,
35
- "learning_rate": 3.604e-05,
36
- "loss": 0.1038,
37
  "step": 200
38
  },
39
  {
40
- "epoch": 62.5,
41
- "grad_norm": 1.159254550933838,
42
- "learning_rate": 3.0050000000000002e-05,
43
- "loss": 0.0701,
44
- "step": 250
45
  },
46
  {
47
- "epoch": 75.0,
48
- "grad_norm": 2.89020037651062,
49
  "learning_rate": 2.406e-05,
50
- "loss": 0.0658,
51
- "step": 300
52
- },
53
- {
54
- "epoch": 87.5,
55
- "grad_norm": 1.4937611818313599,
56
- "learning_rate": 1.807e-05,
57
- "loss": 0.0635,
58
- "step": 350
59
  },
60
  {
61
- "epoch": 100.0,
62
- "grad_norm": 0.5791894197463989,
63
  "learning_rate": 1.2079999999999998e-05,
64
- "loss": 0.0692,
65
- "step": 400
66
- },
67
- {
68
- "epoch": 112.5,
69
- "grad_norm": 0.22667507827281952,
70
- "learning_rate": 6.0899999999999984e-06,
71
- "loss": 0.0585,
72
- "step": 450
73
  },
74
  {
75
- "epoch": 125.0,
76
- "grad_norm": 0.2987639307975769,
77
  "learning_rate": 1e-07,
78
- "loss": 0.0497,
79
- "step": 500
80
  },
81
  {
82
- "epoch": 125.0,
83
- "step": 500,
84
- "total_flos": 4.67800620466176e+17,
85
- "train_loss": 0.1090870885848999,
86
- "train_runtime": 959.3782,
87
- "train_samples_per_second": 4.169,
88
- "train_steps_per_second": 0.521
89
  }
90
  ],
91
- "logging_steps": 50,
92
- "max_steps": 500,
93
  "num_input_tokens_seen": 0,
94
- "num_train_epochs": 125,
95
  "save_steps": 500,
96
  "stateful_callbacks": {
97
  "TrainerControl": {
@@ -105,8 +70,8 @@
105
  "attributes": {}
106
  }
107
  },
108
- "total_flos": 4.67800620466176e+17,
109
- "train_batch_size": 4,
110
  "trial_name": null,
111
  "trial_params": null
112
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 500.0,
5
  "eval_steps": 500,
6
+ "global_step": 1000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 100.0,
13
+ "grad_norm": 1.8578704595565796,
 
 
 
 
 
 
 
14
  "learning_rate": 4.8020000000000004e-05,
15
+ "loss": 0.4234,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16
  "step": 200
17
  },
18
  {
19
+ "epoch": 200.0,
20
+ "grad_norm": 0.6928507685661316,
21
+ "learning_rate": 3.604e-05,
22
+ "loss": 0.1814,
23
+ "step": 400
24
  },
25
  {
26
+ "epoch": 300.0,
27
+ "grad_norm": 1.1086845397949219,
28
  "learning_rate": 2.406e-05,
29
+ "loss": 0.1281,
30
+ "step": 600
 
 
 
 
 
 
 
31
  },
32
  {
33
+ "epoch": 400.0,
34
+ "grad_norm": 1.4631288051605225,
35
  "learning_rate": 1.2079999999999998e-05,
36
+ "loss": 0.1144,
37
+ "step": 800
 
 
 
 
 
 
 
38
  },
39
  {
40
+ "epoch": 500.0,
41
+ "grad_norm": 0.9606817364692688,
42
  "learning_rate": 1e-07,
43
+ "loss": 0.1007,
44
+ "step": 1000
45
  },
46
  {
47
+ "epoch": 500.0,
48
+ "step": 1000,
49
+ "total_flos": 7.8886713950208e+16,
50
+ "train_loss": 0.1895984401702881,
51
+ "train_runtime": 397.1334,
52
+ "train_samples_per_second": 20.144,
53
+ "train_steps_per_second": 2.518
54
  }
55
  ],
56
+ "logging_steps": 200,
57
+ "max_steps": 1000,
58
  "num_input_tokens_seen": 0,
59
+ "num_train_epochs": 500,
60
  "save_steps": 500,
61
  "stateful_callbacks": {
62
  "TrainerControl": {
 
70
  "attributes": {}
71
  }
72
  },
73
+ "total_flos": 7.8886713950208e+16,
74
+ "train_batch_size": 8,
75
  "trial_name": null,
76
  "trial_params": null
77
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f63fef78833f2e056701b0761ddf3d0a22cccb53dcde50e0fbfdf6c737ced8db
3
- size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a31b223fa03376c8ece09ab0e17c53ee11f53b02c5d17355ccd5503c10c6ee91
3
+ size 5432