thean committed on
Commit
0ca5a73
·
1 Parent(s): ec72691

Training in progress, epoch 5

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 2.98,
3
  "eval_accuracy": 0.796875,
4
  "eval_loss": 0.776684582233429,
5
- "eval_runtime": 43.6376,
6
- "eval_samples_per_second": 36.666,
7
- "eval_steps_per_second": 0.573,
8
- "total_flos": 1.1739110279510753e+18,
9
- "train_loss": 1.9657008977646524,
10
- "train_runtime": 10337.147,
11
- "train_samples_per_second": 3.501,
12
- "train_steps_per_second": 0.014
13
  }
 
1
  {
2
+ "epoch": 4.99,
3
  "eval_accuracy": 0.796875,
4
  "eval_loss": 0.776684582233429,
5
+ "eval_runtime": 45.0682,
6
+ "eval_samples_per_second": 35.502,
7
+ "eval_steps_per_second": 0.555,
8
+ "total_flos": 1.971449904436347e+18,
9
+ "train_loss": 0.42377444733964637,
10
+ "train_runtime": 1020.3883,
11
+ "train_samples_per_second": 59.12,
12
+ "train_steps_per_second": 0.23
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.98,
3
  "eval_accuracy": 0.796875,
4
  "eval_loss": 0.776684582233429,
5
- "eval_runtime": 43.6376,
6
- "eval_samples_per_second": 36.666,
7
- "eval_steps_per_second": 0.573
8
  }
 
1
  {
2
+ "epoch": 4.99,
3
  "eval_accuracy": 0.796875,
4
  "eval_loss": 0.776684582233429,
5
+ "eval_runtime": 45.0682,
6
+ "eval_samples_per_second": 35.502,
7
+ "eval_steps_per_second": 0.555
8
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f63348280f49b98c911a27eb5955ea9592b6eb23308bf0fb4b6f8dc927e1854a
3
  size 110552801
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfea6cb0efd41a3bbeb51e4e8f232c2e8ca4897a1818f093bb00bb6ac447036f
3
  size 110552801
runs/Apr21_21-14-33_25733e00f35f/events.out.tfevents.1682124684.25733e00f35f.544.7 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:97fd33c8ed6c3599f399a0585b73fa157abe660142f2370d3745c62b2d7cd634
3
- size 22446
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4330b04eab97d38e0feaf1228792cc07c5c03af9efce91173859d97bfc64b5c
3
+ size 22800
runs/Apr21_21-14-33_25733e00f35f/events.out.tfevents.1682128540.25733e00f35f.544.11 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4fadbdcd72d7e00add7fa3dfe857424f73b0e110de461fcf5faeb51886be835
3
+ size 411
runs/Apr22_01-57-25_25733e00f35f/1682128678.0475118/events.out.tfevents.1682128678.25733e00f35f.544.13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0b509999c3568745e7f46e7e23ad9c7f73bd6285456d6bbe32b3805694b30ee
3
+ size 5961
runs/Apr22_01-57-25_25733e00f35f/events.out.tfevents.1682128678.25733e00f35f.544.12 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99e3574c9d3be163606e7c48c7169ecc2e8d7d3169f01a45adb104a3a5bfb389
3
+ size 7802
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.98,
3
- "total_flos": 1.1739110279510753e+18,
4
- "train_loss": 1.9657008977646524,
5
- "train_runtime": 10337.147,
6
- "train_samples_per_second": 3.501,
7
- "train_steps_per_second": 0.014
8
  }
 
1
  {
2
+ "epoch": 4.99,
3
+ "total_flos": 1.971449904436347e+18,
4
+ "train_loss": 0.42377444733964637,
5
+ "train_runtime": 1020.3883,
6
+ "train_samples_per_second": 59.12,
7
+ "train_steps_per_second": 0.23
8
  }
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.796875,
3
  "best_model_checkpoint": "swinv2-tiny-patch4-window8-256-finetuned-thai/checkpoint-141",
4
- "epoch": 2.984126984126984,
5
- "global_step": 141,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -119,18 +119,90 @@
119
  "step": 141
120
  },
121
  {
122
- "epoch": 2.98,
123
- "step": 141,
124
- "total_flos": 1.1739110279510753e+18,
125
- "train_loss": 1.9657008977646524,
126
- "train_runtime": 10337.147,
127
- "train_samples_per_second": 3.501,
128
- "train_steps_per_second": 0.014
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
129
  }
130
  ],
131
- "max_steps": 141,
132
- "num_train_epochs": 3,
133
- "total_flos": 1.1739110279510753e+18,
134
  "trial_name": null,
135
  "trial_params": null
136
  }
 
1
  {
2
  "best_metric": 0.796875,
3
  "best_model_checkpoint": "swinv2-tiny-patch4-window8-256-finetuned-thai/checkpoint-141",
4
+ "epoch": 4.98941798941799,
5
+ "global_step": 235,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
119
  "step": 141
120
  },
121
  {
122
+ "epoch": 3.19,
123
+ "learning_rate": 0.0,
124
+ "loss": 1.092,
125
+ "step": 150
126
+ },
127
+ {
128
+ "epoch": 3.4,
129
+ "learning_rate": 0.0,
130
+ "loss": 1.0781,
131
+ "step": 160
132
+ },
133
+ {
134
+ "epoch": 3.61,
135
+ "learning_rate": 0.0,
136
+ "loss": 1.0461,
137
+ "step": 170
138
+ },
139
+ {
140
+ "epoch": 3.83,
141
+ "learning_rate": 0.0,
142
+ "loss": 1.0487,
143
+ "step": 180
144
+ },
145
+ {
146
+ "epoch": 3.99,
147
+ "eval_accuracy": 0.796875,
148
+ "eval_loss": 0.776684582233429,
149
+ "eval_runtime": 43.5371,
150
+ "eval_samples_per_second": 36.75,
151
+ "eval_steps_per_second": 0.574,
152
+ "step": 188
153
+ },
154
+ {
155
+ "epoch": 4.04,
156
+ "learning_rate": 0.0,
157
+ "loss": 1.0316,
158
+ "step": 190
159
+ },
160
+ {
161
+ "epoch": 4.25,
162
+ "learning_rate": 0.0,
163
+ "loss": 1.06,
164
+ "step": 200
165
+ },
166
+ {
167
+ "epoch": 4.46,
168
+ "learning_rate": 0.0,
169
+ "loss": 1.0528,
170
+ "step": 210
171
+ },
172
+ {
173
+ "epoch": 4.67,
174
+ "learning_rate": 0.0,
175
+ "loss": 1.0339,
176
+ "step": 220
177
+ },
178
+ {
179
+ "epoch": 4.88,
180
+ "learning_rate": 0.0,
181
+ "loss": 1.0889,
182
+ "step": 230
183
+ },
184
+ {
185
+ "epoch": 4.99,
186
+ "eval_accuracy": 0.796875,
187
+ "eval_loss": 0.776684582233429,
188
+ "eval_runtime": 43.9225,
189
+ "eval_samples_per_second": 36.428,
190
+ "eval_steps_per_second": 0.569,
191
+ "step": 235
192
+ },
193
+ {
194
+ "epoch": 4.99,
195
+ "step": 235,
196
+ "total_flos": 1.971449904436347e+18,
197
+ "train_loss": 0.42377444733964637,
198
+ "train_runtime": 1020.3883,
199
+ "train_samples_per_second": 59.12,
200
+ "train_steps_per_second": 0.23
201
  }
202
  ],
203
+ "max_steps": 235,
204
+ "num_train_epochs": 5,
205
+ "total_flos": 1.971449904436347e+18,
206
  "trial_name": null,
207
  "trial_params": null
208
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c88f8d9e6e17864b2fbdc5786aa50c38e06a595f903bf942228e7ba7bd33fe7a
3
  size 3643
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c3c0fd013aeeb31c04363116eb17010e8356d94af1eff566cd9e2e854b96dc9
3
  size 3643