RobertoSonic commited on
Commit
94e73cd
·
verified ·
1 Parent(s): 1fce96b

End of training

Browse files
README.md CHANGED
@@ -19,7 +19,7 @@ should probably proofread and complete it, then remove this comment. -->
19
  This model is a fine-tuned version of [microsoft/swinv2-tiny-patch4-window8-256](https://huggingface.co/microsoft/swinv2-tiny-patch4-window8-256) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
  - Loss: 0.7428
22
- - Accuracy: 0.75
23
 
24
  ## Model description
25
 
 
19
  This model is a fine-tuned version of [microsoft/swinv2-tiny-patch4-window8-256](https://huggingface.co/microsoft/swinv2-tiny-patch4-window8-256) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
  - Loss: 0.7428
22
+ - Accuracy: 0.7614
23
 
24
  ## Model description
25
 
all_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 30.0,
3
+ "eval_accuracy": 0.7613636363636364,
4
+ "eval_loss": 0.7427918910980225,
5
+ "eval_runtime": 1.7844,
6
+ "eval_samples_per_second": 49.316,
7
+ "eval_steps_per_second": 1.681,
8
+ "total_flos": 3.982534914657485e+17,
9
+ "train_loss": 2.4056013425191245,
10
+ "train_runtime": 469.8187,
11
+ "train_samples_per_second": 34.737,
12
+ "train_steps_per_second": 0.255
13
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 30.0,
3
+ "eval_accuracy": 0.7613636363636364,
4
+ "eval_loss": 0.7427918910980225,
5
+ "eval_runtime": 1.7844,
6
+ "eval_samples_per_second": 49.316,
7
+ "eval_steps_per_second": 1.681
8
+ }
runs/Feb05_23-59-36_2066b31ba251/events.out.tfevents.1738800491.2066b31ba251.3964.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:656fb0909c453e2d9b15f99c2e3766db47e22ad0900c0e6d83ee9e8302d03b96
3
+ size 405
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 30.0,
3
+ "total_flos": 3.982534914657485e+17,
4
+ "train_loss": 2.4056013425191245,
5
+ "train_runtime": 469.8187,
6
+ "train_samples_per_second": 34.737,
7
+ "train_steps_per_second": 0.255
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,382 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.7613636363636364,
3
+ "best_model_checkpoint": "swinv2-tiny-patch4-window8-256-dmae-humeda-DAV40/checkpoint-100",
4
+ "epoch": 30.0,
5
+ "eval_steps": 500,
6
+ "global_step": 120,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "eval_accuracy": 0.3409090909090909,
14
+ "eval_loss": 1.5349395275115967,
15
+ "eval_runtime": 2.5542,
16
+ "eval_samples_per_second": 34.453,
17
+ "eval_steps_per_second": 1.175,
18
+ "step": 4
19
+ },
20
+ {
21
+ "epoch": 2.0,
22
+ "eval_accuracy": 0.4431818181818182,
23
+ "eval_loss": 1.321252703666687,
24
+ "eval_runtime": 2.354,
25
+ "eval_samples_per_second": 37.383,
26
+ "eval_steps_per_second": 1.274,
27
+ "step": 8
28
+ },
29
+ {
30
+ "epoch": 3.0,
31
+ "grad_norm": 8.033442497253418,
32
+ "learning_rate": 5e-05,
33
+ "loss": 4.7629,
34
+ "step": 12
35
+ },
36
+ {
37
+ "epoch": 3.0,
38
+ "eval_accuracy": 0.4431818181818182,
39
+ "eval_loss": 1.2540555000305176,
40
+ "eval_runtime": 2.642,
41
+ "eval_samples_per_second": 33.308,
42
+ "eval_steps_per_second": 1.136,
43
+ "step": 12
44
+ },
45
+ {
46
+ "epoch": 4.0,
47
+ "eval_accuracy": 0.6022727272727273,
48
+ "eval_loss": 1.2072031497955322,
49
+ "eval_runtime": 1.7756,
50
+ "eval_samples_per_second": 49.56,
51
+ "eval_steps_per_second": 1.69,
52
+ "step": 16
53
+ },
54
+ {
55
+ "epoch": 5.0,
56
+ "eval_accuracy": 0.6363636363636364,
57
+ "eval_loss": 1.1313027143478394,
58
+ "eval_runtime": 1.6972,
59
+ "eval_samples_per_second": 51.852,
60
+ "eval_steps_per_second": 1.768,
61
+ "step": 20
62
+ },
63
+ {
64
+ "epoch": 6.0,
65
+ "grad_norm": 8.113847732543945,
66
+ "learning_rate": 4.849231551964771e-05,
67
+ "loss": 3.7987,
68
+ "step": 24
69
+ },
70
+ {
71
+ "epoch": 6.0,
72
+ "eval_accuracy": 0.6477272727272727,
73
+ "eval_loss": 1.0712097883224487,
74
+ "eval_runtime": 1.7097,
75
+ "eval_samples_per_second": 51.471,
76
+ "eval_steps_per_second": 1.755,
77
+ "step": 24
78
+ },
79
+ {
80
+ "epoch": 7.0,
81
+ "eval_accuracy": 0.6590909090909091,
82
+ "eval_loss": 0.967653214931488,
83
+ "eval_runtime": 1.7586,
84
+ "eval_samples_per_second": 50.041,
85
+ "eval_steps_per_second": 1.706,
86
+ "step": 28
87
+ },
88
+ {
89
+ "epoch": 8.0,
90
+ "eval_accuracy": 0.7159090909090909,
91
+ "eval_loss": 0.8655213713645935,
92
+ "eval_runtime": 1.6895,
93
+ "eval_samples_per_second": 52.087,
94
+ "eval_steps_per_second": 1.776,
95
+ "step": 32
96
+ },
97
+ {
98
+ "epoch": 9.0,
99
+ "grad_norm": 13.333137512207031,
100
+ "learning_rate": 4.415111107797445e-05,
101
+ "loss": 3.0437,
102
+ "step": 36
103
+ },
104
+ {
105
+ "epoch": 9.0,
106
+ "eval_accuracy": 0.6818181818181818,
107
+ "eval_loss": 0.8563566207885742,
108
+ "eval_runtime": 1.7069,
109
+ "eval_samples_per_second": 51.555,
110
+ "eval_steps_per_second": 1.758,
111
+ "step": 36
112
+ },
113
+ {
114
+ "epoch": 10.0,
115
+ "eval_accuracy": 0.6818181818181818,
116
+ "eval_loss": 0.8003210425376892,
117
+ "eval_runtime": 1.7037,
118
+ "eval_samples_per_second": 51.653,
119
+ "eval_steps_per_second": 1.761,
120
+ "step": 40
121
+ },
122
+ {
123
+ "epoch": 11.0,
124
+ "eval_accuracy": 0.7386363636363636,
125
+ "eval_loss": 0.7986971139907837,
126
+ "eval_runtime": 2.4009,
127
+ "eval_samples_per_second": 36.653,
128
+ "eval_steps_per_second": 1.25,
129
+ "step": 44
130
+ },
131
+ {
132
+ "epoch": 12.0,
133
+ "grad_norm": 16.13611602783203,
134
+ "learning_rate": 3.7500000000000003e-05,
135
+ "loss": 2.4867,
136
+ "step": 48
137
+ },
138
+ {
139
+ "epoch": 12.0,
140
+ "eval_accuracy": 0.7159090909090909,
141
+ "eval_loss": 0.7619297504425049,
142
+ "eval_runtime": 2.3634,
143
+ "eval_samples_per_second": 37.235,
144
+ "eval_steps_per_second": 1.269,
145
+ "step": 48
146
+ },
147
+ {
148
+ "epoch": 13.0,
149
+ "eval_accuracy": 0.7386363636363636,
150
+ "eval_loss": 0.7425692081451416,
151
+ "eval_runtime": 1.785,
152
+ "eval_samples_per_second": 49.3,
153
+ "eval_steps_per_second": 1.681,
154
+ "step": 52
155
+ },
156
+ {
157
+ "epoch": 14.0,
158
+ "eval_accuracy": 0.6931818181818182,
159
+ "eval_loss": 0.7491652965545654,
160
+ "eval_runtime": 1.6916,
161
+ "eval_samples_per_second": 52.023,
162
+ "eval_steps_per_second": 1.774,
163
+ "step": 56
164
+ },
165
+ {
166
+ "epoch": 15.0,
167
+ "grad_norm": 18.206378936767578,
168
+ "learning_rate": 2.9341204441673266e-05,
169
+ "loss": 2.147,
170
+ "step": 60
171
+ },
172
+ {
173
+ "epoch": 15.0,
174
+ "eval_accuracy": 0.7159090909090909,
175
+ "eval_loss": 0.7827097177505493,
176
+ "eval_runtime": 1.681,
177
+ "eval_samples_per_second": 52.349,
178
+ "eval_steps_per_second": 1.785,
179
+ "step": 60
180
+ },
181
+ {
182
+ "epoch": 16.0,
183
+ "eval_accuracy": 0.7045454545454546,
184
+ "eval_loss": 0.7509434223175049,
185
+ "eval_runtime": 1.7041,
186
+ "eval_samples_per_second": 51.641,
187
+ "eval_steps_per_second": 1.76,
188
+ "step": 64
189
+ },
190
+ {
191
+ "epoch": 17.0,
192
+ "eval_accuracy": 0.7386363636363636,
193
+ "eval_loss": 0.7364481091499329,
194
+ "eval_runtime": 1.6978,
195
+ "eval_samples_per_second": 51.831,
196
+ "eval_steps_per_second": 1.767,
197
+ "step": 68
198
+ },
199
+ {
200
+ "epoch": 18.0,
201
+ "grad_norm": 16.78498649597168,
202
+ "learning_rate": 2.0658795558326743e-05,
203
+ "loss": 1.8443,
204
+ "step": 72
205
+ },
206
+ {
207
+ "epoch": 18.0,
208
+ "eval_accuracy": 0.7159090909090909,
209
+ "eval_loss": 0.770459771156311,
210
+ "eval_runtime": 1.7059,
211
+ "eval_samples_per_second": 51.585,
212
+ "eval_steps_per_second": 1.759,
213
+ "step": 72
214
+ },
215
+ {
216
+ "epoch": 19.0,
217
+ "eval_accuracy": 0.7272727272727273,
218
+ "eval_loss": 0.7515316009521484,
219
+ "eval_runtime": 1.7077,
220
+ "eval_samples_per_second": 51.532,
221
+ "eval_steps_per_second": 1.757,
222
+ "step": 76
223
+ },
224
+ {
225
+ "epoch": 20.0,
226
+ "eval_accuracy": 0.7386363636363636,
227
+ "eval_loss": 0.747029721736908,
228
+ "eval_runtime": 1.8467,
229
+ "eval_samples_per_second": 47.652,
230
+ "eval_steps_per_second": 1.625,
231
+ "step": 80
232
+ },
233
+ {
234
+ "epoch": 21.0,
235
+ "grad_norm": 14.945952415466309,
236
+ "learning_rate": 1.2500000000000006e-05,
237
+ "loss": 1.659,
238
+ "step": 84
239
+ },
240
+ {
241
+ "epoch": 21.0,
242
+ "eval_accuracy": 0.75,
243
+ "eval_loss": 0.7494531273841858,
244
+ "eval_runtime": 2.3744,
245
+ "eval_samples_per_second": 37.062,
246
+ "eval_steps_per_second": 1.263,
247
+ "step": 84
248
+ },
249
+ {
250
+ "epoch": 22.0,
251
+ "eval_accuracy": 0.75,
252
+ "eval_loss": 0.7236538529396057,
253
+ "eval_runtime": 2.3525,
254
+ "eval_samples_per_second": 37.408,
255
+ "eval_steps_per_second": 1.275,
256
+ "step": 88
257
+ },
258
+ {
259
+ "epoch": 23.0,
260
+ "eval_accuracy": 0.75,
261
+ "eval_loss": 0.744009256362915,
262
+ "eval_runtime": 2.2107,
263
+ "eval_samples_per_second": 39.807,
264
+ "eval_steps_per_second": 1.357,
265
+ "step": 92
266
+ },
267
+ {
268
+ "epoch": 24.0,
269
+ "grad_norm": 21.294570922851562,
270
+ "learning_rate": 5.848888922025553e-06,
271
+ "loss": 1.5303,
272
+ "step": 96
273
+ },
274
+ {
275
+ "epoch": 24.0,
276
+ "eval_accuracy": 0.75,
277
+ "eval_loss": 0.736692488193512,
278
+ "eval_runtime": 1.7151,
279
+ "eval_samples_per_second": 51.31,
280
+ "eval_steps_per_second": 1.749,
281
+ "step": 96
282
+ },
283
+ {
284
+ "epoch": 25.0,
285
+ "eval_accuracy": 0.7613636363636364,
286
+ "eval_loss": 0.7427918910980225,
287
+ "eval_runtime": 1.6602,
288
+ "eval_samples_per_second": 53.006,
289
+ "eval_steps_per_second": 1.807,
290
+ "step": 100
291
+ },
292
+ {
293
+ "epoch": 26.0,
294
+ "eval_accuracy": 0.75,
295
+ "eval_loss": 0.7406925559043884,
296
+ "eval_runtime": 1.671,
297
+ "eval_samples_per_second": 52.662,
298
+ "eval_steps_per_second": 1.795,
299
+ "step": 104
300
+ },
301
+ {
302
+ "epoch": 27.0,
303
+ "grad_norm": 18.939655303955078,
304
+ "learning_rate": 1.5076844803522922e-06,
305
+ "loss": 1.4305,
306
+ "step": 108
307
+ },
308
+ {
309
+ "epoch": 27.0,
310
+ "eval_accuracy": 0.75,
311
+ "eval_loss": 0.740644633769989,
312
+ "eval_runtime": 1.6889,
313
+ "eval_samples_per_second": 52.104,
314
+ "eval_steps_per_second": 1.776,
315
+ "step": 108
316
+ },
317
+ {
318
+ "epoch": 28.0,
319
+ "eval_accuracy": 0.75,
320
+ "eval_loss": 0.7422773241996765,
321
+ "eval_runtime": 1.6858,
322
+ "eval_samples_per_second": 52.2,
323
+ "eval_steps_per_second": 1.78,
324
+ "step": 112
325
+ },
326
+ {
327
+ "epoch": 29.0,
328
+ "eval_accuracy": 0.75,
329
+ "eval_loss": 0.7426608800888062,
330
+ "eval_runtime": 1.7009,
331
+ "eval_samples_per_second": 51.738,
332
+ "eval_steps_per_second": 1.764,
333
+ "step": 116
334
+ },
335
+ {
336
+ "epoch": 30.0,
337
+ "grad_norm": 13.808012962341309,
338
+ "learning_rate": 0.0,
339
+ "loss": 1.3529,
340
+ "step": 120
341
+ },
342
+ {
343
+ "epoch": 30.0,
344
+ "eval_accuracy": 0.75,
345
+ "eval_loss": 0.7427504062652588,
346
+ "eval_runtime": 2.6552,
347
+ "eval_samples_per_second": 33.142,
348
+ "eval_steps_per_second": 1.13,
349
+ "step": 120
350
+ },
351
+ {
352
+ "epoch": 30.0,
353
+ "step": 120,
354
+ "total_flos": 3.982534914657485e+17,
355
+ "train_loss": 2.4056013425191245,
356
+ "train_runtime": 469.8187,
357
+ "train_samples_per_second": 34.737,
358
+ "train_steps_per_second": 0.255
359
+ }
360
+ ],
361
+ "logging_steps": 12,
362
+ "max_steps": 120,
363
+ "num_input_tokens_seen": 0,
364
+ "num_train_epochs": 40,
365
+ "save_steps": 500,
366
+ "stateful_callbacks": {
367
+ "TrainerControl": {
368
+ "args": {
369
+ "should_epoch_stop": false,
370
+ "should_evaluate": false,
371
+ "should_log": false,
372
+ "should_save": true,
373
+ "should_training_stop": true
374
+ },
375
+ "attributes": {}
376
+ }
377
+ },
378
+ "total_flos": 3.982534914657485e+17,
379
+ "train_batch_size": 32,
380
+ "trial_name": null,
381
+ "trial_params": null
382
+ }