Melo1512 committed on
Commit
a0ffda3
·
verified ·
1 Parent(s): 5e43645

End of training

Browse files
README.md CHANGED
@@ -23,7 +23,7 @@ model-index:
23
  metrics:
24
  - name: Accuracy
25
  type: accuracy
26
- value: 0.9120879120879121
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -33,8 +33,8 @@ should probably proofread and complete it, then remove this comment. -->
33
 
34
  This model is a fine-tuned version of [facebook/vit-msn-small](https://huggingface.co/facebook/vit-msn-small) on the imagefolder dataset.
35
  It achieves the following results on the evaluation set:
36
- - Loss: 0.2491
37
- - Accuracy: 0.9121
38
 
39
  ## Model description
40
 
 
23
  metrics:
24
  - name: Accuracy
25
  type: accuracy
26
+ value: 0.9194139194139194
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
33
 
34
  This model is a fine-tuned version of [facebook/vit-msn-small](https://huggingface.co/facebook/vit-msn-small) on the imagefolder dataset.
35
  It achieves the following results on the evaluation set:
36
+ - Loss: 0.2229
37
+ - Accuracy: 0.9194
38
 
39
  ## Model description
40
 
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 18.46153846153846,
3
- "eval_accuracy": 0.9497584541062802,
4
- "eval_loss": 0.1871330887079239,
5
- "eval_runtime": 4.3162,
6
- "eval_samples_per_second": 239.797,
7
- "eval_steps_per_second": 3.939,
8
  "total_flos": 2.9458314315627725e+17,
9
- "train_loss": 0.35900469223658243,
10
- "train_runtime": 212.0852,
11
- "train_samples_per_second": 76.856,
12
- "train_steps_per_second": 0.283
13
  }
 
1
  {
2
  "epoch": 18.46153846153846,
3
+ "eval_accuracy": 0.9194139194139194,
4
+ "eval_loss": 0.22294031083583832,
5
+ "eval_runtime": 1.2677,
6
+ "eval_samples_per_second": 215.358,
7
+ "eval_steps_per_second": 3.944,
8
  "total_flos": 2.9458314315627725e+17,
9
+ "train_loss": 0.342086935043335,
10
+ "train_runtime": 153.4118,
11
+ "train_samples_per_second": 106.25,
12
+ "train_steps_per_second": 0.391
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 18.46153846153846,
3
- "eval_accuracy": 0.9497584541062802,
4
- "eval_loss": 0.1871330887079239,
5
- "eval_runtime": 4.3162,
6
- "eval_samples_per_second": 239.797,
7
- "eval_steps_per_second": 3.939
8
  }
 
1
  {
2
  "epoch": 18.46153846153846,
3
+ "eval_accuracy": 0.9194139194139194,
4
+ "eval_loss": 0.22294031083583832,
5
+ "eval_runtime": 1.2677,
6
+ "eval_samples_per_second": 215.358,
7
+ "eval_steps_per_second": 3.944
8
  }
runs/Jan14_17-44-41_c583982b4f3d/events.out.tfevents.1736876900.c583982b4f3d.215.9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5e372d0453ced4d5ac7d7fcee3f40ec8bd5be65095c31c693c1a65c13d94143
3
+ size 405
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 18.46153846153846,
3
  "total_flos": 2.9458314315627725e+17,
4
- "train_loss": 0.35900469223658243,
5
- "train_runtime": 212.0852,
6
- "train_samples_per_second": 76.856,
7
- "train_steps_per_second": 0.283
8
  }
 
1
  {
2
  "epoch": 18.46153846153846,
3
  "total_flos": 2.9458314315627725e+17,
4
+ "train_loss": 0.342086935043335,
5
+ "train_runtime": 153.4118,
6
+ "train_samples_per_second": 106.25,
7
+ "train_steps_per_second": 0.391
8
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.9497584541062802,
3
- "best_model_checkpoint": "vit-msn-small-corect_deepcleaned_dataset_lateral_flow_ivalidation/checkpoint-22",
4
  "epoch": 18.46153846153846,
5
  "eval_steps": 500,
6
  "global_step": 60,
@@ -10,225 +10,225 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.9230769230769231,
13
- "eval_accuracy": 0.8927536231884058,
14
- "eval_loss": 0.3933483958244324,
15
- "eval_runtime": 4.3694,
16
- "eval_samples_per_second": 236.874,
17
- "eval_steps_per_second": 3.891,
18
  "step": 3
19
  },
20
  {
21
  "epoch": 1.8461538461538463,
22
- "eval_accuracy": 0.9188405797101449,
23
- "eval_loss": 0.4166622459888458,
24
- "eval_runtime": 4.2818,
25
- "eval_samples_per_second": 241.72,
26
- "eval_steps_per_second": 3.97,
27
  "step": 6
28
  },
29
  {
30
  "epoch": 2.769230769230769,
31
- "eval_accuracy": 0.4966183574879227,
32
- "eval_loss": 0.933142364025116,
33
- "eval_runtime": 4.3066,
34
- "eval_samples_per_second": 240.328,
35
- "eval_steps_per_second": 3.947,
36
  "step": 9
37
  },
38
  {
39
  "epoch": 3.076923076923077,
40
- "grad_norm": 62.32957458496094,
41
  "learning_rate": 4.62962962962963e-05,
42
- "loss": 0.615,
43
  "step": 10
44
  },
45
  {
46
  "epoch": 4.0,
47
- "eval_accuracy": 0.9178743961352657,
48
- "eval_loss": 0.3084805905818939,
49
- "eval_runtime": 4.3796,
50
- "eval_samples_per_second": 236.322,
51
- "eval_steps_per_second": 3.882,
52
  "step": 13
53
  },
54
  {
55
  "epoch": 4.923076923076923,
56
- "eval_accuracy": 0.9333333333333333,
57
- "eval_loss": 0.22097891569137573,
58
- "eval_runtime": 4.3446,
59
- "eval_samples_per_second": 238.226,
60
- "eval_steps_per_second": 3.913,
61
  "step": 16
62
  },
63
  {
64
  "epoch": 5.846153846153846,
65
- "eval_accuracy": 0.9391304347826087,
66
- "eval_loss": 0.21061654388904572,
67
- "eval_runtime": 4.4485,
68
- "eval_samples_per_second": 232.66,
69
- "eval_steps_per_second": 3.821,
70
  "step": 19
71
  },
72
  {
73
  "epoch": 6.153846153846154,
74
- "grad_norm": 3.9477076530456543,
75
  "learning_rate": 3.7037037037037037e-05,
76
- "loss": 0.3763,
77
  "step": 20
78
  },
79
  {
80
  "epoch": 6.769230769230769,
81
- "eval_accuracy": 0.9497584541062802,
82
- "eval_loss": 0.1871330887079239,
83
- "eval_runtime": 4.3598,
84
- "eval_samples_per_second": 237.396,
85
- "eval_steps_per_second": 3.899,
86
  "step": 22
87
  },
88
  {
89
  "epoch": 8.0,
90
- "eval_accuracy": 0.9371980676328503,
91
- "eval_loss": 0.20427261292934418,
92
- "eval_runtime": 4.2827,
93
- "eval_samples_per_second": 241.673,
94
- "eval_steps_per_second": 3.97,
95
  "step": 26
96
  },
97
  {
98
  "epoch": 8.923076923076923,
99
- "eval_accuracy": 0.8888888888888888,
100
- "eval_loss": 0.31205740571022034,
101
- "eval_runtime": 4.4195,
102
- "eval_samples_per_second": 234.192,
103
- "eval_steps_per_second": 3.847,
104
  "step": 29
105
  },
106
  {
107
  "epoch": 9.23076923076923,
108
- "grad_norm": 4.070008754730225,
109
  "learning_rate": 2.777777777777778e-05,
110
- "loss": 0.3511,
111
  "step": 30
112
  },
113
  {
114
  "epoch": 9.846153846153847,
115
- "eval_accuracy": 0.9314009661835749,
116
- "eval_loss": 0.20154337584972382,
117
- "eval_runtime": 4.2969,
118
- "eval_samples_per_second": 240.871,
119
- "eval_steps_per_second": 3.956,
120
  "step": 32
121
  },
122
  {
123
  "epoch": 10.76923076923077,
124
- "eval_accuracy": 0.8376811594202899,
125
- "eval_loss": 0.44852134585380554,
126
- "eval_runtime": 4.3709,
127
- "eval_samples_per_second": 236.795,
128
- "eval_steps_per_second": 3.889,
129
  "step": 35
130
  },
131
  {
132
  "epoch": 12.0,
133
- "eval_accuracy": 0.9285024154589372,
134
- "eval_loss": 0.24452261626720428,
135
- "eval_runtime": 4.3262,
136
- "eval_samples_per_second": 239.241,
137
- "eval_steps_per_second": 3.93,
138
  "step": 39
139
  },
140
  {
141
  "epoch": 12.307692307692308,
142
- "grad_norm": 7.704187393188477,
143
  "learning_rate": 1.8518518518518518e-05,
144
- "loss": 0.2962,
145
  "step": 40
146
  },
147
  {
148
  "epoch": 12.923076923076923,
149
- "eval_accuracy": 0.9053140096618357,
150
- "eval_loss": 0.30447185039520264,
151
- "eval_runtime": 4.2886,
152
- "eval_samples_per_second": 241.336,
153
- "eval_steps_per_second": 3.964,
154
  "step": 42
155
  },
156
  {
157
  "epoch": 13.846153846153847,
158
- "eval_accuracy": 0.8714975845410629,
159
- "eval_loss": 0.3914734721183777,
160
- "eval_runtime": 4.4006,
161
- "eval_samples_per_second": 235.195,
162
- "eval_steps_per_second": 3.863,
163
  "step": 45
164
  },
165
  {
166
  "epoch": 14.76923076923077,
167
- "eval_accuracy": 0.893719806763285,
168
- "eval_loss": 0.31650951504707336,
169
- "eval_runtime": 4.327,
170
- "eval_samples_per_second": 239.195,
171
- "eval_steps_per_second": 3.929,
172
  "step": 48
173
  },
174
  {
175
  "epoch": 15.384615384615385,
176
- "grad_norm": 5.901269912719727,
177
  "learning_rate": 9.259259259259259e-06,
178
- "loss": 0.2553,
179
  "step": 50
180
  },
181
  {
182
  "epoch": 16.0,
183
- "eval_accuracy": 0.9082125603864735,
184
- "eval_loss": 0.28225788474082947,
185
- "eval_runtime": 4.4633,
186
- "eval_samples_per_second": 231.89,
187
- "eval_steps_per_second": 3.809,
188
  "step": 52
189
  },
190
  {
191
  "epoch": 16.923076923076923,
192
- "eval_accuracy": 0.8869565217391304,
193
- "eval_loss": 0.3504292070865631,
194
- "eval_runtime": 4.37,
195
- "eval_samples_per_second": 236.841,
196
- "eval_steps_per_second": 3.89,
197
  "step": 55
198
  },
199
  {
200
  "epoch": 17.846153846153847,
201
- "eval_accuracy": 0.8869565217391304,
202
- "eval_loss": 0.36792051792144775,
203
- "eval_runtime": 4.4082,
204
- "eval_samples_per_second": 234.792,
205
- "eval_steps_per_second": 3.856,
206
  "step": 58
207
  },
208
  {
209
  "epoch": 18.46153846153846,
210
- "grad_norm": 7.85857629776001,
211
  "learning_rate": 0.0,
212
- "loss": 0.2601,
213
  "step": 60
214
  },
215
  {
216
  "epoch": 18.46153846153846,
217
- "eval_accuracy": 0.8879227053140096,
218
- "eval_loss": 0.3520191013813019,
219
- "eval_runtime": 4.3424,
220
- "eval_samples_per_second": 238.347,
221
- "eval_steps_per_second": 3.915,
222
  "step": 60
223
  },
224
  {
225
  "epoch": 18.46153846153846,
226
  "step": 60,
227
  "total_flos": 2.9458314315627725e+17,
228
- "train_loss": 0.35900469223658243,
229
- "train_runtime": 212.0852,
230
- "train_samples_per_second": 76.856,
231
- "train_steps_per_second": 0.283
232
  }
233
  ],
234
  "logging_steps": 10,
 
1
  {
2
+ "best_metric": 0.9194139194139194,
3
+ "best_model_checkpoint": "vit-msn-small-corect_deepcleaned_dataset_lateral_flow_ivalidation/checkpoint-39",
4
  "epoch": 18.46153846153846,
5
  "eval_steps": 500,
6
  "global_step": 60,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.9230769230769231,
13
+ "eval_accuracy": 0.7216117216117216,
14
+ "eval_loss": 0.6175123453140259,
15
+ "eval_runtime": 1.1447,
16
+ "eval_samples_per_second": 238.5,
17
+ "eval_steps_per_second": 4.368,
18
  "step": 3
19
  },
20
  {
21
  "epoch": 1.8461538461538463,
22
+ "eval_accuracy": 0.8351648351648352,
23
+ "eval_loss": 0.4141041934490204,
24
+ "eval_runtime": 1.1326,
25
+ "eval_samples_per_second": 241.031,
26
+ "eval_steps_per_second": 4.414,
27
  "step": 6
28
  },
29
  {
30
  "epoch": 2.769230769230769,
31
+ "eval_accuracy": 0.5787545787545788,
32
+ "eval_loss": 0.7407873868942261,
33
+ "eval_runtime": 1.1747,
34
+ "eval_samples_per_second": 232.409,
35
+ "eval_steps_per_second": 4.257,
36
  "step": 9
37
  },
38
  {
39
  "epoch": 3.076923076923077,
40
+ "grad_norm": 70.46142578125,
41
  "learning_rate": 4.62962962962963e-05,
42
+ "loss": 0.5817,
43
  "step": 10
44
  },
45
  {
46
  "epoch": 4.0,
47
+ "eval_accuracy": 0.9157509157509157,
48
+ "eval_loss": 0.27566295862197876,
49
+ "eval_runtime": 1.1638,
50
+ "eval_samples_per_second": 234.573,
51
+ "eval_steps_per_second": 4.296,
52
  "step": 13
53
  },
54
  {
55
  "epoch": 4.923076923076923,
56
+ "eval_accuracy": 0.8791208791208791,
57
+ "eval_loss": 0.28472262620925903,
58
+ "eval_runtime": 1.1571,
59
+ "eval_samples_per_second": 235.942,
60
+ "eval_steps_per_second": 4.321,
61
  "step": 16
62
  },
63
  {
64
  "epoch": 5.846153846153846,
65
+ "eval_accuracy": 0.9010989010989011,
66
+ "eval_loss": 0.2455928921699524,
67
+ "eval_runtime": 1.2196,
68
+ "eval_samples_per_second": 223.848,
69
+ "eval_steps_per_second": 4.1,
70
  "step": 19
71
  },
72
  {
73
  "epoch": 6.153846153846154,
74
+ "grad_norm": 8.08311653137207,
75
  "learning_rate": 3.7037037037037037e-05,
76
+ "loss": 0.3724,
77
  "step": 20
78
  },
79
  {
80
  "epoch": 6.769230769230769,
81
+ "eval_accuracy": 0.9120879120879121,
82
+ "eval_loss": 0.25474727153778076,
83
+ "eval_runtime": 1.1827,
84
+ "eval_samples_per_second": 230.827,
85
+ "eval_steps_per_second": 4.228,
86
  "step": 22
87
  },
88
  {
89
  "epoch": 8.0,
90
+ "eval_accuracy": 0.8827838827838828,
91
+ "eval_loss": 0.3007383942604065,
92
+ "eval_runtime": 1.2369,
93
+ "eval_samples_per_second": 220.714,
94
+ "eval_steps_per_second": 4.042,
95
  "step": 26
96
  },
97
  {
98
  "epoch": 8.923076923076923,
99
+ "eval_accuracy": 0.9010989010989011,
100
+ "eval_loss": 0.3042505383491516,
101
+ "eval_runtime": 1.1883,
102
+ "eval_samples_per_second": 229.74,
103
+ "eval_steps_per_second": 4.208,
104
  "step": 29
105
  },
106
  {
107
  "epoch": 9.23076923076923,
108
+ "grad_norm": 12.493155479431152,
109
  "learning_rate": 2.777777777777778e-05,
110
+ "loss": 0.3155,
111
  "step": 30
112
  },
113
  {
114
  "epoch": 9.846153846153847,
115
+ "eval_accuracy": 0.9047619047619048,
116
+ "eval_loss": 0.2603397071361542,
117
+ "eval_runtime": 1.1963,
118
+ "eval_samples_per_second": 228.207,
119
+ "eval_steps_per_second": 4.18,
120
  "step": 32
121
  },
122
  {
123
  "epoch": 10.76923076923077,
124
+ "eval_accuracy": 0.9157509157509157,
125
+ "eval_loss": 0.24810168147087097,
126
+ "eval_runtime": 1.1361,
127
+ "eval_samples_per_second": 240.289,
128
+ "eval_steps_per_second": 4.401,
129
  "step": 35
130
  },
131
  {
132
  "epoch": 12.0,
133
+ "eval_accuracy": 0.9194139194139194,
134
+ "eval_loss": 0.22294031083583832,
135
+ "eval_runtime": 1.1914,
136
+ "eval_samples_per_second": 229.149,
137
+ "eval_steps_per_second": 4.197,
138
  "step": 39
139
  },
140
  {
141
  "epoch": 12.307692307692308,
142
+ "grad_norm": 8.086904525756836,
143
  "learning_rate": 1.8518518518518518e-05,
144
+ "loss": 0.2844,
145
  "step": 40
146
  },
147
  {
148
  "epoch": 12.923076923076923,
149
+ "eval_accuracy": 0.8791208791208791,
150
+ "eval_loss": 0.3036467432975769,
151
+ "eval_runtime": 1.1286,
152
+ "eval_samples_per_second": 241.895,
153
+ "eval_steps_per_second": 4.43,
154
  "step": 42
155
  },
156
  {
157
  "epoch": 13.846153846153847,
158
+ "eval_accuracy": 0.9084249084249084,
159
+ "eval_loss": 0.2578851580619812,
160
+ "eval_runtime": 1.1539,
161
+ "eval_samples_per_second": 236.595,
162
+ "eval_steps_per_second": 4.333,
163
  "step": 45
164
  },
165
  {
166
  "epoch": 14.76923076923077,
167
+ "eval_accuracy": 0.9157509157509157,
168
+ "eval_loss": 0.2433992624282837,
169
+ "eval_runtime": 1.2067,
170
+ "eval_samples_per_second": 226.24,
171
+ "eval_steps_per_second": 4.144,
172
  "step": 48
173
  },
174
  {
175
  "epoch": 15.384615384615385,
176
+ "grad_norm": 3.2125346660614014,
177
  "learning_rate": 9.259259259259259e-06,
178
+ "loss": 0.2517,
179
  "step": 50
180
  },
181
  {
182
  "epoch": 16.0,
183
+ "eval_accuracy": 0.9047619047619048,
184
+ "eval_loss": 0.27184122800827026,
185
+ "eval_runtime": 1.1306,
186
+ "eval_samples_per_second": 241.471,
187
+ "eval_steps_per_second": 4.423,
188
  "step": 52
189
  },
190
  {
191
  "epoch": 16.923076923076923,
192
+ "eval_accuracy": 0.9120879120879121,
193
+ "eval_loss": 0.25126636028289795,
194
+ "eval_runtime": 1.1542,
195
+ "eval_samples_per_second": 236.531,
196
+ "eval_steps_per_second": 4.332,
197
  "step": 55
198
  },
199
  {
200
  "epoch": 17.846153846153847,
201
+ "eval_accuracy": 0.9120879120879121,
202
+ "eval_loss": 0.25034624338150024,
203
+ "eval_runtime": 1.2382,
204
+ "eval_samples_per_second": 220.484,
205
+ "eval_steps_per_second": 4.038,
206
  "step": 58
207
  },
208
  {
209
  "epoch": 18.46153846153846,
210
+ "grad_norm": 4.7955803871154785,
211
  "learning_rate": 0.0,
212
+ "loss": 0.2468,
213
  "step": 60
214
  },
215
  {
216
  "epoch": 18.46153846153846,
217
+ "eval_accuracy": 0.9120879120879121,
218
+ "eval_loss": 0.24911320209503174,
219
+ "eval_runtime": 1.1404,
220
+ "eval_samples_per_second": 239.4,
221
+ "eval_steps_per_second": 4.385,
222
  "step": 60
223
  },
224
  {
225
  "epoch": 18.46153846153846,
226
  "step": 60,
227
  "total_flos": 2.9458314315627725e+17,
228
+ "train_loss": 0.342086935043335,
229
+ "train_runtime": 153.4118,
230
+ "train_samples_per_second": 106.25,
231
+ "train_steps_per_second": 0.391
232
  }
233
  ],
234
  "logging_steps": 10,