OckerGui commited on
Commit
f6f3b29
·
1 Parent(s): afa9c5d

Model save

Browse files
all_results.json CHANGED
@@ -1,11 +1,11 @@
1
  {
2
  "epoch": 7.02,
3
- "eval_accuracy": 0.44,
4
- "eval_loss": 0.9982941150665283,
5
- "eval_runtime": 16.8527,
6
  "eval_samples": 6,
7
- "eval_samples_per_second": 1.483,
8
- "eval_steps_per_second": 0.178,
9
  "total_flos": 2.208046144034046e+18,
10
  "train_loss": 0.6113187122344971,
11
  "train_runtime": 861.0964,
 
1
  {
2
  "epoch": 7.02,
3
+ "eval_accuracy": 0.5714285714285714,
4
+ "eval_loss": 0.9015251398086548,
5
+ "eval_runtime": 3.5127,
6
  "eval_samples": 6,
7
+ "eval_samples_per_second": 5.978,
8
+ "eval_steps_per_second": 0.569,
9
  "total_flos": 2.208046144034046e+18,
10
  "train_loss": 0.6113187122344971,
11
  "train_runtime": 861.0964,
runs/Oct15_02-59-37_226fb5eed268/events.out.tfevents.1697339652.226fb5eed268.363.8 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:56efc207b104c2115f9bf9fc4ebf506611606cd59d05f1aadfc57f3b85de3dc3
3
- size 734
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1aba308d4d6a03ef1a2ee44596b54cdeb05e837b56a0b046bb868c942280780e
3
+ size 1057
test_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 7.02,
3
+ "eval_accuracy": 0.5714285714285714,
4
+ "eval_loss": 0.9015251398086548,
5
+ "eval_runtime": 3.5127,
6
+ "eval_samples_per_second": 5.978,
7
+ "eval_steps_per_second": 0.569
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,214 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.44,
3
+ "best_model_checkpoint": "videomae-base-finetuned-SSBD/checkpoint-21",
4
+ "epoch": 7.02,
5
+ "global_step": 150,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.07,
12
+ "learning_rate": 3.3333333333333335e-05,
13
+ "loss": 1.0927,
14
+ "step": 10
15
+ },
16
+ {
17
+ "epoch": 0.13,
18
+ "learning_rate": 4.814814814814815e-05,
19
+ "loss": 1.1764,
20
+ "step": 20
21
+ },
22
+ {
23
+ "epoch": 0.14,
24
+ "eval_accuracy": 0.44,
25
+ "eval_loss": 0.9982941150665283,
26
+ "eval_runtime": 22.6723,
27
+ "eval_samples_per_second": 1.103,
28
+ "eval_steps_per_second": 0.132,
29
+ "step": 21
30
+ },
31
+ {
32
+ "epoch": 1.06,
33
+ "learning_rate": 4.4444444444444447e-05,
34
+ "loss": 0.9538,
35
+ "step": 30
36
+ },
37
+ {
38
+ "epoch": 1.13,
39
+ "learning_rate": 4.074074074074074e-05,
40
+ "loss": 1.2156,
41
+ "step": 40
42
+ },
43
+ {
44
+ "epoch": 1.14,
45
+ "eval_accuracy": 0.4,
46
+ "eval_loss": 1.1047239303588867,
47
+ "eval_runtime": 17.0623,
48
+ "eval_samples_per_second": 1.465,
49
+ "eval_steps_per_second": 0.176,
50
+ "step": 42
51
+ },
52
+ {
53
+ "epoch": 2.05,
54
+ "learning_rate": 3.7037037037037037e-05,
55
+ "loss": 0.7382,
56
+ "step": 50
57
+ },
58
+ {
59
+ "epoch": 2.12,
60
+ "learning_rate": 3.3333333333333335e-05,
61
+ "loss": 1.0214,
62
+ "step": 60
63
+ },
64
+ {
65
+ "epoch": 2.14,
66
+ "eval_accuracy": 0.2,
67
+ "eval_loss": 1.2947560548782349,
68
+ "eval_runtime": 16.4433,
69
+ "eval_samples_per_second": 1.52,
70
+ "eval_steps_per_second": 0.182,
71
+ "step": 63
72
+ },
73
+ {
74
+ "epoch": 3.05,
75
+ "learning_rate": 2.962962962962963e-05,
76
+ "loss": 0.8333,
77
+ "step": 70
78
+ },
79
+ {
80
+ "epoch": 3.11,
81
+ "learning_rate": 2.5925925925925925e-05,
82
+ "loss": 0.5585,
83
+ "step": 80
84
+ },
85
+ {
86
+ "epoch": 3.14,
87
+ "eval_accuracy": 0.44,
88
+ "eval_loss": 2.0399672985076904,
89
+ "eval_runtime": 16.7172,
90
+ "eval_samples_per_second": 1.495,
91
+ "eval_steps_per_second": 0.179,
92
+ "step": 84
93
+ },
94
+ {
95
+ "epoch": 4.04,
96
+ "learning_rate": 2.2222222222222223e-05,
97
+ "loss": 0.5306,
98
+ "step": 90
99
+ },
100
+ {
101
+ "epoch": 4.11,
102
+ "learning_rate": 1.8518518518518518e-05,
103
+ "loss": 0.3809,
104
+ "step": 100
105
+ },
106
+ {
107
+ "epoch": 4.14,
108
+ "eval_accuracy": 0.4,
109
+ "eval_loss": 2.2226576805114746,
110
+ "eval_runtime": 16.8941,
111
+ "eval_samples_per_second": 1.48,
112
+ "eval_steps_per_second": 0.178,
113
+ "step": 105
114
+ },
115
+ {
116
+ "epoch": 5.03,
117
+ "learning_rate": 1.4814814814814815e-05,
118
+ "loss": 0.2621,
119
+ "step": 110
120
+ },
121
+ {
122
+ "epoch": 5.1,
123
+ "learning_rate": 1.1111111111111112e-05,
124
+ "loss": 0.1665,
125
+ "step": 120
126
+ },
127
+ {
128
+ "epoch": 5.14,
129
+ "eval_accuracy": 0.12,
130
+ "eval_loss": 2.2652955055236816,
131
+ "eval_runtime": 16.6771,
132
+ "eval_samples_per_second": 1.499,
133
+ "eval_steps_per_second": 0.18,
134
+ "step": 126
135
+ },
136
+ {
137
+ "epoch": 6.03,
138
+ "learning_rate": 7.4074074074074075e-06,
139
+ "loss": 0.1161,
140
+ "step": 130
141
+ },
142
+ {
143
+ "epoch": 6.09,
144
+ "learning_rate": 3.7037037037037037e-06,
145
+ "loss": 0.0736,
146
+ "step": 140
147
+ },
148
+ {
149
+ "epoch": 6.14,
150
+ "eval_accuracy": 0.24,
151
+ "eval_loss": 2.824446201324463,
152
+ "eval_runtime": 17.0232,
153
+ "eval_samples_per_second": 1.469,
154
+ "eval_steps_per_second": 0.176,
155
+ "step": 147
156
+ },
157
+ {
158
+ "epoch": 7.02,
159
+ "learning_rate": 0.0,
160
+ "loss": 0.0501,
161
+ "step": 150
162
+ },
163
+ {
164
+ "epoch": 7.02,
165
+ "eval_accuracy": 0.2,
166
+ "eval_loss": 2.841770887374878,
167
+ "eval_runtime": 16.8793,
168
+ "eval_samples_per_second": 1.481,
169
+ "eval_steps_per_second": 0.178,
170
+ "step": 150
171
+ },
172
+ {
173
+ "epoch": 7.02,
174
+ "step": 150,
175
+ "total_flos": 2.208046144034046e+18,
176
+ "train_loss": 0.6113187122344971,
177
+ "train_runtime": 861.0964,
178
+ "train_samples_per_second": 2.09,
179
+ "train_steps_per_second": 0.174
180
+ },
181
+ {
182
+ "epoch": 7.02,
183
+ "eval_accuracy": 0.5714285714285714,
184
+ "eval_loss": 0.9015253186225891,
185
+ "eval_runtime": 7.2806,
186
+ "eval_samples_per_second": 2.884,
187
+ "eval_steps_per_second": 0.275,
188
+ "step": 150
189
+ },
190
+ {
191
+ "epoch": 7.02,
192
+ "eval_accuracy": 0.44,
193
+ "eval_loss": 0.9982941150665283,
194
+ "eval_runtime": 16.8527,
195
+ "eval_samples_per_second": 1.483,
196
+ "eval_steps_per_second": 0.178,
197
+ "step": 150
198
+ },
199
+ {
200
+ "epoch": 7.02,
201
+ "eval_accuracy": 0.5714285714285714,
202
+ "eval_loss": 0.9015251398086548,
203
+ "eval_runtime": 3.5127,
204
+ "eval_samples_per_second": 5.978,
205
+ "eval_steps_per_second": 0.569,
206
+ "step": 150
207
+ }
208
+ ],
209
+ "max_steps": 150,
210
+ "num_train_epochs": 9223372036854775807,
211
+ "total_flos": 2.208046144034046e+18,
212
+ "trial_name": null,
213
+ "trial_params": null
214
+ }