Training in progress, epoch 11
Browse files- config.json +1 -0
- logs/events.out.tfevents.1738541012.b7e596cebf8e.5776.0 +2 -2
- model.safetensors +1 -1
- trainer_state.json +117 -5
config.json
CHANGED
@@ -45,6 +45,7 @@
|
|
45 |
12
|
46 |
],
|
47 |
"patch_size": 14,
|
|
|
48 |
"qkv_bias": true,
|
49 |
"reshape_hidden_states": true,
|
50 |
"stage_names": [
|
|
|
45 |
12
|
46 |
],
|
47 |
"patch_size": 14,
|
48 |
+
"problem_type": "single_label_classification",
|
49 |
"qkv_bias": true,
|
50 |
"reshape_hidden_states": true,
|
51 |
"stage_names": [
|
logs/events.out.tfevents.1738541012.b7e596cebf8e.5776.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3073f44578b399f9d4ce8fb77dccc21b04a1bf7d062807f0deacedaefd927274
|
3 |
+
size 6535
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 346396816
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d3e256c94cba90f4d2445d12c7ac054cf13b37f8a96e2b2d11d3563898fe880
|
3 |
size 346396816
|
trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "./drive/Shareddrives/CS198-Drones/training_output/dinov2-base_rice-leaf-disease-augmented_t_020225/checkpoint-
|
4 |
-
"epoch":
|
5 |
"eval_steps": 500,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -55,6 +55,118 @@
|
|
55 |
"eval_samples_per_second": 18.689,
|
56 |
"eval_steps_per_second": 0.299,
|
57 |
"step": 750
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
58 |
}
|
59 |
],
|
60 |
"logging_steps": 500,
|
@@ -74,7 +186,7 @@
|
|
74 |
"attributes": {}
|
75 |
}
|
76 |
},
|
77 |
-
"total_flos":
|
78 |
"train_batch_size": 64,
|
79 |
"trial_name": null,
|
80 |
"trial_params": null
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.00931523460894823,
|
3 |
+
"best_model_checkpoint": "./drive/Shareddrives/CS198-Drones/training_output/dinov2-base_rice-leaf-disease-augmented_t_020225/checkpoint-1750",
|
4 |
+
"epoch": 10.0,
|
5 |
"eval_steps": 500,
|
6 |
+
"global_step": 2500,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
55 |
"eval_samples_per_second": 18.689,
|
56 |
"eval_steps_per_second": 0.299,
|
57 |
"step": 750
|
58 |
+
},
|
59 |
+
{
|
60 |
+
"epoch": 4.0,
|
61 |
+
"grad_norm": 11.413514137268066,
|
62 |
+
"learning_rate": 8.148148148148148e-06,
|
63 |
+
"loss": 0.0177,
|
64 |
+
"step": 1000
|
65 |
+
},
|
66 |
+
{
|
67 |
+
"epoch": 4.0,
|
68 |
+
"eval_accuracy": 0.986,
|
69 |
+
"eval_loss": 0.047092683613300323,
|
70 |
+
"eval_runtime": 116.0163,
|
71 |
+
"eval_samples_per_second": 17.239,
|
72 |
+
"eval_steps_per_second": 0.276,
|
73 |
+
"step": 1000
|
74 |
+
},
|
75 |
+
{
|
76 |
+
"epoch": 5.0,
|
77 |
+
"grad_norm": 0.018265413120388985,
|
78 |
+
"learning_rate": 7.4074074074074075e-06,
|
79 |
+
"loss": 0.0101,
|
80 |
+
"step": 1250
|
81 |
+
},
|
82 |
+
{
|
83 |
+
"epoch": 5.0,
|
84 |
+
"eval_accuracy": 0.9945,
|
85 |
+
"eval_loss": 0.016437631100416183,
|
86 |
+
"eval_runtime": 115.0025,
|
87 |
+
"eval_samples_per_second": 17.391,
|
88 |
+
"eval_steps_per_second": 0.278,
|
89 |
+
"step": 1250
|
90 |
+
},
|
91 |
+
{
|
92 |
+
"epoch": 6.0,
|
93 |
+
"grad_norm": 0.26411858201026917,
|
94 |
+
"learning_rate": 6.666666666666667e-06,
|
95 |
+
"loss": 0.008,
|
96 |
+
"step": 1500
|
97 |
+
},
|
98 |
+
{
|
99 |
+
"epoch": 6.0,
|
100 |
+
"eval_accuracy": 0.992,
|
101 |
+
"eval_loss": 0.029763367027044296,
|
102 |
+
"eval_runtime": 116.4617,
|
103 |
+
"eval_samples_per_second": 17.173,
|
104 |
+
"eval_steps_per_second": 0.275,
|
105 |
+
"step": 1500
|
106 |
+
},
|
107 |
+
{
|
108 |
+
"epoch": 7.0,
|
109 |
+
"grad_norm": 0.0010479438351467252,
|
110 |
+
"learning_rate": 5.925925925925926e-06,
|
111 |
+
"loss": 0.0014,
|
112 |
+
"step": 1750
|
113 |
+
},
|
114 |
+
{
|
115 |
+
"epoch": 7.0,
|
116 |
+
"eval_accuracy": 0.9965,
|
117 |
+
"eval_loss": 0.00931523460894823,
|
118 |
+
"eval_runtime": 114.6198,
|
119 |
+
"eval_samples_per_second": 17.449,
|
120 |
+
"eval_steps_per_second": 0.279,
|
121 |
+
"step": 1750
|
122 |
+
},
|
123 |
+
{
|
124 |
+
"epoch": 8.0,
|
125 |
+
"grad_norm": 0.007462013512849808,
|
126 |
+
"learning_rate": 5.185185185185185e-06,
|
127 |
+
"loss": 0.0008,
|
128 |
+
"step": 2000
|
129 |
+
},
|
130 |
+
{
|
131 |
+
"epoch": 8.0,
|
132 |
+
"eval_accuracy": 0.997,
|
133 |
+
"eval_loss": 0.013774478808045387,
|
134 |
+
"eval_runtime": 117.2101,
|
135 |
+
"eval_samples_per_second": 17.063,
|
136 |
+
"eval_steps_per_second": 0.273,
|
137 |
+
"step": 2000
|
138 |
+
},
|
139 |
+
{
|
140 |
+
"epoch": 9.0,
|
141 |
+
"grad_norm": 0.0013718679547309875,
|
142 |
+
"learning_rate": 4.444444444444444e-06,
|
143 |
+
"loss": 0.0007,
|
144 |
+
"step": 2250
|
145 |
+
},
|
146 |
+
{
|
147 |
+
"epoch": 9.0,
|
148 |
+
"eval_accuracy": 0.997,
|
149 |
+
"eval_loss": 0.010827419348061085,
|
150 |
+
"eval_runtime": 115.4895,
|
151 |
+
"eval_samples_per_second": 17.318,
|
152 |
+
"eval_steps_per_second": 0.277,
|
153 |
+
"step": 2250
|
154 |
+
},
|
155 |
+
{
|
156 |
+
"epoch": 10.0,
|
157 |
+
"grad_norm": 0.0020830812864005566,
|
158 |
+
"learning_rate": 3.7037037037037037e-06,
|
159 |
+
"loss": 0.0013,
|
160 |
+
"step": 2500
|
161 |
+
},
|
162 |
+
{
|
163 |
+
"epoch": 10.0,
|
164 |
+
"eval_accuracy": 0.9975,
|
165 |
+
"eval_loss": 0.011723974719643593,
|
166 |
+
"eval_runtime": 116.8921,
|
167 |
+
"eval_samples_per_second": 17.11,
|
168 |
+
"eval_steps_per_second": 0.274,
|
169 |
+
"step": 2500
|
170 |
}
|
171 |
],
|
172 |
"logging_steps": 500,
|
|
|
186 |
"attributes": {}
|
187 |
}
|
188 |
},
|
189 |
+
"total_flos": 1.251325189029888e+19,
|
190 |
"train_batch_size": 64,
|
191 |
"trial_name": null,
|
192 |
"trial_params": null
|