hdoi5324 committed on
Commit
c678ba2
·
verified ·
1 Parent(s): 32806c8

Initial model

Browse files
config.yaml ADDED
@@ -0,0 +1,415 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ AUG:
2
+ LABELED_INCLUDE_RANDOM_ERASING: true
3
+ LABELED_MIC_AUG: false
4
+ MIC_BLOCK_SIZE: 32
5
+ MIC_RATIO: 0.5
6
+ MOSAIC: false
7
+ MOSAIC_P: 0.25
8
+ UNLABELED_INCLUDE_RANDOM_ERASING: true
9
+ UNLABELED_MIC_AUG: false
10
+ WEAK_INCLUDES_MULTISCALE: true
11
+ CUDNN_BENCHMARK: false
12
+ DATALOADER:
13
+ ASPECT_RATIO_GROUPING: true
14
+ FILTER_EMPTY_ANNOTATIONS: true
15
+ FILTER_UNLABELED_EMPTY_ANNOTATIONS: false
16
+ NUM_WORKERS: 4
17
+ REPEAT_SQRT: true
18
+ REPEAT_THRESHOLD: 0.0
19
+ SAMPLER_TRAIN: TrainingSampler
20
+ DATASETS:
21
+ BATCH_CONTENTS:
22
+ - labeled_strong
23
+ BATCH_RATIOS:
24
+ - 1
25
+ PRECOMPUTED_PROPOSAL_TOPK_TEST: 1000
26
+ PRECOMPUTED_PROPOSAL_TOPK_TRAIN: 2000
27
+ PROPOSAL_FILES_TEST: []
28
+ PROPOSAL_FILES_TRAIN: []
29
+ TEST:
30
+ - sq_hand_test15v2
31
+ TRAIN:
32
+ - nudi_handfish_auv_v1_train
33
+ - trench_handfish_auv_v1_train
34
+ - sq_hand_train85_n200v2
35
+ TRAIN_SIZE: 10000000.0
36
+ UNLABELED: []
37
+ DOMAIN_ADAPT:
38
+ ALIGN:
39
+ IMG_DA_ENABLED: false
40
+ IMG_DA_HIDDEN_DIMS:
41
+ - 256
42
+ IMG_DA_IMPL: ours
43
+ IMG_DA_INPUT_DIM: 256
44
+ IMG_DA_LAYER: p2
45
+ IMG_DA_WEIGHT: 0.01
46
+ INS_DA_ENABLED: false
47
+ INS_DA_HIDDEN_DIMS:
48
+ - 1024
49
+ INS_DA_INPUT_DIM: 1024
50
+ INS_DA_WEIGHT: 0.01
51
+ SADA_COS_WEIGHT: 0.1
52
+ SADA_ENABLED: false
53
+ SADA_IMG_GRL_WEIGHT: 0.01
54
+ SADA_INS_GRL_WEIGHT: 0.1
55
+ CLS_LOSS_TYPE: CE
56
+ DISTILL:
57
+ CLS_TMP: 1.0
58
+ DISTILLER_NAME: ALDIDistiller
59
+ HARD_OBJ_ENABLED: false
60
+ HARD_ROIH_CLS_ENABLED: false
61
+ HARD_ROIH_REG_ENABLED: false
62
+ HARD_RPN_REG_ENABLED: false
63
+ OBJ_ENABLED: false
64
+ OBJ_TMP: 1.0
65
+ ROIH_CLS_ENABLED: false
66
+ ROIH_REG_ENABLED: false
67
+ RPN_REG_ENABLED: false
68
+ LOSSES:
69
+ QUALITY_LOSS_WEIGHT_ENABLED: false
70
+ TEACHER:
71
+ ENABLED: false
72
+ PSEUDO_LABEL_METHOD: thresholding
73
+ THRESHOLD: 0.8
74
+ EMA:
75
+ ALPHA: 0.9996
76
+ ENABLED: true
77
+ LOAD_FROM_EMA_ON_START: true
78
+ GLOBAL:
79
+ HACK: 1.0
80
+ GRCNN:
81
+ EFL: false
82
+ EFL_LAMBDA:
83
+ - 0.5
84
+ - 0.5
85
+ LEARN_ANCHORS_LABELED: false
86
+ LEARN_ANCHORS_UNLABELED: false
87
+ MODEL_TYPE: GAUSSIAN
88
+ TAU:
89
+ - 0.5
90
+ - 0.5
91
+ INPUT:
92
+ CROP:
93
+ ENABLED: false
94
+ SIZE:
95
+ - 0.9
96
+ - 0.9
97
+ TYPE: relative_range
98
+ FORMAT: BGR
99
+ MASK_FORMAT: polygon
100
+ MAX_SIZE_TEST: 2048
101
+ MAX_SIZE_TRAIN: 2048
102
+ MIN_SIZE_TEST: 1024
103
+ MIN_SIZE_TRAIN:
104
+ - 800
105
+ - 832
106
+ - 864
107
+ - 896
108
+ - 928
109
+ - 960
110
+ - 992
111
+ - 1024
112
+ MIN_SIZE_TRAIN_SAMPLING: choice
113
+ RANDOM_FLIP: horizontal
114
+ LOGGING:
115
+ API_TOKEN: ''  # REDACTED: a Neptune API token was committed here in plain text; revoke it and supply the token at runtime instead of storing it in the config
116
+ GROUP_TAGS: HI2SQ,H1
117
+ ITERS: 100
118
+ PROJECT: ACFRmarine/ALDI-DOAD
119
+ TAGS: Base,RCCN-FPN,StrongAugEMA
120
+ MODEL:
121
+ ANCHOR_GENERATOR:
122
+ ANGLES:
123
+ - - -90
124
+ - 0
125
+ - 90
126
+ ASPECT_RATIOS:
127
+ - - 0.5
128
+ - 1.0
129
+ - 2.0
130
+ NAME: DefaultAnchorGenerator
131
+ OFFSET: 0.0
132
+ SIZES:
133
+ - - 32
134
+ - - 64
135
+ - - 128
136
+ - - 256
137
+ - - 512
138
+ BACKBONE:
139
+ FREEZE_AT: 2
140
+ NAME: build_resnet_fpn_backbone
141
+ DEVICE: cuda
142
+ FIND_UNUSED_PARAMETERS: false
143
+ FPN:
144
+ FUSE_TYPE: sum
145
+ IN_FEATURES:
146
+ - res2
147
+ - res3
148
+ - res4
149
+ - res5
150
+ NORM: ''
151
+ OUT_CHANNELS: 256
152
+ KEYPOINT_ON: false
153
+ LOAD_PROPOSALS: false
154
+ MASK_ON: false
155
+ META_ARCHITECTURE: GeneralizedRCNN
156
+ PANOPTIC_FPN:
157
+ COMBINE:
158
+ ENABLED: true
159
+ INSTANCES_CONFIDENCE_THRESH: 0.5
160
+ OVERLAP_THRESH: 0.5
161
+ STUFF_AREA_LIMIT: 4096
162
+ INSTANCE_LOSS_WEIGHT: 1.0
163
+ PIXEL_MEAN:
164
+ - 103.53
165
+ - 116.28
166
+ - 123.675
167
+ PIXEL_STD:
168
+ - 1.0
169
+ - 1.0
170
+ - 1.0
171
+ PROPOSAL_GENERATOR:
172
+ MIN_SIZE: 0
173
+ NAME: RPN
174
+ RESNETS:
175
+ DEFORM_MODULATED: false
176
+ DEFORM_NUM_GROUPS: 1
177
+ DEFORM_ON_PER_STAGE:
178
+ - false
179
+ - false
180
+ - false
181
+ - false
182
+ DEPTH: 50
183
+ NORM: FrozenBN
184
+ NUM_GROUPS: 1
185
+ OUT_FEATURES:
186
+ - res2
187
+ - res3
188
+ - res4
189
+ - res5
190
+ RES2_OUT_CHANNELS: 256
191
+ RES5_DILATION: 1
192
+ STEM_OUT_CHANNELS: 64
193
+ STRIDE_IN_1X1: true
194
+ WIDTH_PER_GROUP: 64
195
+ RETINANET:
196
+ BBOX_REG_LOSS_TYPE: smooth_l1
197
+ BBOX_REG_WEIGHTS: &id002
198
+ - 1.0
199
+ - 1.0
200
+ - 1.0
201
+ - 1.0
202
+ FOCAL_LOSS_ALPHA: 0.25
203
+ FOCAL_LOSS_GAMMA: 2.0
204
+ IN_FEATURES:
205
+ - p3
206
+ - p4
207
+ - p5
208
+ - p6
209
+ - p7
210
+ IOU_LABELS:
211
+ - 0
212
+ - -1
213
+ - 1
214
+ IOU_THRESHOLDS:
215
+ - 0.4
216
+ - 0.5
217
+ NMS_THRESH_TEST: 0.5
218
+ NORM: ''
219
+ NUM_CLASSES: 80
220
+ NUM_CONVS: 4
221
+ PRIOR_PROB: 0.01
222
+ SCORE_THRESH_TEST: 0.05
223
+ SMOOTH_L1_LOSS_BETA: 0.1
224
+ TOPK_CANDIDATES_TEST: 1000
225
+ ROI_BOX_CASCADE_HEAD:
226
+ BBOX_REG_WEIGHTS:
227
+ - &id001
228
+ - 10.0
229
+ - 10.0
230
+ - 5.0
231
+ - 5.0
232
+ - - 20.0
233
+ - 20.0
234
+ - 10.0
235
+ - 10.0
236
+ - - 30.0
237
+ - 30.0
238
+ - 15.0
239
+ - 15.0
240
+ IOUS:
241
+ - 0.5
242
+ - 0.6
243
+ - 0.7
244
+ ROI_BOX_HEAD:
245
+ BBOX_REG_LOSS_TYPE: smooth_l1
246
+ BBOX_REG_LOSS_WEIGHT: 1.0
247
+ BBOX_REG_WEIGHTS: *id001
248
+ CLS_AGNOSTIC_BBOX_REG: false
249
+ CONV_DIM: 256
250
+ FC_DIM: 1024
251
+ FED_LOSS_FREQ_WEIGHT_POWER: 0.5
252
+ FED_LOSS_NUM_CLASSES: 50
253
+ NAME: FastRCNNConvFCHead
254
+ NORM: ''
255
+ NUM_CONV: 0
256
+ NUM_FC: 2
257
+ POOLER_RESOLUTION: 7
258
+ POOLER_SAMPLING_RATIO: 0
259
+ POOLER_TYPE: ROIAlignV2
260
+ SMOOTH_L1_BETA: 0.0
261
+ TRAIN_ON_PRED_BOXES: false
262
+ USE_FED_LOSS: false
263
+ USE_SIGMOID_CE: false
264
+ ROI_HEADS:
265
+ BATCH_SIZE_PER_IMAGE: 512
266
+ IN_FEATURES:
267
+ - p2
268
+ - p3
269
+ - p4
270
+ - p5
271
+ IOU_LABELS:
272
+ - 0
273
+ - 1
274
+ IOU_THRESHOLDS:
275
+ - 0.5
276
+ NAME: StandardROIHeads
277
+ NMS_THRESH_TEST: 0.5
278
+ NUM_CLASSES: 1
279
+ POSITIVE_FRACTION: 0.25
280
+ PROPOSAL_APPEND_GT: true
281
+ SCORE_THRESH_TEST: 0.05
282
+ ROI_KEYPOINT_HEAD:
283
+ CONV_DIMS:
284
+ - 512
285
+ - 512
286
+ - 512
287
+ - 512
288
+ - 512
289
+ - 512
290
+ - 512
291
+ - 512
292
+ LOSS_WEIGHT: 1.0
293
+ MIN_KEYPOINTS_PER_IMAGE: 1
294
+ NAME: KRCNNConvDeconvUpsampleHead
295
+ NORMALIZE_LOSS_BY_VISIBLE_KEYPOINTS: true
296
+ NUM_KEYPOINTS: 17
297
+ POOLER_RESOLUTION: 14
298
+ POOLER_SAMPLING_RATIO: 0
299
+ POOLER_TYPE: ROIAlignV2
300
+ ROI_MASK_HEAD:
301
+ CLS_AGNOSTIC_MASK: false
302
+ CONV_DIM: 256
303
+ NAME: MaskRCNNConvUpsampleHead
304
+ NORM: ''
305
+ NUM_CONV: 4
306
+ POOLER_RESOLUTION: 14
307
+ POOLER_SAMPLING_RATIO: 0
308
+ POOLER_TYPE: ROIAlignV2
309
+ RPN:
310
+ BATCH_SIZE_PER_IMAGE: 256
311
+ BBOX_REG_LOSS_TYPE: smooth_l1
312
+ BBOX_REG_LOSS_WEIGHT: 1.0
313
+ BBOX_REG_WEIGHTS: *id002
314
+ BOUNDARY_THRESH: -1
315
+ CONV_DIMS:
316
+ - -1
317
+ HEAD_NAME: StandardRPNHead
318
+ IN_FEATURES:
319
+ - p2
320
+ - p3
321
+ - p4
322
+ - p5
323
+ - p6
324
+ IOU_LABELS:
325
+ - 0
326
+ - -1
327
+ - 1
328
+ IOU_THRESHOLDS:
329
+ - 0.3
330
+ - 0.7
331
+ LOSS_WEIGHT: 1.0
332
+ NMS_THRESH: 0.7
333
+ POSITIVE_FRACTION: 0.5
334
+ POST_NMS_TOPK_TEST: 1000
335
+ POST_NMS_TOPK_TRAIN: 1000
336
+ PRE_NMS_TOPK_TEST: 1000
337
+ PRE_NMS_TOPK_TRAIN: 2000
338
+ SMOOTH_L1_BETA: 0.0
339
+ SEM_SEG_HEAD:
340
+ COMMON_STRIDE: 4
341
+ CONVS_DIM: 128
342
+ IGNORE_VALUE: 255
343
+ IN_FEATURES:
344
+ - p2
345
+ - p3
346
+ - p4
347
+ - p5
348
+ LOSS_WEIGHT: 1.0
349
+ NAME: SemSegFPNHead
350
+ NORM: GN
351
+ NUM_CLASSES: 54
352
+ UMT:
353
+ ENABLED: false
354
+ WEIGHTS: models/model_final_f10217.pkl
355
+ OUTPUT_DIR: outputs/handfishinf/base_inf_sqall/
356
+ SEED: -1
357
+ SOLVER:
358
+ AMP:
359
+ ENABLED: true
360
+ BACKWARD_AT_END: false
361
+ BASE_LR: 0.00125
362
+ BASE_LR_END: 0.0
363
+ BIAS_LR_FACTOR: 1.0
364
+ CHECKPOINT_PERIOD: 2000
365
+ CLIP_GRADIENTS:
366
+ CLIP_TYPE: value
367
+ CLIP_VALUE: 1.0
368
+ ENABLED: false
369
+ NORM_TYPE: 2.0
370
+ GAMMA: 0.1
371
+ IMS_PER_BATCH: 1
372
+ IMS_PER_GPU: 1
373
+ LR_SCHEDULER_NAME: WarmupMultiStepLR
374
+ MAX_ITER: 9000
375
+ MOMENTUM: 0.9
376
+ NESTEROV: false
377
+ NUM_DECAYS: 3
378
+ OPTIMIZER: SGD
379
+ REFERENCE_WORLD_SIZE: 0
380
+ RESCALE_INTERVAL: false
381
+ STEPS:
382
+ - 6000
383
+ - 8000
384
+ WARMUP_FACTOR: 0.01
385
+ WARMUP_ITERS: 100
386
+ WARMUP_METHOD: linear
387
+ WEIGHT_DECAY: 0.0001
388
+ WEIGHT_DECAY_BIAS: null
389
+ WEIGHT_DECAY_NORM: 0.0
390
+ TEST:
391
+ AUG:
392
+ ENABLED: false
393
+ FLIP: true
394
+ MAX_SIZE: 4000
395
+ MIN_SIZES:
396
+ - 400
397
+ - 500
398
+ - 600
399
+ - 700
400
+ - 800
401
+ - 900
402
+ - 1000
403
+ - 1100
404
+ - 1200
405
+ DETECTIONS_PER_IMAGE: 100
406
+ EVAL_PERIOD: 500
407
+ EXPECTED_RESULTS: []
408
+ KEYPOINT_OKS_SIGMAS: []
409
+ PRECISE_BN:
410
+ ENABLED: false
411
+ NUM_ITER: 200
412
+ VERSION: 2
413
+ VIS_PERIOD: 0
414
+ VIT:
415
+ USE_ACT_CHECKPOINT: true
events.out.tfevents.1729832142.nudibranch.1796866.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c3090fff5e5f34e109f6746bb40c48de93daad6f87f4fcb7c3274e1ecefdd5e
3
+ size 440680
model_final.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd1451d481796aa199d33ba8583f49e1a8eaaee01824ceac3107d8dbb67fc9f8
3
+ size 495740870