# HTC config that adds the semantic branch on top of the "without-semantic" base config.
_base_ = './htc-without-semantic_r50_fpn_1x_coco.py' |
|
# Model overrides: only the keys listed here are specified by this file; the
# rest of the model definition is expected to come from the `_base_` config.
model = dict(
    # NOTE(review): presumably makes the preprocessor pad the semantic
    # segmentation maps together with the images -- confirm against the
    # data preprocessor implementation.
    data_preprocessor=dict(pad_seg=True),
    roi_head=dict(
        # RoI feature extractor feeding the semantic branch; it reads a single
        # feature map (stride 8) and produces 14x14 RoIAlign outputs.
        semantic_roi_extractor=dict(
            type='SingleRoIExtractor',
            roi_layer=dict(type='RoIAlign', output_size=14, sampling_ratio=0),
            out_channels=256,
            featmap_strides=[8]),
        # Semantic segmentation head added on top of the base RoI head.
        semantic_head=dict(
            type='FusedSemanticHead',
            num_ins=5,
            fusion_level=1,
            # 1 / 8 matches the stride of the feature map used by
            # `semantic_roi_extractor` above.
            seg_scale_factor=1 / 8,
            num_convs=4,
            in_channels=256,
            conv_out_channels=256,
            # NOTE(review): 183 presumably corresponds to the COCO stuff-thing
            # label space -- confirm against the dataset annotations.
            num_classes=183,
            loss_seg=dict(
                type='CrossEntropyLoss', ignore_index=255, loss_weight=0.2))))
# Training data pipeline. Compared with a plain detection pipeline it also
# requests semantic segmentation maps (`with_seg=True`) when loading
# annotations.
train_pipeline = [
    # `{{_base_.backend_args}}` is a config placeholder (not plain Python); it
    # is substituted with the `backend_args` value from the base config when
    # the config file is parsed.
    dict(type='LoadImageFromFile', backend_args={{_base_.backend_args}}),
    dict(
        type='LoadAnnotations', with_bbox=True, with_mask=True, with_seg=True),
    dict(type='Resize', scale=(1333, 800), keep_ratio=True),
    dict(type='RandomFlip', prob=0.5),
    dict(type='PackDetInputs')
]
# Training dataloader overrides: point the dataset at both the image folder
# and the segmentation-map folder, and use the pipeline defined in this file.
train_dataloader = dict(
    dataset=dict(
        # NOTE(review): both prefixes are presumably resolved relative to the
        # dataset's data root set in the base config -- confirm.
        data_prefix=dict(img='train2017/', seg='stuffthingmaps/train2017/'),
        pipeline=train_pipeline))