# Toy OCR recognition dataset config.
#
# Defines two training dataset entries and one test entry that all read
# images from the same toy-data directory, then groups them into
# `train_list` / `test_list`.
#
# NOTE: only plain values are kept at module level on purpose; every
# top-level name here is a candidate config key for whatever loads this file.

dataset_type = 'OCRDataset'

# Paths are relative (no leading slash), so they resolve against the
# process's working directory.
root = 'tests/data/ocr_toy_dataset'
img_prefix = f'{root}/imgs'

# --- Training entry 1: plain-text annotation file ---------------------------
train_anno_file1 = f'{root}/label.txt'
train1 = dict(
    type=dataset_type,
    img_prefix=img_prefix,
    ann_file=train_anno_file1,
    loader=dict(
        type='AnnFileLoader',
        # NOTE(review): presumably replays the annotation list 100 times so
        # the tiny toy set yields a usable epoch length -- confirm against
        # the loader implementation.
        repeat=100,
        file_format='txt',
        file_storage_backend='disk',
        parser=dict(
            type='LineStrParser',
            # Presumably each line is split on `separator` and the fields at
            # `keys_idx` are mapped onto `keys` in order -- verify against
            # the parser implementation.
            keys=['filename', 'text'],
            keys_idx=[0, 1],
            separator=' ')),
    # No transform pipeline is attached here; it is left as None.
    pipeline=None,
    test_mode=False)

# --- Training entry 2: LMDB annotation file ---------------------------------
train_anno_file2 = f'{root}/label.lmdb'
train2 = dict(
    type=dataset_type,
    img_prefix=img_prefix,
    ann_file=train_anno_file2,
    loader=dict(
        type='AnnFileLoader',
        repeat=100,
        file_format='lmdb',
        file_storage_backend='disk',
        parser=dict(type='LineJsonParser', keys=['filename', 'text'])),
    pipeline=None,
    test_mode=False)

# --- Test entry --------------------------------------------------------------
# Points at the same LMDB path as `train_anno_file2`, but with repeat=1 and
# test_mode=True.
test_anno_file1 = f'{root}/label.lmdb'
test = dict(
    type=dataset_type,
    img_prefix=img_prefix,
    ann_file=test_anno_file1,
    loader=dict(
        type='AnnFileLoader',
        repeat=1,
        file_format='lmdb',
        file_storage_backend='disk',
        parser=dict(type='LineJsonParser', keys=['filename', 'text'])),
    pipeline=None,
    test_mode=True)

# Grouped dataset entries; the lists hold the dict objects defined above
# (not copies).
train_list = [train1, train2]

test_list = [test]
|