# Robin Chiu
# Add the configs
# a92ae91
# Toy OCR dataset configuration.
#
# Declares two training datasets and one test dataset that share the same
# image directory, then groups them into ``train_list`` and ``test_list``.
# NOTE(review): every top-level name here is presumably exported as a config
# key by the config loader, so no helper variables are introduced -- confirm
# before adding any.

dataset_type = 'OCRDataset'

# All annotation files and images live under this directory.
root = 'tests/data/ocr_toy_dataset'
img_prefix = f'{root}/imgs'

# --- Training set 1: plain-text annotation file -----------------------------
train_anno_file1 = f'{root}/label.txt'
train1 = {
    'type': dataset_type,
    'img_prefix': img_prefix,
    'ann_file': train_anno_file1,
    'loader': {
        'type': 'AnnFileLoader',
        # presumably the number of times the annotation list is repeated
        # -- TODO confirm against the loader implementation
        'repeat': 100,
        'file_format': 'txt',
        'file_storage_backend': 'disk',
        'parser': {
            'type': 'LineStrParser',
            # keys and keys_idx are parallel lists; the separator is a
            # single space.
            'keys': ['filename', 'text'],
            'keys_idx': [0, 1],
            'separator': ' ',
        },
    },
    'pipeline': None,
    'test_mode': False,
}

# --- Training set 2: lmdb annotation file -----------------------------------
train_anno_file2 = f'{root}/label.lmdb'
train2 = {
    'type': dataset_type,
    'img_prefix': img_prefix,
    'ann_file': train_anno_file2,
    'loader': {
        'type': 'AnnFileLoader',
        'repeat': 100,
        'file_format': 'lmdb',
        'file_storage_backend': 'disk',
        'parser': {
            'type': 'LineJsonParser',
            'keys': ['filename', 'text'],
        },
    },
    'pipeline': None,
    'test_mode': False,
}

# --- Test set: same lmdb file as training set 2, no repetition --------------
test_anno_file1 = f'{root}/label.lmdb'
test = {
    'type': dataset_type,
    'img_prefix': img_prefix,
    'ann_file': test_anno_file1,
    'loader': {
        'type': 'AnnFileLoader',
        'repeat': 1,
        'file_format': 'lmdb',
        'file_storage_backend': 'disk',
        # Deliberately a separate dict from train2's parser so that mutating
        # one dataset's settings never leaks into the other.
        'parser': {
            'type': 'LineJsonParser',
            'keys': ['filename', 'text'],
        },
    },
    'pipeline': None,
    'test_mode': True,
}

# Dataset groups referenced by name from elsewhere.
train_list = [train1, train2]
test_list = [test]