File size: 2,369 Bytes
0b4516f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
# Locations used by the preparer configs in this file.
data_root = 'data/sroie'
cache_path = 'data/cache'

# Preparer settings for the SROIE text-detection training split.
train_preparer = {
    # A single archive that supplies both the images and the annotations.
    'obtainer': {
        'type': 'NaiveDataObtainer',
        'cache_path': cache_path,
        'files': [
            {
                'url': ('https://download.openmmlab.com/mmocr/data/sroie/'
                        '0325updated.task1train(626p).zip'),
                'save_name': '0325updated.task1train(626p).zip',
                'md5': '16137490f6865caac75772b9111d348c',
                'content': ['image', 'annotation'],
                # NOTE(review): each pair looks like
                # [path inside the extracted archive, destination folder];
                # confirm against NaiveDataObtainer.
                'mapping': [
                    [
                        '0325updated/0325updated.task1train(626p)/*.jpg',
                        'textdet_imgs/train',
                    ],
                    [
                        '0325updated/0325updated.task1train(626p)/*.txt',
                        'annotations/train',
                    ],
                ],
            },
        ],
    },
    'gatherer': {
        'type': 'PairGatherer',
        'img_suffixes': ['.jpg'],
        # [regex pattern, replacement template]: turns a name such as
        # "X<digits>.jpg" (extension in any letter case) into
        # "X<digits>.txt". Presumably applied via re.sub by PairGatherer.
        'rule': [r'X(\d+)\.([jJ][pP][gG])', r'X\1.txt'],
    },
    # 'utf-8-sig' is the UTF-8 codec variant that drops a leading BOM.
    'parser': {'type': 'SROIETextDetAnnParser', 'encoding': 'utf-8-sig'},
    'packer': {'type': 'TextDetPacker'},
    'dumper': {'type': 'JsonDumper'},
}

# Preparer settings for the SROIE text-detection test split. Unlike the
# training split, images and annotations come from two separate archives.
test_preparer = {
    'obtainer': {
        'type': 'NaiveDataObtainer',
        'cache_path': cache_path,
        'files': [
            # Archive providing the test images.
            {
                'url': ('https://download.openmmlab.com/mmocr/data/sroie/'
                        'task1&2_test(361p).zip'),
                'save_name': 'task1&2_test(361p).zip',
                'md5': '1bde54705db0995c57a6e34cce437fea',
                'content': ['image'],
                # NOTE(review): pair looks like
                # [path inside the extracted archive, destination folder];
                # confirm against NaiveDataObtainer.
                'mapping': [
                    [
                        'task1&2_test(361p)/fulltext_test(361p)',
                        'textdet_imgs/test',
                    ],
                ],
            },
            # Archive providing the test annotations.
            {
                'url': ('https://download.openmmlab.com/mmocr/data/sroie/'
                        'text.zip'),
                'save_name': 'text.zip',
                'md5': '8c534653f252ff4d3943fa27a956a74b',
                'content': ['annotation'],
                'mapping': [['text', 'annotations/test']],
            },
        ],
    },
    'gatherer': {
        'type': 'PairGatherer',
        'img_suffixes': ['.jpg'],
        # [regex pattern, replacement template]: turns a name such as
        # "X<digits>.jpg" (extension in any letter case) into
        # "X<digits>.txt". Presumably applied via re.sub by PairGatherer.
        'rule': [r'X(\d+)\.([jJ][pP][gG])', r'X\1.txt'],
    },
    # 'utf-8-sig' is the UTF-8 codec variant that drops a leading BOM.
    'parser': {'type': 'SROIETextDetAnnParser', 'encoding': 'utf-8-sig'},
    'packer': {'type': 'TextDetPacker'},
    'dumper': {'type': 'JsonDumper'},
}
# Entries named here match the archive top-level folders and the
# 'annotations' destination root used by the mappings in this file.
# NOTE(review): presumably these are removed once preparation finishes;
# confirm against the dataset preparer.
delete = [
    'text',
    'task1&2_test(361p)',
    '0325updated',
    'annotations',
]
# Generator type for the text-detection dataset config.
config_generator = {'type': 'TextDetConfigGenerator'}