diff --git a/dataset_zoo/icdar2015/textrecog.py b/dataset_zoo/icdar2015/textrecog.py index eac3ad82..df76e4b3 100644 --- a/dataset_zoo/icdar2015/textrecog.py +++ b/dataset_zoo/icdar2015/textrecog.py @@ -1,3 +1,6 @@ +# This configuration prepares the ICDAR15 1811 and 2077 +# versions, and uses the ICDAR15 2077 version by default. +# Read https://arxiv.org/pdf/1904.01906.pdf for more info. data_root = 'data/icdar2015' cache_path = 'data/cache' @@ -30,7 +33,18 @@ data_obtainer = dict( md5='d7a71585f4cc69f89edbe534e7706d5d', split=['test'], content=['annotation'], - mapping=[['ic15_textrecog_test_gt.txt', 'annotations/test.txt']]) + mapping=[['ic15_textrecog_test_gt.txt', 'annotations/test.txt']]), + # 3. The 1811 version discards non-alphanumeric character images and + # some extremely rotated, perspective-shifted, and curved images for + # evaluation. + dict( + url='https://download.openmmlab.com/mmocr/data/1.x/recog/' + 'icdar_2015/textrecog_test_1811.json', + save_name='textrecog_test_1811.json', + md5='8d218ef1c37540ea959e22eeabc79ae4', + split=['test'], + content=['annotation'], + ), ]) data_converter = dict( @@ -40,3 +54,11 @@ data_converter = dict( gatherer=dict(type='mono_gather', mapping="f'{split}.txt'"), parser=dict(type='ICDARTxtTextRecogAnnParser', encoding='utf-8-sig'), dumper=dict(type='JsonDumper')) + +config_generator = dict( + type='TextRecogConfigGenerator', + data_root=data_root, + test_anns=[ + dict(ann_file='textrecog_test.json'), + dict(dataset_postfix='1811', ann_file='textrecog_test_1811.json') + ])