# Dataset definitions for the OCR toy dataset stored under
# ``tests/data/ocr_toy_dataset``.
#
# The module exposes two training dataset configs (``train1`` reads a plain
# text annotation file, ``train2`` reads an LMDB annotation file) and one test
# dataset config (``test``), plus the ``train_list`` / ``test_list``
# collections that group them.

dataset_type = 'OCRDataset'

# All paths below are derived from this root directory.
root = 'tests/data/ocr_toy_dataset'
img_prefix = f'{root}/imgs'

# --- Training set 1: txt annotations parsed line by line -------------------
train_anno_file1 = f'{root}/label.txt'
train1 = dict(
    type=dataset_type,
    img_prefix=img_prefix,
    ann_file=train_anno_file1,
    loader=dict(
        type='AnnFileLoader',
        repeat=100,
        file_format='txt',
        file_storage_backend='disk',
        # Each annotation line is split on a single space; field 0 is
        # stored under 'filename' and field 1 under 'text'.
        parser=dict(
            type='LineStrParser',
            keys=['filename', 'text'],
            keys_idx=[0, 1],
            separator=' ')),
    pipeline=None,
    test_mode=False)

# --- Training set 2: LMDB annotations with JSON records --------------------
train_anno_file2 = f'{root}/label.lmdb'
train2 = dict(
    type=dataset_type,
    img_prefix=img_prefix,
    ann_file=train_anno_file2,
    loader=dict(
        type='AnnFileLoader',
        repeat=100,
        file_format='lmdb',
        file_storage_backend='disk',
        parser=dict(type='LineJsonParser', keys=['filename', 'text'])),
    pipeline=None,
    test_mode=False)

# --- Test set ---------------------------------------------------------------
# NOTE: this resolves to the same path as ``train_anno_file2``.
test_anno_file1 = f'{root}/label.lmdb'
test = dict(
    type=dataset_type,
    img_prefix=img_prefix,
    ann_file=test_anno_file1,
    loader=dict(
        type='AnnFileLoader',
        repeat=1,
        file_format='lmdb',
        file_storage_backend='disk',
        parser=dict(type='LineJsonParser', keys=['filename', 'text'])),
    pipeline=None,
    test_mode=True)

train_list = [train1, train2]

test_list = [test]