# Source: mirror of https://github.com/open-mmlab/mmocr.git (Python, 43 lines, 1.2 KiB)
# Per-channel mean/std passed to the 'NormalizeOCR' step of both pipelines.
# NOTE(review): the values match the widely used ImageNet RGB statistics for
# inputs scaled to [0, 1] -- confirm this is the intended input range.
img_norm_cfg = dict(
    mean=[0.485, 0.456, 0.406],
    std=[0.229, 0.224, 0.225],
)
|
||
|
# Training data pipeline: an ordered list of transform configs, each a dict
# whose 'type' names the transform and whose remaining keys are its arguments.
# (Presumably the steps are applied in list order by the dataset -- confirm
# against the pipeline builder.)
train_pipeline = [
    dict(type='LoadImageFromFile'),
    # Resize to a fixed height of 32 with the width bounded to [32, 160];
    # keep_aspect_ratio=True asks the transform to preserve the aspect ratio.
    dict(
        type='ResizeOCR',
        height=32,
        min_width=32,
        max_width=160,
        keep_aspect_ratio=True,
        width_downsample_ratio=0.25),
    dict(type='ToTensorOCR'),
    # Reuses the module-level normalisation statistics.
    dict(type='NormalizeOCR', **img_norm_cfg),
    # Training metadata includes 'text', which the test pipeline omits.
    dict(
        type='Collect',
        keys=['img'],
        meta_keys=[
            'filename', 'ori_shape', 'resize_shape', 'text', 'valid_ratio'
        ]),
]
|
||
|
# Test data pipeline: loads the image, then wraps the same resize / tensor /
# normalise / collect steps used for training inside 'MultiRotateAugOCR'.
test_pipeline = [
    dict(type='LoadImageFromFile'),
    dict(
        type='MultiRotateAugOCR',
        # Rotation angles handed to the augmentation wrapper; 180 is not
        # listed. (Presumably one augmented sample per angle -- confirm.)
        rotate_degrees=[0, 90, 270],
        transforms=[
            # Same resize settings as the training pipeline.
            dict(
                type='ResizeOCR',
                height=32,
                min_width=32,
                max_width=160,
                keep_aspect_ratio=True,
                width_downsample_ratio=0.25),
            dict(type='ToTensorOCR'),
            # Reuses the module-level normalisation statistics.
            dict(type='NormalizeOCR', **img_norm_cfg),
            # Unlike the training pipeline, 'text' is not collected here.
            dict(
                type='Collect',
                keys=['img'],
                meta_keys=[
                    'filename', 'ori_shape', 'resize_shape', 'valid_ratio'
                ]),
        ])
]
|