mmocr/configs/_base_/recog_pipelines/nrtr_pipeline.py

# Shared ``mean``/``std`` keyword arguments, unpacked into every
# ``NormalizeOCR`` step below so both pipelines normalize identically.
img_norm_cfg = {
    'mean': [0.485, 0.456, 0.406],
    'std': [0.229, 0.224, 0.225],
}

# Training pipeline; the steps are listed in the order they are declared:
# load -> resize -> to tensor -> normalize -> collect.
train_pipeline = [
    {'type': 'LoadImageFromFile'},
    {
        'type': 'ResizeOCR',
        'height': 32,
        'min_width': 32,
        'max_width': 160,
        'keep_aspect_ratio': True,
        'width_downsample_ratio': 0.25,
    },
    {'type': 'ToTensorOCR'},
    {'type': 'NormalizeOCR', **img_norm_cfg},
    {
        'type': 'Collect',
        'keys': ['img'],
        # Unlike the test pipeline, the training meta keys include 'text'.
        'meta_keys': [
            'filename',
            'ori_shape',
            'resize_shape',
            'text',
            'valid_ratio',
        ],
    },
]

# Test pipeline; the resize/tensor/normalize/collect steps are nested as the
# ``transforms`` of a single ``MultiRotateAugOCR`` step.
test_pipeline = [
    {'type': 'LoadImageFromFile'},
    {
        'type': 'MultiRotateAugOCR',
        'rotate_degrees': [0, 90, 270],
        'transforms': [
            {
                'type': 'ResizeOCR',
                'height': 32,
                'min_width': 32,
                'max_width': 160,
                'keep_aspect_ratio': True,
                'width_downsample_ratio': 0.25,
            },
            {'type': 'ToTensorOCR'},
            {'type': 'NormalizeOCR', **img_norm_cfg},
            {
                'type': 'Collect',
                'keys': ['img'],
                # No 'text' entry here, in contrast to the training pipeline.
                'meta_keys': [
                    'filename',
                    'ori_shape',
                    'resize_shape',
                    'valid_ratio',
                ],
            },
        ],
    },
]
[Refactor] refactor textrecog config structure (#617)
* refactor configs of textrecog
* remove duplicate key in config _base_
* fix typo
* rename dataset config file
2021-11-25 16:27:45 +08:00
			`img_norm_cfg = dict(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])`
			`train_pipeline = [`
			`dict(type='LoadImageFromFile'),`
			`dict(`
			`type='ResizeOCR',`
			`height=32,`
			`min_width=32,`
			`max_width=160,`
			`keep_aspect_ratio=True,`
			`width_downsample_ratio=0.25),`
			`dict(type='ToTensorOCR'),`
			`dict(type='NormalizeOCR', **img_norm_cfg),`
			`dict(`
			`type='Collect',`
			`keys=['img'],`
			`meta_keys=[`
			`'filename', 'ori_shape', 'resize_shape', 'text', 'valid_ratio'`
			`]),`
			`]`
			`test_pipeline = [`
			`dict(type='LoadImageFromFile'),`
			`dict(`
			`type='MultiRotateAugOCR',`
			`rotate_degrees=[0, 90, 270],`
			`transforms=[`
			`dict(`
			`type='ResizeOCR',`
			`height=32,`
			`min_width=32,`
			`max_width=160,`
			`keep_aspect_ratio=True,`
			`width_downsample_ratio=0.25),`
			`dict(type='ToTensorOCR'),`
			`dict(type='NormalizeOCR', **img_norm_cfg),`
			`dict(`
			`type='Collect',`
			`keys=['img'],`
			`meta_keys=[`
			`'filename', 'ori_shape', 'resize_shape', 'valid_ratio'`
			`]),`
			`])`
			`]`