From b26907e9081d18543e969d02c82390912def023b Mon Sep 17 00:00:00 2001 From: Tong Gao Date: Sun, 9 Oct 2022 12:43:45 +0800 Subject: [PATCH] [Config] Update rec configs (#1417) --- configs/textrecog/abinet/_base_abinet-vision.py | 2 +- configs/textrecog/abinet/abinet_20e_st-an_mj.py | 2 +- configs/textrecog/crnn/_base_crnn_mini-vgg.py | 2 +- configs/textrecog/crnn/crnn_mini-vgg_5e_mj.py | 2 +- configs/textrecog/master/_base_master_resnet31.py | 2 +- configs/textrecog/master/master_resnet31_12e_st_mj_sa.py | 2 +- configs/textrecog/nrtr/_base_nrtr_modality-transform.py | 2 +- configs/textrecog/nrtr/_base_nrtr_resnet31.py | 2 +- configs/textrecog/nrtr/nrtr_modality-transform_6e_st_mj.py | 2 +- .../textrecog/robust_scanner/_base_robustscanner_resnet31.py | 2 +- .../robustscanner_resnet31_5e_st-sub_mj-sub_sa_real.py | 4 ++-- configs/textrecog/sar/_base_sar_resnet31_parallel-decoder.py | 2 +- .../sar_resnet31_parallel-decoder_5e_st-sub_mj-sub_sa_real.py | 4 ++-- configs/textrecog/satrn/_base_satrn_shallow.py | 2 +- configs/textrecog/satrn/satrn_shallow_5e_st_mj.py | 4 ++-- 15 files changed, 18 insertions(+), 18 deletions(-) diff --git a/configs/textrecog/abinet/_base_abinet-vision.py b/configs/textrecog/abinet/_base_abinet-vision.py index ee889c28..ef9a482f 100644 --- a/configs/textrecog/abinet/_base_abinet-vision.py +++ b/configs/textrecog/abinet/_base_abinet-vision.py @@ -46,7 +46,7 @@ train_pipeline = [ type='LoadImageFromFile', file_client_args=file_client_args, ignore_empty=True, - min_size=5), + min_size=2), dict(type='LoadOCRAnnotations', with_text=True), dict(type='Resize', scale=(128, 32)), dict( diff --git a/configs/textrecog/abinet/abinet_20e_st-an_mj.py b/configs/textrecog/abinet/abinet_20e_st-an_mj.py index 83277075..f59925c1 100644 --- a/configs/textrecog/abinet/abinet_20e_st-an_mj.py +++ b/configs/textrecog/abinet/abinet_20e_st-an_mj.py @@ -37,7 +37,7 @@ test_dataset = dict( type='ConcatDataset', datasets=test_list, pipeline=_base_.test_pipeline) train_dataloader = dict( - batch_size=192 * 4, + batch_size=192, num_workers=32, persistent_workers=True, sampler=dict(type='DefaultSampler', shuffle=True), diff --git a/configs/textrecog/crnn/_base_crnn_mini-vgg.py b/configs/textrecog/crnn/_base_crnn_mini-vgg.py index 519f95e9..b18a61e7 100644 --- a/configs/textrecog/crnn/_base_crnn_mini-vgg.py +++ b/configs/textrecog/crnn/_base_crnn_mini-vgg.py @@ -25,7 +25,7 @@ train_pipeline = [ color_type='grayscale', file_client_args=file_client_args, ignore_empty=True, - min_size=5), + min_size=2), dict(type='LoadOCRAnnotations', with_text=True), dict(type='Resize', scale=(100, 32), keep_ratio=False), dict( diff --git a/configs/textrecog/crnn/crnn_mini-vgg_5e_mj.py b/configs/textrecog/crnn/crnn_mini-vgg_5e_mj.py index acc76cdd..d3eed5cb 100644 --- a/configs/textrecog/crnn/crnn_mini-vgg_5e_mj.py +++ b/configs/textrecog/crnn/crnn_mini-vgg_5e_mj.py @@ -23,7 +23,7 @@ default_hooks = dict(logger=dict(type='LoggerHook', interval=50), ) train_dataloader = dict( batch_size=64, - num_workers=8, + num_workers=24, persistent_workers=True, sampler=dict(type='DefaultSampler', shuffle=True), dataset=dict( diff --git a/configs/textrecog/master/_base_master_resnet31.py b/configs/textrecog/master/_base_master_resnet31.py index 03ff7afe..decc755d 100644 --- a/configs/textrecog/master/_base_master_resnet31.py +++ b/configs/textrecog/master/_base_master_resnet31.py @@ -79,7 +79,7 @@ train_pipeline = [ type='LoadImageFromFile', file_client_args=file_client_args, ignore_empty=True, - min_size=5), + min_size=2), dict(type='LoadOCRAnnotations', with_text=True), dict( type='RescaleToHeight', diff --git a/configs/textrecog/master/master_resnet31_12e_st_mj_sa.py b/configs/textrecog/master/master_resnet31_12e_st_mj_sa.py index 4695e4cf..01c46192 100644 --- a/configs/textrecog/master/master_resnet31_12e_st_mj_sa.py +++ b/configs/textrecog/master/master_resnet31_12e_st_mj_sa.py @@ -37,7 +37,7 @@ test_dataset = dict( train_dataloader = dict( batch_size=512, - num_workers=4, + num_workers=24, persistent_workers=True, sampler=dict(type='DefaultSampler', shuffle=True), dataset=train_dataset) diff --git a/configs/textrecog/nrtr/_base_nrtr_modality-transform.py b/configs/textrecog/nrtr/_base_nrtr_modality-transform.py index 1ca42dd8..bd119f14 100644 --- a/configs/textrecog/nrtr/_base_nrtr_modality-transform.py +++ b/configs/textrecog/nrtr/_base_nrtr_modality-transform.py @@ -30,7 +30,7 @@ train_pipeline = [ type='LoadImageFromFile', file_client_args=file_client_args, ignore_empty=True, - min_size=5), + min_size=2), dict(type='LoadOCRAnnotations', with_text=True), dict( type='RescaleToHeight', diff --git a/configs/textrecog/nrtr/_base_nrtr_resnet31.py b/configs/textrecog/nrtr/_base_nrtr_resnet31.py index 9a2e4d95..e5757eaa 100644 --- a/configs/textrecog/nrtr/_base_nrtr_resnet31.py +++ b/configs/textrecog/nrtr/_base_nrtr_resnet31.py @@ -36,7 +36,7 @@ train_pipeline = [ type='LoadImageFromFile', file_client_args=file_client_args, ignore_empty=True, - min_size=5), + min_size=2), dict(type='LoadOCRAnnotations', with_text=True), dict( type='RescaleToHeight', diff --git a/configs/textrecog/nrtr/nrtr_modality-transform_6e_st_mj.py b/configs/textrecog/nrtr/nrtr_modality-transform_6e_st_mj.py index 89784a0e..a25afa19 100644 --- a/configs/textrecog/nrtr/nrtr_modality-transform_6e_st_mj.py +++ b/configs/textrecog/nrtr/nrtr_modality-transform_6e_st_mj.py @@ -33,7 +33,7 @@ test_dataset = dict( train_dataloader = dict( batch_size=384, - num_workers=32, + num_workers=24, persistent_workers=True, sampler=dict(type='DefaultSampler', shuffle=True), dataset=train_dataset) diff --git a/configs/textrecog/robust_scanner/_base_robustscanner_resnet31.py b/configs/textrecog/robust_scanner/_base_robustscanner_resnet31.py index d75b1fd5..aab1708b 100644 --- a/configs/textrecog/robust_scanner/_base_robustscanner_resnet31.py +++ b/configs/textrecog/robust_scanner/_base_robustscanner_resnet31.py @@ -36,7 +36,7 @@ train_pipeline = [ type='LoadImageFromFile', file_client_args=file_client_args, ignore_empty=True, - min_size=5), + min_size=2), dict(type='LoadOCRAnnotations', with_text=True), dict( type='RescaleToHeight', diff --git a/configs/textrecog/robust_scanner/robustscanner_resnet31_5e_st-sub_mj-sub_sa_real.py b/configs/textrecog/robust_scanner/robustscanner_resnet31_5e_st-sub_mj-sub_sa_real.py index 2a9edbf1..6651ab7b 100644 --- a/configs/textrecog/robust_scanner/robustscanner_resnet31_5e_st-sub_mj-sub_sa_real.py +++ b/configs/textrecog/robust_scanner/robustscanner_resnet31_5e_st-sub_mj-sub_sa_real.py @@ -43,8 +43,8 @@ train_list = [ ] train_dataloader = dict( - batch_size=64, - num_workers=8, + batch_size=64 * 4, + num_workers=24, persistent_workers=True, sampler=dict(type='DefaultSampler', shuffle=True), dataset=dict(type='ConcatDataset', datasets=train_list, verify_meta=False)) diff --git a/configs/textrecog/sar/_base_sar_resnet31_parallel-decoder.py b/configs/textrecog/sar/_base_sar_resnet31_parallel-decoder.py index 6734fb66..3fcb0cee 100755 --- a/configs/textrecog/sar/_base_sar_resnet31_parallel-decoder.py +++ b/configs/textrecog/sar/_base_sar_resnet31_parallel-decoder.py @@ -41,7 +41,7 @@ train_pipeline = [ type='LoadImageFromFile', file_client_args=file_client_args, ignore_empty=True, - min_size=5), + min_size=2), dict(type='LoadOCRAnnotations', with_text=True), dict( type='RescaleToHeight', diff --git a/configs/textrecog/sar/sar_resnet31_parallel-decoder_5e_st-sub_mj-sub_sa_real.py b/configs/textrecog/sar/sar_resnet31_parallel-decoder_5e_st-sub_mj-sub_sa_real.py index cfcdf502..1db30c22 100644 --- a/configs/textrecog/sar/sar_resnet31_parallel-decoder_5e_st-sub_mj-sub_sa_real.py +++ b/configs/textrecog/sar/sar_resnet31_parallel-decoder_5e_st-sub_mj-sub_sa_real.py @@ -43,8 +43,8 @@ train_list = [ ] train_dataloader = dict( - batch_size=64, - num_workers=8, + batch_size=64 * 6, + num_workers=24, persistent_workers=True, sampler=dict(type='DefaultSampler', shuffle=True), dataset=dict(type='ConcatDataset', datasets=train_list, verify_meta=False)) diff --git a/configs/textrecog/satrn/_base_satrn_shallow.py b/configs/textrecog/satrn/_base_satrn_shallow.py index d8eb7a25..11daee52 100644 --- a/configs/textrecog/satrn/_base_satrn_shallow.py +++ b/configs/textrecog/satrn/_base_satrn_shallow.py @@ -46,7 +46,7 @@ train_pipeline = [ type='LoadImageFromFile', file_client_args=file_client_args, ignore_empty=True, - min_size=5), + min_size=2), dict(type='LoadOCRAnnotations', with_text=True), dict(type='Resize', scale=(100, 32), keep_ratio=False), dict( diff --git a/configs/textrecog/satrn/satrn_shallow_5e_st_mj.py b/configs/textrecog/satrn/satrn_shallow_5e_st_mj.py index 16a7ef50..bbf75c0b 100644 --- a/configs/textrecog/satrn/satrn_shallow_5e_st_mj.py +++ b/configs/textrecog/satrn/satrn_shallow_5e_st_mj.py @@ -28,8 +28,8 @@ test_dataset = dict( optim_wrapper = dict(type='OptimWrapper', optimizer=dict(type='Adam', lr=3e-4)) train_dataloader = dict( - batch_size=64, - num_workers=8, + batch_size=128, + num_workers=24, persistent_workers=True, sampler=dict(type='DefaultSampler', shuffle=True), dataset=train_dataset)