Yike Yuan a673b048a5
[Feature] Add support for VizWiz dataset. (#1636)
* add vizwiz

* update dataset

* [Fix] Build img_path in data_sample.

* Fix isort.

---------

Co-authored-by: ZhangYuanhan-AI <yuanhan002@ntu.edu.sg>
2023-06-16 17:16:17 +08:00

81 lines
2.0 KiB
Python

# data settings
data_preprocessor = dict(
mean=[122.770938, 116.7460125, 104.09373615],
std=[68.5005327, 66.6321579, 70.32316305],
to_rgb=True,
)
train_pipeline = [
dict(type='LoadImageFromFile'),
dict(
type='RandomResizedCrop',
scale=384,
interpolation='bicubic',
backend='pillow'),
dict(
type='PackInputs',
algorithm_keys=['question', 'gt_answer', 'gt_answer_weight'],
meta_keys=['question_id', 'image_id'],
),
]
test_pipeline = [
dict(type='LoadImageFromFile'),
dict(
type='Resize',
scale=(480, 480),
interpolation='bicubic',
backend='pillow'),
dict(
type='CleanCaption',
keys=['question'],
),
dict(
type='PackInputs',
algorithm_keys=['question', 'gt_answer', 'gt_answer_weight'],
meta_keys=['question_id', 'image_id'],
),
]
train_dataloader = dict(
batch_size=16,
num_workers=8,
dataset=dict(
type='VizWiz',
data_root='data/vizwiz/Images',
data_prefix='',
ann_file='Annotations/train.json',
pipeline=train_pipeline),
sampler=dict(type='DefaultSampler', shuffle=True),
persistent_workers=True,
drop_last=True,
)
val_dataloader = dict(
batch_size=16,
num_workers=8,
dataset=dict(
type='VizWiz',
data_root='data/vizwiz/Images',
data_prefix='',
ann_file='Annotations/val.json',
pipeline=test_pipeline),
sampler=dict(type='DefaultSampler', shuffle=False),
persistent_workers=True,
)
val_evaluator = dict(type='VizWizAcc')
test_dataloader = dict(
batch_size=16,
num_workers=8,
dataset=dict(
type='VizWiz',
data_root='data/vizwiz/Images',
data_prefix='',
ann_file='Annotations/test.json',
pipeline=test_pipeline),
sampler=dict(type='DefaultSampler', shuffle=False),
)
test_evaluator = dict(type='ReportVQA', file_path='vqa_test.json')