# PaddleOCR/configs/table/table_master.yml
# 144 lines, 3.6 KiB, YAML
# (page-view residue: "Raw Normal View History")

# Global run settings. The two anchors defined at the end of this mapping
# (max_text_length and box_format) are aliased by later sections of this file.
Global:
  use_gpu: true
  epoch_num: 17
  log_smooth_window: 20
  print_batch_step: 100
  save_model_dir: ./output/table_master/
  save_epoch_step: 17
  eval_batch_step: [0, 6259]
  cal_metric_during_train: true
  pretrained_model: null
  # Was a bare empty value; a bare `key:` already loads as null, so this only
  # makes the intent explicit.
  checkpoints: null
  save_inference_dir: output/table_master/infer
  use_visualdl: false
  infer_img: ppstructure/docs/table/table.jpg
  save_res_path: ./output/table_master
  character_dict_path: ppocr/utils/dict/table_master_structure_dict.txt
  infer_mode: false
  max_text_length: &max_text_length 500
  box_format: &box_format 'xywh'  # 'xywh', 'xyxy', 'xyxyxyxy'
# Optimizer settings: Adam, a MultiStepDecay learning-rate schedule, and an
# L2 regularizer whose factor is 0.0.
# NOTE(review): nesting was reconstructed from a flattened source; the three
# `name` keys only make sense as Optimizer.name, lr.name and regularizer.name.
Optimizer:
  name: Adam
  beta1: 0.9
  beta2: 0.999
  lr:
    name: MultiStepDecay
    learning_rate: 0.001
    milestones: [12, 15]
    gamma: 0.1
    # NOTE(review): placed under lr because it directly follows the schedule
    # keys; confirm it is not meant to be a direct child of Optimizer.
    warmup_epoch: 0.02
  regularizer:
    name: L2
    factor: 0.0
# Model definition: a TableMaster table model made of a Backbone and a Head.
# NOTE(review): nesting was reconstructed from a flattened source. `name`,
# `headers` and `layers` each appear twice, so they must sit at different
# levels; confirm the placement below against the upstream file.
Architecture:
  model_type: table
  algorithm: TableMaster
  Backbone:
    name: TableResNetExtra
    gcb_config:
      ratio: 0.0625
      headers: 1
      att_scale: false
      fusion_type: channel_add
      # Boolean list: belongs to gcb_config, not to Backbone.
      layers: [false, true, true, true]
    # Integer list: a direct child of Backbone, distinct from gcb_config.layers.
    layers: [1, 2, 5, 3]
  Head:
    name: TableMasterHead
    hidden_size: 512
    headers: 8
    dropout: 0
    d_ff: 2024
    # Alias of the anchor defined under Global.
    max_text_length: *max_text_length
    # Anchor reused by the TableMasterLabelEncode transforms in Train and Eval.
    loc_reg_num: &loc_reg_num 4
# Loss configuration.
Loss:
  name: TableMasterLoss
  ignore_index: 42  # set to len of dict + 3
# Post-processing (label decoding) configuration.
PostProcess:
  name: TableMasterLabelDecode
  box_shape: pad
  # Anchor reused by the TableMasterLabelEncode transforms in Train and Eval.
  merge_no_span_structure: &merge_no_span_structure true
# Evaluation metric configuration.
Metric:
  name: TableMetric
  main_indicator: acc
  compute_bbox_metric: false
  # Alias of the anchor defined under Global.
  box_format: *box_format
# Training data pipeline: dataset location, the ordered list of transforms,
# and the data-loader settings.
# NOTE(review): nesting was reconstructed from a flattened source; each
# transform is a single-key mapping whose value holds that transform's
# parameters. Confirm against the upstream file.
Train:
  dataset:
    name: PubTabDataSet
    data_dir: train_data/table/pubtabnet/train/
    label_file_list: [train_data/table/pubtabnet/PubTabNet_2.0.0_train.jsonl]
    transforms:
      - DecodeImage:
          img_mode: BGR
          channel_first: false
      - TableMasterLabelEncode:
          learn_empty_box: false
          merge_no_span_structure: *merge_no_span_structure
          replace_empty_cell_token: true
          loc_reg_num: *loc_reg_num
          max_text_length: *max_text_length
      - ResizeTableImage:
          max_len: 480
          resize_bboxes: true
      - PaddingTableImage:
          size: [480, 480]
      - TableBoxEncode:
          in_box_format: *box_format
          out_box_format: *box_format
      - NormalizeImage:
          # Loads as the string "1./255." (not a YAML number); left unchanged.
          # NOTE(review): presumably the consumer evaluates it - confirm.
          scale: 1./255.
          mean: [0.5, 0.5, 0.5]
          std: [0.5, 0.5, 0.5]
          order: hwc
      - ToCHWImage: null
      - KeepKeys:
          keep_keys: [image, structure, bboxes, bbox_masks, shape]
  loader:
    shuffle: true
    batch_size_per_card: 10
    drop_last: true
    num_workers: 8
# Evaluation data pipeline: dataset location, the ordered list of transforms,
# and the data-loader settings (no shuffling, no dropped last batch).
# NOTE(review): nesting was reconstructed from a flattened source; each
# transform is a single-key mapping whose value holds that transform's
# parameters. Confirm against the upstream file.
Eval:
  dataset:
    name: PubTabDataSet
    data_dir: train_data/table/pubtabnet/val/
    label_file_list: [train_data/table/pubtabnet/PubTabNet_2.0.0_val.jsonl]
    transforms:
      - DecodeImage:
          img_mode: BGR
          channel_first: false
      - TableMasterLabelEncode:
          learn_empty_box: false
          merge_no_span_structure: *merge_no_span_structure
          replace_empty_cell_token: true
          loc_reg_num: *loc_reg_num
          max_text_length: *max_text_length
      - ResizeTableImage:
          max_len: 480
          resize_bboxes: true
      - PaddingTableImage:
          size: [480, 480]
      - TableBoxEncode:
          in_box_format: *box_format
          out_box_format: *box_format
      - NormalizeImage:
          # Loads as the string "1./255." (not a YAML number); left unchanged.
          # NOTE(review): presumably the consumer evaluates it - confirm.
          scale: 1./255.
          mean: [0.5, 0.5, 0.5]
          std: [0.5, 0.5, 0.5]
          order: hwc
      - ToCHWImage: null
      - KeepKeys:
          keep_keys: [image, structure, bboxes, bbox_masks, shape]
  loader:
    shuffle: false
    drop_last: false
    batch_size_per_card: 10
    num_workers: 8