mirror of
https://github.com/open-mmlab/mmocr.git
synced 2025-06-03 21:54:47 +08:00
51 lines
1.5 KiB
Python
51 lines
1.5 KiB
Python
|
# Copyright (c) OpenMMLab. All rights reserved.
|
||
|
import argparse
|
||
|
|
||
|
from mmocr.utils import recog2lmdb
|
||
|
|
||
|
|
||
|
def main():
    """Parse the command-line options and pass them to ``recog2lmdb``.

    Positional arguments are the label file path and the output lmdb path.
    Either ``--img-root`` or ``--label-only`` must be supplied.

    Raises:
        SystemExit: Raised by argparse (exit status 2, after printing the
            usage message) when the arguments are invalid, including when
            neither ``--img-root`` nor ``--label-only`` is given.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument('label_path', type=str, help='Path to label file')
    parser.add_argument('output', type=str, help='Output lmdb path')
    parser.add_argument(
        '--img-root', '-i', type=str, help='Input imglist path')
    parser.add_argument(
        '--label-only',
        action='store_true',
        help='Only converter label to lmdb')
    parser.add_argument(
        '--label-format',
        '-f',
        default='txt',
        choices=['txt', 'jsonl'],
        help='The format of the label file, either txt or jsonl')
    parser.add_argument(
        '--batch-size',
        '-b',
        type=int,
        default=1000,
        help='Processing batch size, defaults to 1000')
    parser.add_argument(
        '--encoding',
        '-e',
        type=str,
        default='utf8',
        help='Bytes coding scheme, defaults to utf8')
    parser.add_argument(
        '--lmdb-map-size',
        '-m',
        type=int,
        default=109951162776,
        help='Maximum size database may grow to, '
        'defaults to 109951162776 bytes')
    opt = parser.parse_args()

    # Validate explicitly instead of with ``assert``: assertions are removed
    # when Python runs with -O, and a bare AssertionError gives the user no
    # hint about which option is missing.
    if not (opt.img_root or opt.label_only):
        parser.error('--img-root is required unless --label-only is set')
    recog2lmdb(opt.img_root, opt.label_path, opt.output, opt.label_format,
               opt.label_only, opt.batch_size, opt.encoding, opt.lmdb_map_size)
|
||
|
|
||
|
|
||
|
# Run the converter only when this file is executed as a script, so that
# importing the module has no side effects.
if __name__ == '__main__':
    main()
|