mirror of
https://github.com/open-mmlab/mmocr.git
synced 2025-06-03 21:54:47 +08:00
* fix typo of --lmdb-map-size default value * fix Co-authored-by: gaotongxiao <gaotongxiao@gmail.com>
51 lines
1.5 KiB
Python
51 lines
1.5 KiB
Python
# Copyright (c) OpenMMLab. All rights reserved.
|
|
import argparse
|
|
|
|
from mmocr.utils import recog2lmdb
|
|
|
|
|
|
def main():
    """Parse the command-line options and pass them to ``recog2lmdb``.

    Positional arguments are the label file path and the output lmdb path.
    At least one of ``--img-root`` or ``--label-only`` must be supplied;
    otherwise a usage error is printed and the process exits with status 2.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument('label_path', type=str, help='Path to label file')
    parser.add_argument('output', type=str, help='Output lmdb path')
    parser.add_argument(
        '--img-root', '-i', type=str, help='Input imglist path')
    parser.add_argument(
        '--label-only',
        action='store_true',
        help='Only converter label to lmdb')
    parser.add_argument(
        '--label-format',
        '-f',
        default='txt',
        choices=['txt', 'jsonl'],
        help='The format of the label file, either txt or jsonl')
    parser.add_argument(
        '--batch-size',
        '-b',
        type=int,
        default=1000,
        help='Processing batch size, defaults to 1000')
    parser.add_argument(
        '--encoding',
        '-e',
        type=str,
        default='utf8',
        help='Bytes coding scheme, defaults to utf8')
    parser.add_argument(
        '--lmdb-map-size',
        '-m',
        type=int,
        default=1099511627776,
        help='Maximum size database may grow to, '
        'defaults to 1099511627776 bytes (1TB)')
    opt = parser.parse_args()

    # Validate explicitly instead of using ``assert``: assertions are removed
    # when Python runs with -O, which would let this invalid combination
    # through to the conversion call.
    if not (opt.img_root or opt.label_only):
        parser.error('one of --img-root or --label-only must be specified')

    recog2lmdb(opt.img_root, opt.label_path, opt.output, opt.label_format,
               opt.label_only, opt.batch_size, opt.encoding,
               opt.lmdb_map_size)
|
|
|
|
|
|
# Run the converter only when this file is executed as a script.
if __name__ == '__main__':
    main()
|