mmocr/tools/data/utils/lmdb_converter.py

51 lines
1.5 KiB
Python
Raw Normal View History

# Copyright (c) OpenMMLab. All rights reserved.
import argparse
from mmocr.utils import recog2lmdb
def main():
parser = argparse.ArgumentParser()
parser.add_argument('label_path', type=str, help='Path to label file')
parser.add_argument('output', type=str, help='Output lmdb path')
parser.add_argument(
'--img-root', '-i', type=str, help='Input imglist path')
parser.add_argument(
'--label-only',
action='store_true',
help='Only converter label to lmdb')
parser.add_argument(
'--label-format',
'-f',
default='txt',
choices=['txt', 'jsonl'],
help='The format of the label file, either txt or jsonl')
parser.add_argument(
'--batch-size',
'-b',
type=int,
default=1000,
help='Processing batch size, defaults to 1000')
parser.add_argument(
'--encoding',
'-e',
type=str,
default='utf8',
help='Bytes coding scheme, defaults to utf8')
parser.add_argument(
'--lmdb-map-size',
'-m',
type=int,
default=1099511627776,
help='Maximum size database may grow to, '
'defaults to 1099511627776 bytes (1TB)')
opt = parser.parse_args()
assert opt.img_root or opt.label_only
recog2lmdb(opt.img_root, opt.label_path, opt.output, opt.label_format,
opt.label_only, opt.batch_size, opt.encoding, opt.lmdb_map_size)
if __name__ == '__main__':
main()