mmocr/tools/data/utils/txt2lmdb.py

31 lines
754 B
Python

import argparse
from mmocr.utils import lmdb_converter
def main():
parser = argparse.ArgumentParser()
parser.add_argument(
'--imglist', '-i', required=True, help='input imglist path')
parser.add_argument(
'--output', '-o', required=True, help='output lmdb path')
parser.add_argument(
'--batch_size',
'-b',
type=int,
default=10000,
help='processing batch size, default 10000')
parser.add_argument(
'--coding',
'-c',
default='utf8',
help='bytes coding scheme, default utf8')
opt = parser.parse_args()
lmdb_converter(
opt.imglist, opt.output, batch_size=opt.batch_size, coding=opt.coding)
if __name__ == '__main__':
main()