PaddleOCR/benchmark/PaddleOCR_DBNet/utils/make_trainfile.py

21 lines
670 B
Python

# -*- coding: utf-8 -*-
# @Time : 2019/8/24 12:06
# @Author : zhoujun
import os
import glob
import pathlib
data_path = r'test'
# data_path/img 存放图片
# data_path/gt 存放标签文件
f_w = open(os.path.join(data_path, 'test.txt'), 'w', encoding='utf8')
for img_path in glob.glob(data_path + '/img/*.jpg', recursive=True):
d = pathlib.Path(img_path)
label_path = os.path.join(data_path, 'gt', ('gt_' + str(d.stem) + '.txt'))
if os.path.exists(img_path) and os.path.exists(label_path):
print(img_path, label_path)
else:
print('不存在', img_path, label_path)
f_w.write('{}\t{}\n'.format(img_path, label_path))
f_w.close()