PaddleOCR/tools/infer/predict_system.py

# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import os
import sys
import subprocess

__dir__ = os.path.dirname(os.path.abspath(__file__))
sys.path.append(__dir__)
sys.path.insert(0, os.path.abspath(os.path.join(__dir__, '../..')))

os.environ["FLAGS_allocator_strategy"] = 'auto_growth'

import cv2
import copy
import numpy as np
import json
import time
import logging
from PIL import Image
import tools.infer.utility as utility
import tools.infer.predict_rec as predict_rec
import tools.infer.predict_det as predict_det
import tools.infer.predict_cls as predict_cls
from ppocr.utils.utility import get_image_file_list, check_and_read
from ppocr.utils.logging import get_logger
from tools.infer.utility import draw_ocr_box_txt, get_rotate_crop_image, get_minarea_rect_crop
logger = get_logger()


class TextSystem(object):
    """
    Text detection -> optional angle classification -> text recognition.

    The detector, recognizer and (when ``args.use_angle_cls`` is set) the
    angle classifier are all built from the same ``args`` object.
    """

    def __init__(self, args):
        """
        args:
            args: parsed options; this class reads show_log, use_angle_cls,
                drop_score, det_box_type, save_crop_res and crop_res_save_dir
        """
        if not args.show_log:
            logger.setLevel(logging.INFO)

        self.args = args
        self.use_angle_cls = args.use_angle_cls
        self.drop_score = args.drop_score
        # Running offset so crops from successive images get distinct names.
        self.crop_image_res_index = 0

        self.text_detector = predict_det.TextDetector(args)
        self.text_recognizer = predict_rec.TextRecognizer(args)
        if self.use_angle_cls:
            self.text_classifier = predict_cls.TextClassifier(args)

    def draw_crop_rec_res(self, output_dir, img_crop_list, rec_res):
        """
        Write every cropped text image into ``output_dir`` and log its
        recognition result at debug level.
        args:
            output_dir(str): destination directory, created when missing
            img_crop_list(list): cropped images, one per text box
            rec_res(list): recognition results indexed like img_crop_list
        """
        os.makedirs(output_dir, exist_ok=True)
        for bno, crop in enumerate(img_crop_list):
            crop_path = os.path.join(
                output_dir, f"mg_crop_{bno+self.crop_image_res_index}.jpg")
            cv2.imwrite(crop_path, crop)
            logger.debug(f"{bno}, {rec_res[bno]}")
        self.crop_image_res_index += len(img_crop_list)

    def __call__(self, img, cls=True):
        """
        Run the whole pipeline on one image.
        args:
            img: image to process; ``None`` is tolerated
            cls(bool): run the angle classifier when it is enabled
        return:
            (boxes, rec_res, time_dict); boxes and rec_res keep only the
            entries whose score is >= drop_score. Both are ``None`` when
            ``img`` is ``None`` or the detector returns no box container.
            time_dict holds the 'det', 'cls', 'rec' and 'all' timings.
        """
        time_dict = {'det': 0, 'rec': 0, 'cls': 0, 'all': 0}

        if img is None:
            logger.debug("no valid image provided")
            return None, None, time_dict

        start = time.time()
        # Crops are taken from an untouched copy of the input image.
        ori_im = img.copy()
        dt_boxes, elapse = self.text_detector(img)
        time_dict['det'] = elapse

        if dt_boxes is None:
            logger.debug("no dt_boxes found, elapsed : {}".format(elapse))
            time_dict['all'] = time.time() - start
            return None, None, time_dict

        logger.debug("dt_boxes num : {}, elapsed : {}".format(
            len(dt_boxes), elapse))

        dt_boxes = sorted_boxes(dt_boxes)

        img_crop_list = []
        for box in dt_boxes:
            # The crop helpers receive a private copy of the box.
            box_copy = copy.deepcopy(box)
            if self.args.det_box_type == "quad":
                crop_fn = get_rotate_crop_image
            else:
                crop_fn = get_minarea_rect_crop
            img_crop_list.append(crop_fn(ori_im, box_copy))

        if self.use_angle_cls and cls:
            img_crop_list, _, elapse = self.text_classifier(img_crop_list)
            time_dict['cls'] = elapse
            logger.debug("cls num  : {}, elapsed : {}".format(
                len(img_crop_list), elapse))

        rec_res, elapse = self.text_recognizer(img_crop_list)
        time_dict['rec'] = elapse
        logger.debug("rec_res num  : {}, elapsed : {}".format(
            len(rec_res), elapse))

        if self.args.save_crop_res:
            self.draw_crop_rec_res(self.args.crop_res_save_dir, img_crop_list,
                                   rec_res)

        # Keep only (box, result) pairs whose score reaches the threshold;
        # index 1 of a recognition result is its score.
        kept = [(box, rec_result)
                for box, rec_result in zip(dt_boxes, rec_res)
                if rec_result[1] >= self.drop_score]
        filter_boxes = [box for box, _ in kept]
        filter_rec_res = [rec_result for _, rec_result in kept]

        time_dict['all'] = time.time() - start
        return filter_boxes, filter_rec_res, time_dict


def sorted_boxes(dt_boxes, same_line_thresh=10):
    """
    Sort text boxes in order from top to bottom, left to right
    args:
        dt_boxes(array or list): detected text boxes; only the first point
            of each box is inspected, as box[0][0] (horizontal) and
            box[0][1] (vertical)
        same_line_thresh(number): two neighbouring boxes whose first-point
            vertical coordinates differ by less than this value are treated
            as lying on the same row and are ordered left to right
    return:
        list of the input boxes in reading order (the input is not modified)
    """
    # Coarse order: by vertical position, ties broken by horizontal position.
    _boxes = sorted(dt_boxes, key=lambda box: (box[0][1], box[0][0]))
    num_boxes = len(_boxes)

    # Refinement: boxes on the same row may differ slightly in their vertical
    # coordinate, so the coarse sort can leave them out of left-to-right
    # order. Bubble each box backwards past same-row neighbours that start
    # further to the right.
    for i in range(num_boxes - 1):
        for j in range(i, -1, -1):
            prev_box, next_box = _boxes[j], _boxes[j + 1]
            same_row = abs(next_box[0][1] - prev_box[0][1]) < same_line_thresh
            if same_row and next_box[0][0] < prev_box[0][0]:
                _boxes[j], _boxes[j + 1] = next_box, prev_box
            else:
                break
    return _boxes


def _visualized_file_name(image_file, flag_gif, flag_pdf, index):
    """Return the path whose basename is used for the visualized image."""
    if flag_gif:
        # Swap the three-character extension for "png".
        return image_file[:-3] + "png"
    if flag_pdf:
        # splitext only strips the final extension and does not depend on
        # its letter case, so every page gets a distinct ".png" name.
        return os.path.splitext(image_file)[0] + '_' + str(index) + '.png'
    return image_file


def main(args):
    """
    Run the OCR system over this process's share of the images found in
    ``args.image_dir``, save one visualized image per processed page into
    ``args.draw_img_save_dir`` and write all predictions to
    ``system_results.txt`` in that same directory.
    args:
        args: parsed options; this function reads image_dir, process_id,
            total_process_num, vis_font_path, drop_score, draw_img_save_dir,
            warmup, page_num and benchmark
    """
    image_file_list = get_image_file_list(args.image_dir)
    # Each process handles every total_process_num-th file, offset by its id.
    image_file_list = image_file_list[args.process_id::args.total_process_num]
    text_sys = TextSystem(args)
    is_visualize = True
    font_path = args.vis_font_path
    drop_score = args.drop_score
    draw_img_save_dir = args.draw_img_save_dir
    os.makedirs(draw_img_save_dir, exist_ok=True)
    save_results = []

    logger.info(
        "In PP-OCRv3, rec_image_shape parameter defaults to '3, 48, 320', "
        "if you are using recognition model with PP-OCRv2 or an older version, please set --rec_image_shape='3,32,320'"
    )

    # warm up 10 times
    if args.warmup:
        img = np.random.uniform(0, 255, [640, 640, 3]).astype(np.uint8)
        for _ in range(10):
            text_sys(img)

    _st = time.time()
    for idx, image_file in enumerate(image_file_list):

        img, flag_gif, flag_pdf = check_and_read(image_file)
        if not flag_gif and not flag_pdf:
            img = cv2.imread(image_file)
        if not flag_pdf:
            if img is None:
                logger.debug("error in loading image:{}".format(image_file))
                continue
            imgs = [img]
        else:
            # For a pdf, img is a sequence of page images; page_num == 0 or a
            # value beyond the page count means "all pages".
            page_num = args.page_num
            if page_num > len(img) or page_num == 0:
                page_num = len(img)
            imgs = img[:page_num]

        multi_page = len(imgs) > 1
        for index, page_img in enumerate(imgs):
            starttime = time.time()
            dt_boxes, rec_res, time_dict = text_sys(page_img)
            elapse = time.time() - starttime
            page_tag = str(idx) + '_' + str(index) if multi_page else str(idx)
            logger.debug("%s  Predict time of %s: %.3fs", page_tag,
                         image_file, elapse)

            # TextSystem returns (None, None, time_dict) when it could not
            # produce any result; skip such a page instead of failing on the
            # iteration below.
            if dt_boxes is None or rec_res is None:
                logger.debug("no ocr result for image:{}".format(image_file))
                continue

            # Entries are indexed rather than unpacked, as TextSystem does,
            # so an entry with more than two fields would not break here.
            # NOTE(review): confirm whether the recognizer can return extra
            # fields per entry.
            for rec_result in rec_res:
                logger.debug("{}, {:.3f}".format(rec_result[0],
                                                 rec_result[1]))

            res = [{
                "transcription": rec_result[0],
                "points": np.array(box).astype(np.int32).tolist(),
            } for box, rec_result in zip(dt_boxes, rec_res)]
            result_name = os.path.basename(image_file)
            if multi_page:
                result_name = result_name + '_' + str(index)
            save_results.append(result_name + "\t" + json.dumps(
                res, ensure_ascii=False) + "\n")

            if is_visualize:
                image = Image.fromarray(
                    cv2.cvtColor(page_img, cv2.COLOR_BGR2RGB))
                txts = [rec_result[0] for rec_result in rec_res]
                scores = [rec_result[1] for rec_result in rec_res]

                draw_img = draw_ocr_box_txt(
                    image,
                    dt_boxes,
                    txts,
                    scores,
                    drop_score=drop_score,
                    font_path=font_path)
                save_file = _visualized_file_name(image_file, flag_gif,
                                                  flag_pdf, index)
                save_path = os.path.join(draw_img_save_dir,
                                         os.path.basename(save_file))
                # Reverse the channel axis before handing the image to cv2.
                cv2.imwrite(save_path, draw_img[:, :, ::-1])
                logger.debug("The visualized image saved in {}".format(
                    save_path))

    logger.info("The predict total time is {}".format(time.time() - _st))
    if args.benchmark:
        text_sys.text_detector.autolog.report()
        text_sys.text_recognizer.autolog.report()

    # NOTE(review): the file is opened with 'w' under a fixed name, so when
    # several processes run with the same draw_img_save_dir they appear to
    # overwrite each other's results - confirm whether that is intended.
    with open(
            os.path.join(draw_img_save_dir, "system_results.txt"),
            'w',
            encoding='utf-8') as f:
        f.writelines(save_results)


if __name__ == "__main__":
    # Script entry point: run in-process, or fan out to one child process per
    # slice of the image list when --use_mp is set.
    args = utility.parse_args()
    if not args.use_mp:
        main(args)
    else:
        # Every child re-runs this script with the original arguments plus
        # its own process id, and with multi-processing switched off so that
        # it does the work itself instead of spawning again.
        base_cmd = [sys.executable, "-u"] + sys.argv
        workers = [
            subprocess.Popen(
                base_cmd + [
                    "--process_id={}".format(worker_id),
                    "--use_mp={}".format(False)
                ],
                stdout=sys.stdout,
                stderr=sys.stdout) for worker_id in range(
                    args.total_process_num)
        ]
        # All children are started before any of them is waited on.
        for worker in workers:
            worker.wait()
upload PaddleOCR code 2020-05-10 16:26:57 +08:00			`# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.`
			`#`
			`# Licensed under the Apache License, Version 2.0 (the "License");`
			`# you may not use this file except in compliance with the License.`
			`# You may obtain a copy of the License at`
			`#`
			`# http://www.apache.org/licenses/LICENSE-2.0`
			`#`
			`# Unless required by applicable law or agreed to in writing, software`
			`# distributed under the License is distributed on an "AS IS" BASIS,`
			`# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`# See the License for the specific language governing permissions and`
			`# limitations under the License.`
在程序中使用os.path.append添加环境变量，不再使用命令设置 2020-06-11 09:45:01 +08:00			`import os`
			`import sys`
revert mp process, test=develop 2021-06-16 10:04:27 +08:00			`import subprocess`
paddleocr whl adaptation dygraph 2020-12-07 19:10:19 +08:00
优化tools/infer/predict_system.py代码 2020-06-20 03:03:39 +08:00			`__dir__ = os.path.dirname(os.path.abspath(__file__))`
在程序中使用os.path.append添加环境变量，不再使用命令设置 2020-06-11 09:45:01 +08:00			`sys.path.append(__dir__)`
fix import order (#5628) 2022-03-04 16:13:54 +08:00			`sys.path.insert(0, os.path.abspath(os.path.join(__dir__, '../..')))`
discard export PYTHONPATH manually 2020-06-12 13:49:24 +08:00
add export to limit GPU-memory-usage 2020-12-22 15:57:21 +08:00			`os.environ["FLAGS_allocator_strategy"] = 'auto_growth'`

upload PaddleOCR code 2020-05-10 16:26:57 +08:00			`import cv2`
			`import copy`
			`import numpy as np`
add system pred save 2022-02-07 07:56:08 +00:00			`import json`
upload PaddleOCR code 2020-05-10 16:26:57 +08:00			`import time`
fix structure pipeline infer bug 2021-06-10 17:12:14 +08:00			`import logging`
add visualize code to predict_eval 2020-05-14 12:08:11 +08:00			`from PIL import Image`
python端预测完成 2020-11-17 17:28:28 +08:00			`import tools.infer.utility as utility`
			`import tools.infer.predict_rec as predict_rec`
			`import tools.infer.predict_det as predict_det`
add predict_cls to predict_system 2020-12-01 16:42:10 +08:00			`import tools.infer.predict_cls as predict_cls`
polish kie doc and code (#7255) * add fapiao kie * fix readme * fix fanli * add readme * add how to do kie en * add algo kie * add algo overview en * rename vqa to kie * fix read gif 2022-08-21 10:55:49 +08:00			`from ppocr.utils.utility import get_image_file_list, check_and_read`
python端预测完成 2020-11-17 17:28:28 +08:00			`from ppocr.utils.logging import get_logger`
add min_area_rect_crop 2022-10-27 15:37:15 +08:00			`from tools.infer.utility import draw_ocr_box_txt, get_rotate_crop_image, get_minarea_rect_crop`
paddleocr whl adaptation dygraph 2020-12-07 19:10:19 +08:00			`logger = get_logger()`

upload PaddleOCR code 2020-05-10 16:26:57 +08:00
			`class TextSystem(object):`
			`def __init__(self, args):`
fix structure pipeline infer bug 2021-06-10 17:12:14 +08:00			`if not args.show_log:`
			`logger.setLevel(logging.INFO)`

upload PaddleOCR code 2020-05-10 16:26:57 +08:00			`self.text_detector = predict_det.TextDetector(args)`
			`self.text_recognizer = predict_rec.TextRecognizer(args)`
add predict_cls to predict_system 2020-12-01 16:42:10 +08:00			`self.use_angle_cls = args.use_angle_cls`
paddleocr whl adaptation dygraph 2020-12-07 19:10:19 +08:00			`self.drop_score = args.drop_score`
add predict_cls to predict_system 2020-12-01 16:42:10 +08:00			`if self.use_angle_cls:`
			`self.text_classifier = predict_cls.TextClassifier(args)`
upload PaddleOCR code 2020-05-10 16:26:57 +08:00
improve system prediction and remove some hard code (#4643) * fix center yaml * rm init_center param * fix typo * improve pred system 2021-11-17 12:32:05 +08:00			`self.args = args`
			`self.crop_image_res_index = 0`

			`def draw_crop_rec_res(self, output_dir, img_crop_list, rec_res):`
			`os.makedirs(output_dir, exist_ok=True)`
upload PaddleOCR code 2020-05-10 16:26:57 +08:00			`bbox_num = len(img_crop_list)`
			`for bno in range(bbox_num):`
improve system prediction and remove some hard code (#4643) * fix center yaml * rm init_center param * fix typo * improve pred system 2021-11-17 12:32:05 +08:00			`cv2.imwrite(`
			`os.path.join(output_dir,`
modified default shape 2022-05-09 12:51:21 +00:00			`f"mg_crop_{bno+self.crop_image_res_index}.jpg"),`
improve system prediction and remove some hard code (#4643) * fix center yaml * rm init_center param * fix typo * improve pred system 2021-11-17 12:32:05 +08:00			`img_crop_list[bno])`
			`logger.debug(f"{bno}, {rec_res[bno]}")`
			`self.crop_image_res_index += bbox_num`
upload PaddleOCR code 2020-05-10 16:26:57 +08:00
combine args in paddleocr and ppocr/infer/utility 2021-05-26 17:34:47 +08:00			`def __call__(self, img, cls=True):`
Don't break overall processing on a bad image (#10216) 2023-07-19 10:46:29 +03:00			`time_dict = {'det': 0, 'rec': 0, 'cls': 0, 'all': 0}`

			`if img is None:`
			`logger.debug("no valid image provided")`
			`return None, None, time_dict`

add SLANet 2022-08-08 06:50:27 +00:00			`start = time.time()`
upload PaddleOCR code 2020-05-10 16:26:57 +08:00			`ori_im = img.copy()`
			`dt_boxes, elapse = self.text_detector(img)`
add SLANet 2022-08-08 06:50:27 +00:00			`time_dict['det'] = elapse`
Don't break overall processing on a bad image (#10216) 2023-07-19 10:46:29 +03:00
upload PaddleOCR code 2020-05-10 16:26:57 +08:00			`if dt_boxes is None:`
Don't break overall processing on a bad image (#10216) 2023-07-19 10:46:29 +03:00			`logger.debug("no dt_boxes found, elapsed : {}".format(elapse))`
			`end = time.time()`
			`time_dict['all'] = end - start`
			`return None, None, time_dict`
			`else:`
			`logger.debug("dt_boxes num : {}, elapsed : {}".format(`
			`len(dt_boxes), elapse))`
upload PaddleOCR code 2020-05-10 16:26:57 +08:00			`img_crop_list = []`
add doc、infer_det.py、requirments.txt 2020-05-11 15:27:52 +08:00
			`dt_boxes = sorted_boxes(dt_boxes)`

upload PaddleOCR code 2020-05-10 16:26:57 +08:00			`for bno in range(len(dt_boxes)):`
			`tmp_box = copy.deepcopy(dt_boxes[bno])`
add min_area_rect_crop 2022-10-27 15:39:31 +08:00			`if self.args.det_box_type == "quad":`
add min_area_rect_crop 2022-10-27 15:37:15 +08:00			`img_crop = get_rotate_crop_image(ori_im, tmp_box)`
			`else:`
			`img_crop = get_minarea_rect_crop(ori_im, tmp_box)`
upload PaddleOCR code 2020-05-10 16:26:57 +08:00			`img_crop_list.append(img_crop)`
combine args in paddleocr and ppocr/infer/utility 2021-05-26 17:34:47 +08:00			`if self.use_angle_cls and cls:`
add predict_cls to predict_system 2020-12-01 16:42:10 +08:00			`img_crop_list, angle_list, elapse = self.text_classifier(`
			`img_crop_list)`
add SLANet 2022-08-08 06:50:27 +00:00			`time_dict['cls'] = elapse`
Don't break overall processing on a bad image (#10216) 2023-07-19 10:46:29 +03:00			`logger.debug("cls num : {}, elapsed : {}".format(`
add predict_cls to predict_system 2020-12-01 16:42:10 +08:00			`len(img_crop_list), elapse))`

upload PaddleOCR code 2020-05-10 16:26:57 +08:00			`rec_res, elapse = self.text_recognizer(img_crop_list)`
add SLANet 2022-08-08 06:50:27 +00:00			`time_dict['rec'] = elapse`
Don't break overall processing on a bad image (#10216) 2023-07-19 10:46:29 +03:00			`logger.debug("rec_res num : {}, elapsed : {}".format(`
paddleocr whl adaptation dygraph 2020-12-07 19:10:19 +08:00			`len(rec_res), elapse))`
improve system prediction and remove some hard code (#4643) * fix center yaml * rm init_center param * fix typo * improve pred system 2021-11-17 12:32:05 +08:00			`if self.args.save_crop_res:`
			`self.draw_crop_rec_res(self.args.crop_res_save_dir, img_crop_list,`
			`rec_res)`
paddleocr whl adaptation dygraph 2020-12-07 19:10:19 +08:00			`filter_boxes, filter_rec_res = [], []`
fix typo 2022-02-07 08:00:14 +00:00			`for box, rec_result in zip(dt_boxes, rec_res):`
CV套件建设专项活动 - 文字识别返回单字识别坐标 (#10515) * modification of return word box * update_implements * Update rec_postprocess.py * Update utility.py 2023-08-02 19:11:28 +08:00			`text, score = rec_result[0], rec_result[1]`
paddleocr whl adaptation dygraph 2020-12-07 19:10:19 +08:00			`if score >= self.drop_score:`
			`filter_boxes.append(box)`
fix typo 2022-02-07 08:00:14 +00:00			`filter_rec_res.append(rec_result)`
add SLANet 2022-08-08 06:50:27 +00:00			`end = time.time()`
			`time_dict['all'] = end - start`
			`return filter_boxes, filter_rec_res, time_dict`
upload PaddleOCR code 2020-05-10 16:26:57 +08:00

add doc、infer_det.py、requirments.txt 2020-05-11 15:27:52 +08:00			`def sorted_boxes(dt_boxes):`
			`"""`
			`Sort text boxes in order from top to bottom, left to right`
			`args:`
update readme 2020-05-14 13:49:28 +08:00			`dt_boxes(array):detected text boxes with shape [4, 2]`
add doc、infer_det.py、requirments.txt 2020-05-11 15:27:52 +08:00			`return:`
			`sorted boxes(array) with shape [4, 2]`
			`"""`
			`num_boxes = dt_boxes.shape[0]`
modify batch num in rec and fix sorted_box func 2020-05-20 16:05:46 +08:00			`sorted_boxes = sorted(dt_boxes, key=lambda x: (x[0][1], x[0][0]))`
add doc、infer_det.py、requirments.txt 2020-05-11 15:27:52 +08:00			`_boxes = list(sorted_boxes)`

			`for i in range(num_boxes - 1):`
fix bug: the index j can not skip 0. (#8918) 2023-01-30 16:10:44 +08:00			`for j in range(i, -1, -1):`
cherry pick PRs from community (#7273) * Merge pull request #6824 from ChenNima/release/2.5-kie-save-res [kie]add write_kie_result to kie infer tool * Merge pull request #6677 from TonyJiangWJ/release/2.5 修复内存泄露问题 * Update native.cpp (#6650) fix issue 6640 * Merge pull request #6625 from ynjang/ynjang update sorted_boxes * fix DeprecationWarning, (#6604) DeprecationWarning: The binary mode of fromstring is deprecated, as it behaves surprisingly on unicode inputs. Use frombuffer instead * Merge pull request #6585 from maxbachmann/release/2.5 replace GPL licensed components * Merge pull request #6575 from Eling486/release/2.5 update win doc * Merge pull request #6477 from MikoyChinese/fix-copy-paste Fix copy_paste no texts augment. * Merge pull request #6361 from mohamadmansourX/patch-9 Update README_en.md Co-authored-by: Double_V <liuvv0203@163.com> Co-authored-by: shawn <1021362695@qq.com> Co-authored-by: paopjian <672034519@qq.com> 2022-08-21 18:03:57 +08:00			`if abs(_boxes[j + 1][0][1] - _boxes[j][0][1]) < 10 and \`
			`(_boxes[j + 1][0][0] < _boxes[j][0][0]):`
			`tmp = _boxes[j]`
			`_boxes[j] = _boxes[j + 1]`
			`_boxes[j + 1] = tmp`
			`else:`
			`break`
add doc、infer_det.py、requirments.txt 2020-05-11 15:27:52 +08:00			`return _boxes`


优化tools/infer/predict_system.py代码 2020-06-20 03:03:39 +08:00			`def main(args):`
add visualize code to predict_eval 2020-05-14 12:08:11 +08:00			`image_file_list = get_image_file_list(args.image_dir)`
revert mp process, test=develop 2021-06-16 10:04:27 +08:00			`image_file_list = image_file_list[args.process_id::args.total_process_num]`
upload PaddleOCR code 2020-05-10 16:26:57 +08:00			`text_sys = TextSystem(args)`
add visualize code to predict_eval 2020-05-14 12:08:11 +08:00			`is_visualize = True`
add predict_cls to predict_system 2020-12-01 16:42:10 +08:00			`font_path = args.vis_font_path`
delete debug code 2020-12-02 15:53:55 +08:00			`drop_score = args.drop_score`
add system pred save 2022-02-07 07:56:08 +00:00			`draw_img_save_dir = args.draw_img_save_dir`
			`os.makedirs(draw_img_save_dir, exist_ok=True)`
			`save_results = []`
Merge branch 'dygraph' into warmup 2021-06-09 14:54:08 +08:00
add SLANet 2022-08-08 06:50:27 +00:00			`logger.info(`
			`"In PP-OCRv3, rec_image_shape parameter defaults to '3, 48, 320', "`
			`"if you are using recognition model with PP-OCRv2 or an older version, please set --rec_image_shape='3,32,320"`
			`)`

add warmup 2021-06-09 13:27:13 +08:00			`# warm up 10 times`
			`if args.warmup:`
			`img = np.random.uniform(0, 255, [640, 640, 3]).astype(np.uint8)`
			`for i in range(10):`
			`res = text_sys(img)`
merge dygraph 2021-06-30 10:55:05 +08:00
add python benchmark for ocr 2021-05-26 10:40:16 +00:00			`total_time = 0`
			`cpu_mem, gpu_mem, gpu_util = 0, 0, 0`
			`_st = time.time()`
			`count = 0`
			`for idx, image_file in enumerate(image_file_list):`
add warmup 2021-06-09 13:27:13 +08:00
support infer pdf file 2022-09-29 07:31:45 +00:00			`img, flag_gif, flag_pdf = check_and_read(image_file)`
			`if not flag_gif and not flag_pdf:`
read gif read func 2020-07-28 11:18:48 +08:00			`img = cv2.imread(image_file)`
support infer pdf file 2022-09-29 07:31:45 +00:00			`if not flag_pdf:`
			`if img is None:`
			`logger.debug("error in loading image:{}".format(image_file))`
			`continue`
			`imgs = [img]`
			`else:`
			`page_num = args.page_num`
			`if page_num > len(img) or page_num == 0:`
			`page_num = len(img)`
			`imgs = img[:page_num]`
			`for index, img in enumerate(imgs):`
			`starttime = time.time()`
			`dt_boxes, rec_res, time_dict = text_sys(img)`
			`elapse = time.time() - starttime`
			`total_time += elapse`
			`if len(imgs) > 1:`
			`logger.debug(`
			`str(idx) + '_' + str(index) + " Predict time of %s: %.3fs"`
			`% (image_file, elapse))`
			`else:`
			`logger.debug(`
			`str(idx) + " Predict time of %s: %.3fs" % (image_file,`
			`elapse))`
			`for text, score in rec_res:`
			`logger.debug("{}, {:.3f}".format(text, score))`

			`res = [{`
			`"transcription": rec_res[i][0],`
			`"points": np.array(dt_boxes[i]).astype(np.int32).tolist(),`
			`} for i in range(len(dt_boxes))]`
			`if len(imgs) > 1:`
			`save_pred = os.path.basename(image_file) + '_' + str(`
			`index) + "\t" + json.dumps(`
			`res, ensure_ascii=False) + "\n"`
			`else:`
			`save_pred = os.path.basename(image_file) + "\t" + json.dumps(`
			`res, ensure_ascii=False) + "\n"`
			`save_results.append(save_pred)`

			`if is_visualize:`
			`image = Image.fromarray(cv2.cvtColor(img, cv2.COLOR_BGR2RGB))`
			`boxes = dt_boxes`
			`txts = [rec_res[i][0] for i in range(len(rec_res))]`
			`scores = [rec_res[i][1] for i in range(len(rec_res))]`

			`draw_img = draw_ocr_box_txt(`
			`image,`
			`boxes,`
			`txts,`
			`scores,`
			`drop_score=drop_score,`
			`font_path=font_path)`
			`if flag_gif:`
			`save_file = image_file[:-3] + "png"`
			`elif flag_pdf:`
			`save_file = image_file.replace('.pdf',`
			`'_' + str(index) + '.png')`
			`else:`
			`save_file = image_file`
			`cv2.imwrite(`
			`os.path.join(draw_img_save_dir,`
			`os.path.basename(save_file)),`
			`draw_img[:, :, ::-1])`
			`logger.debug("The visualized image saved in {}".format(`
			`os.path.join(draw_img_save_dir, os.path.basename(`
			`save_file))))`
优化tools/infer/predict_system.py代码 2020-06-20 03:03:39 +08:00
add python benchmark for ocr 2021-05-26 10:40:16 +00:00			`logger.info("The predict total time is {}".format(time.time() - _st))`
set benchmark in predict_system 2021-08-27 06:46:40 +00:00			`if args.benchmark:`
			`text_sys.text_detector.autolog.report()`
			`text_sys.text_recognizer.autolog.report()`
add python benchmark for ocr 2021-05-26 10:40:16 +00:00
add SLANet 2022-08-08 06:50:27 +00:00			`with open(`
			`os.path.join(draw_img_save_dir, "system_results.txt"),`
			`'w',`
			`encoding='utf-8') as f:`
add system pred save 2022-02-07 07:56:08 +00:00			`f.writelines(save_results)`

set benchmark in predict_system 2021-08-27 06:48:27 +00:00
add python benchmark for ocr 2021-05-26 10:40:16 +00:00			`if __name__ == "__main__":`
revert mp process, test=develop 2021-06-16 10:04:27 +08:00			`args = utility.parse_args()`
			`if args.use_mp:`
			`p_list = []`
			`total_process_num = args.total_process_num`
			`for process_id in range(total_process_num):`
			`cmd = [sys.executable, "-u"] + sys.argv + [`
			`"--process_id={}".format(process_id),`
			`"--use_mp={}".format(False)`
			`]`
			`p = subprocess.Popen(cmd, stdout=sys.stdout, stderr=sys.stdout)`
			`p_list.append(p)`
			`for p in p_list:`
			`p.wait()`
			`else:`
			`main(args)`