add ci for paddleocr test (#12062)

* add ci for paddleocr test * fix flake8 error * fix paddlepaddle deps * add dep * fix * move flake8 to pre-commit * update ut * fix bug * fix bug set paddlepaddle==2.5 * fix bug * fix bug * fix bug * update test * remove lscpu
2024-05-22 13:02:24 +08:00 · 2024-05-22 13:02:24 +08:00 · af87691591
parent 579d0c34d4
commit af87691591
14 changed files with 184 additions and 18 deletions
--- a/.github/workflows/pre-commit.yml
+++ b/.github/workflows/pre-commit.yml
@ -1,4 +1,4 @@
-name: pre-commit
+name: PaddleOCR Code Style Check
 on:
  pull_request:
@ -6,11 +6,13 @@ on:
    branches: ['main', 'release/*']
 jobs:
-  pre-commit:
+  check-code-style:
    runs-on: ubuntu-latest
    steps:
-    - uses: actions/checkout@v3
+    - uses: actions/checkout@v4
-    - uses: actions/setup-python@v3
+      with:
        ref: ${{ github.ref }}
    - uses: actions/setup-python@v5
      with:
        python-version: '3.10'
    # Install Dependencies for Python
--- a/.github/workflows/tests.yaml
+++ b/.github/workflows/tests.yaml
@ -0,0 +1,30 @@
 name: PaddleOCR PR Tests
 on:
  push:
  pull_request:
    branches: ["main", "release/*"]
 permissions:
  contents: read
 jobs:
  test-pr:
    runs-on: ubuntu-latest
    steps:
    - uses: actions/checkout@v4
    - name: Set up Python 3.10
      uses: actions/setup-python@v5
      with:
        python-version: "3.10"
    - name: Install dependencies
      run: |
        python -m pip install --upgrade pip
        pip install pytest
        if [ -f requirements.txt ]; then pip install -r requirements.txt; fi
        pip install "paddlepaddle==2.5" requests
        pip install -e .
    - name: Test with pytest
      run: |
        pytest tests/
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@ -35,3 +35,16 @@ repos:
    hooks:
    -   id: black
        files: (.*\.(py|pyi|bzl)|BUILD|.*\.BUILD|WORKSPACE)$
 # Flake8
 -   repo: https://github.com/pycqa/flake8
    rev: 7.0.0
    hooks:
    -   id: flake8
        args:
            - --count
            - --select=E9,F63,F7,F82
            - --show-source
            - --statistics
        exclude: ^benchmark/|^test_tipc/
--- a/benchmark/PaddleOCR_DBNet/data_loader/modules/augment.py
+++ b/benchmark/PaddleOCR_DBNet/data_loader/modules/augment.py
@ -25,7 +25,7 @@ class RandomNoise:
            return data
        data["img"] = (
            random_noise(data["img"], mode="gaussian", clip=True) * 255
-        ).astype(im.dtype)
+        ).astype(data["img"].dtype)
        return data
--- a/deploy/hubserving/kie_ser/module.py
+++ b/deploy/hubserving/kie_ser/module.py
@ -142,7 +142,7 @@ class KIESer(hub.Module):
 if __name__ == "__main__":
-    ocr = OCRSystem()
+    ocr = KIESer()
    ocr._initialize()
    image_path = [
        "./doc/imgs/11.jpg",
--- a/deploy/hubserving/kie_ser_re/module.py
+++ b/deploy/hubserving/kie_ser_re/module.py
@ -144,7 +144,7 @@ class KIESerRE(hub.Module):
 if __name__ == "__main__":
-    ocr = OCRSystem()
+    ocr = KIESerRE()
    ocr._initialize()
    image_path = [
        "./doc/imgs/11.jpg",
--- a/ppocr/data/imaug/label_ops.py
+++ b/ppocr/data/imaug/label_ops.py
@ -841,11 +841,11 @@ class TableBoxEncode(object):
        return data
    def xyxyxyxy2xywh(self, boxes):
-        new_bboxes = np.zeros([len(bboxes), 4])
+        new_bboxes = np.zeros([len(boxes), 4])
-        new_bboxes[:, 0] = bboxes[:, 0::2].min()  # x1
+        new_bboxes[:, 0] = boxes[:, 0::2].min()  # x1
-        new_bboxes[:, 1] = bboxes[:, 1::2].min()  # y1
+        new_bboxes[:, 1] = boxes[:, 1::2].min()  # y1
-        new_bboxes[:, 2] = bboxes[:, 0::2].max() - new_bboxes[:, 0]  # w
+        new_bboxes[:, 2] = boxes[:, 0::2].max() - new_bboxes[:, 0]  # w
-        new_bboxes[:, 3] = bboxes[:, 1::2].max() - new_bboxes[:, 1]  # h
+        new_bboxes[:, 3] = boxes[:, 1::2].max() - new_bboxes[:, 1]  # h
        return new_bboxes
    def xyxy2xywh(self, bboxes):
--- a/ppocr/losses/distillation_loss.py
+++ b/ppocr/losses/distillation_loss.py
@ -1184,7 +1184,9 @@ class DistillCTCLogits(KLCTCLogits):
            loss = super().forward(out1, out2, ctc_label)
            if isinstance(loss, dict):
                for key in loss:
-                    loss_dict["{}_{}_{}".format(self.name, model_name, idx)] = loss[key]
+                    loss_dict[
                        "{}_{}_{}".format(self.name, self.model_name_pairs, idx)
                    ] = loss[key]
            else:
                loss_dict["{}_{}".format(self.name, idx)] = loss
        return loss_dict
--- a/ppocr/metrics/vqa_token_re_metric.py
+++ b/ppocr/metrics/vqa_token_re_metric.py
@ -19,7 +19,7 @@ from __future__ import print_function
 import numpy as np
 import paddle
-__all__ = ["KIEMetric"]
+__all__ = ["VQAReTokenMetric"]
 class VQAReTokenMetric(object):
--- a/ppocr/metrics/vqa_token_ser_metric.py
+++ b/ppocr/metrics/vqa_token_ser_metric.py
@ -19,7 +19,7 @@ from __future__ import print_function
 import numpy as np
 import paddle
-__all__ = ["KIEMetric"]
+__all__ = ["VQASerTokenMetric"]
 class VQASerTokenMetric(object):
--- a/ppocr/modeling/backbones/rec_efficientb3_pren.py
+++ b/ppocr/modeling/backbones/rec_efficientb3_pren.py
@ -27,7 +27,7 @@ import paddle
 import paddle.nn as nn
 import paddle.nn.functional as F
-__all__ = ["EfficientNetb3"]
+__all__ = ["EfficientNetb3_PREN"]
 GlobalParams = collections.namedtuple(
    "GlobalParams",
--- a/ppocr/modeling/heads/rec_aster_head.py
+++ b/ppocr/modeling/heads/rec_aster_head.py
@ -132,7 +132,7 @@ class AttentionRecognitionHead(nn.Layer):
        # Decoder
        state = paddle.zeros([1, batch_size, self.sDim])
-        predicted_ids, predicted_scores = [], []
+        predicted_ids, predicted_scores, predicted = [], [], None
        for i in range(self.max_len_labels):
            if i == 0:
                y_prev = paddle.full(shape=[batch_size], fill_value=self.num_classes)
--- a/ppocr/utils/loggers/wandb_logger.py
+++ b/ppocr/utils/loggers/wandb_logger.py
@ -1,5 +1,8 @@
 import os
 from .base_logger import BaseLogger
 from ppocr.utils.logging import get_logger
 logger = get_logger()
 class WandbLogger(BaseLogger):
@ -11,7 +14,7 @@ class WandbLogger(BaseLogger):
        entity=None,
        save_dir=None,
        config=None,
-        **kwargs
+        **kwargs,
    ):
        try:
            import wandb
--- a/tests/test_paddleocr_api.py
+++ b/tests/test_paddleocr_api.py
@ -0,0 +1,116 @@
 from typing import Any
 import pytest
 from paddleocr import PaddleOCR, PPStructure
 # Test image paths
 IMAGE_PATHS_OCR = ["./doc/imgs_en/254.jpg", "./doc/imgs_en/img_10.jpg"]
 IMAGE_PATHS_STRUCTURE = [
    "./ppstructure/docs/table/layout.jpg",
    "./ppstructure/docs/table/1.png",
 ]
@pytest.fixture(params=["en", "ch"])
 def ocr_engine(request: Any) -> PaddleOCR:
    """
    Initialize PaddleOCR engine with different languages.
    Args:
        request: pytest fixture request object.
    Returns:
        An instance of PaddleOCR.
    """
    return PaddleOCR(lang=request.param)
 def test_ocr_initialization(ocr_engine: PaddleOCR) -> None:
    """
    Test PaddleOCR initialization.
    Args:
        ocr_engine: An instance of PaddleOCR.
    """
    assert ocr_engine is not None
@pytest.mark.parametrize("image_path", IMAGE_PATHS_OCR)
 def test_ocr_function(ocr_engine: PaddleOCR, image_path: str) -> None:
    """
    Test PaddleOCR OCR functionality with different images.
    Args:
        ocr_engine: An instance of PaddleOCR.
        image_path: Path to the image to be processed.
    """
    result = ocr_engine.ocr(image_path)
    assert result is not None
    assert isinstance(result, list)
@pytest.mark.parametrize("image_path", IMAGE_PATHS_OCR)
 def test_ocr_det_only(ocr_engine: PaddleOCR, image_path: str) -> None:
    """
    Test PaddleOCR OCR functionality with detection only.
    Args:
        ocr_engine: An instance of PaddleOCR.
        image_path: Path to the image to be processed.
    """
    result = ocr_engine.ocr(image_path, det=True, rec=False)
    assert result is not None
    assert isinstance(result, list)
@pytest.mark.parametrize("image_path", IMAGE_PATHS_OCR)
 def test_ocr_rec_only(ocr_engine: PaddleOCR, image_path: str) -> None:
    """
    Test PaddleOCR OCR functionality with recognition only.
    Args:
        ocr_engine: An instance of PaddleOCR.
        image_path: Path to the image to be processed.
    """
    result = ocr_engine.ocr(image_path, det=False, rec=True)
    assert result is not None
    assert isinstance(result, list)
@pytest.fixture(params=["en", "ch"])
 def structure_engine(request: Any) -> PPStructure:
    """
    Initialize PPStructure engine with different languages.
    Args:
        request: pytest fixture request object.
    Returns:
        An instance of PPStructure.
    """
    return PPStructure(lang=request.param)
 def test_structure_initialization(structure_engine: PPStructure) -> None:
    """
    Test PPStructure initialization.
    Args:
        structure_engine: An instance of PPStructure.
    """
    assert structure_engine is not None
@pytest.mark.parametrize("image_path", IMAGE_PATHS_STRUCTURE)
 def test_structure_function(structure_engine: PPStructure, image_path: str) -> None:
    """
    Test PPStructure structure analysis functionality with different images.
    Args:
        structure_engine: An instance of PPStructure.
        image_path: Path to the image to be processed.
    """
    result = structure_engine(image_path)
    assert result is not None
    assert isinstance(result, list)