// File: PaddleOCR/deploy/cpp_infer/include/postprocess_op.h
// Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#pragma once
#include "include/clipper.h"
#include "include/utility.h"
namespace PaddleOCR {
class DBPostProcessor {
2020-07-13 01:21:47 +08:00
public:
2020-07-13 21:05:36 +08:00
void GetContourArea(const std::vector<std::vector<float>> &box,
float unclip_ratio, float &distance);
2020-07-13 01:21:47 +08:00
2020-07-13 21:05:36 +08:00
cv::RotatedRect UnClip(std::vector<std::vector<float>> box,
const float &unclip_ratio);
2020-07-13 01:21:47 +08:00
float **Mat2Vec(cv::Mat mat);
std::vector<std::vector<int>>
2020-07-13 21:05:36 +08:00
OrderPointsClockwise(std::vector<std::vector<int>> pts);
2020-07-13 01:21:47 +08:00
2020-07-13 21:05:36 +08:00
std::vector<std::vector<float>> GetMiniBoxes(cv::RotatedRect box,
float &ssid);
2020-07-13 01:21:47 +08:00
2020-07-13 21:05:36 +08:00
float BoxScoreFast(std::vector<std::vector<float>> box_array, cv::Mat pred);
float PolygonScoreAcc(std::vector<cv::Point> contour, cv::Mat pred);
2020-07-13 01:21:47 +08:00
std::vector<std::vector<std::vector<int>>>
2020-07-13 16:59:21 +08:00
BoxesFromBitmap(const cv::Mat pred, const cv::Mat bitmap,
const float &box_thresh, const float &det_db_unclip_ratio,
const std::string &det_db_score_mode);
2020-07-13 01:21:47 +08:00
std::vector<std::vector<std::vector<int>>>
2020-07-13 16:59:21 +08:00
FilterTagDetRes(std::vector<std::vector<std::vector<int>>> boxes,
float ratio_h, float ratio_w, cv::Mat srcimg);
2020-07-13 01:21:47 +08:00
private:
2020-07-13 21:05:36 +08:00
static bool XsortInt(std::vector<int> a, std::vector<int> b);
static bool XsortFp32(std::vector<float> a, std::vector<float> b);
std::vector<std::vector<float>> Mat2Vector(cv::Mat mat);
2020-07-13 01:21:47 +08:00
inline int _max(int a, int b) { return a >= b ? a : b; }
inline int _min(int a, int b) { return a >= b ? b : a; }
template <class T> inline T clamp(T x, T min, T max) {
if (x > max)
return max;
if (x < min)
return min;
return x;
}
2020-07-13 16:59:21 +08:00
2020-07-13 01:21:47 +08:00
inline float clampf(float x, float min, float max) {
if (x > max)
return max;
if (x < min)
return min;
return x;
}
};
// Post-processing interface for table-structure predictions. Only
// declarations are visible in this header; notes about behavior that the
// signatures alone do not establish are marked NOTE(review).
class TablePostProcessor {
public:
  // Sets up the processor from `label_path`.
  // NOTE(review): presumably loads `label_list_` from that file; the effect
  // of `merge_no_span_structure` (default true) is defined outside this
  // header.
  void init(std::string label_path, bool merge_no_span_structure = true);

  // All arguments are non-const references.
  // NOTE(review): judging by the names, `rec_scores`, `rec_html_tag_batch`
  // and `rec_boxes_batch` are outputs and the rest are inputs — confirm
  // against the definition.
  void Run(std::vector<float> &loc_preds, std::vector<float> &structure_probs,
           std::vector<float> &rec_scores, std::vector<int> &loc_preds_shape,
           std::vector<int> &structure_probs_shape,
           std::vector<std::vector<std::string>> &rec_html_tag_batch,
           std::vector<std::vector<std::vector<int>>> &rec_boxes_batch,
           std::vector<int> &width_list, std::vector<int> &height_list);

private:
  std::vector<std::string> label_list_;
  // Marker strings; NOTE(review): presumably the end- and start-of-sequence
  // tokens of the label vocabulary.
  std::string end = "eos";
  std::string beg = "sos";
};
// Post-processing interface for detector output (the class name suggests the
// PicoDet model — TODO confirm). Only declarations are visible in this
// header; notes about behavior that the signatures alone do not establish are
// marked NOTE(review).
class PicodetPostProcessor {
public:
  // Sets up the processor. The default arguments repeat the in-class
  // initializers of `score_threshold_`, `nms_threshold_` and `fpn_stride_`.
  // NOTE(review): presumably loads `label_list_` from `label_path` and stores
  // the other arguments in the matching members — confirm.
  void init(std::string label_path, const double score_threshold = 0.4,
            const double nms_threshold = 0.5,
            const std::vector<int> &fpn_stride = {8, 16, 32, 64});

  // `results` is a mutable reference; the remaining arguments are taken by
  // value.
  // NOTE(review): presumably `results` receives the detections decoded from
  // `outs`, and `reg_max` is forwarded to disPred2Bbox() — confirm.
  void Run(std::vector<StructurePredictResult> &results,
           std::vector<std::vector<float>> outs, std::vector<int> ori_shape,
           std::vector<int> resize_shape, int reg_max);

  // Publicly readable strides; defaults to {8, 16, 32, 64}.
  std::vector<int> fpn_stride_ = {8, 16, 32, 64};

private:
  // Returns one StructurePredictResult for a single prediction at (x, y)
  // with the given `stride`.
  StructurePredictResult disPred2Bbox(std::vector<float> bbox_pred, int label,
                                      float score, int x, int y, int stride,
                                      std::vector<int> im_shape, int reg_max);

  // Operates on `input_boxes` through a mutable reference.
  // NOTE(review): presumably non-maximum suppression applied in place.
  void nms(std::vector<StructurePredictResult> &input_boxes,
           float nms_threshold);

  std::vector<std::string> label_list_;
  double score_threshold_ = 0.4;
  double nms_threshold_ = 0.5;
  int num_class_ = 5;
};
} // namespace PaddleOCR