mmdeploy/csrc/apis/c/text_recognizer.cpp
lzhangzz 640aa03538
Support Windows (#106)
* minor changes

* support windows

* fix GCC build

* fix lint

* reformat

* fix Windows build

* fix GCC build

* search backend ops for onnxruntime

* fix lint

* fix lint

* code clean-up

* code clean-up

* fix clang build

* fix trt support

* fix cmake for ncnn

* fix cmake for openvino

* fix SDK Python API

* handle ops for other backends (ncnn, trt)

* handle SDK Python API library location

* robustify linkage

* fix cuda

* minor fix for openvino & ncnn

* use CMAKE_CUDA_ARCHITECTURES if set

* fix cuda preprocessor

* fix misc

* fix pplnn & pplcv, drop support for pplcv<0.6.0

* robustify cmake

* update build.md (#2)

* build dynamic modules as module library & fix demo (partially)

* fix candidate path for mmdeploy_python

* move "enable CUDA" to cmake config for demo

* refine demo cmake

* add comment

* fix ubuntu build

* revert docs/en/build.md

* fix C API

* fix lint

* Windows build doc (#3)

* check in docs related to mmdeploy build on windows

* update build guide on windows platform

* update build guide on windows platform

* make path of thirdparty libraries consistent

* make path consistency

* correct build command for custom ops

* correct build command for sdk

* update sdk build instructions

* update doc

* correct build command

* fix lint

* correct build command and fix lint

Co-authored-by: lvhan <lvhan@pjlab.org>

* trailing whitespace (#4)

* minor fix

* fix sr sdk model

* fix type deduction

* fix cudaFree after driver shutting down

* update ppl.cv installation warning (#5)

* fix device allocator threshold & fix lint

* update doc (#6)

* update ppl.cv installation warning

* missing 'git clone'

Co-authored-by: chenxin <chenxin2@sensetime.com>
Co-authored-by: zhangli <zhangli@sensetime.com>
Co-authored-by: lvhan028 <lvhan_028@163.com>
Co-authored-by: lvhan <lvhan@pjlab.org>
2022-02-24 20:08:44 +08:00

197 lines
6.1 KiB
C++

// Copyright (c) OpenMMLab. All rights reserved.
#include "text_recognizer.h"
#include <numeric>
#include "archive/value_archive.h"
#include "codebase/mmocr/mmocr.h"
#include "core/device.h"
#include "core/mat.h"
#include "core/operator.h"
#include "core/status_code.h"
#include "core/utils/formatter.h"
#include "handle.h"
using namespace mmdeploy;
namespace {
// Returns the pipeline description that every text recognizer handle starts from.
//
// The value is a function-local static: it is built on the first call and the same object is
// returned by reference afterwards. Callers that need to customise it must copy it first.
//
// The pipeline takes the inputs "img" and "dets", produces "text_unflat", and chains four tasks:
//   warp      - module "WarpBoxes":  ("img", "dets")           -> "patches"
//   flatten   - type "Flatten":      ("patches")               -> ("patch_flat", "patch_index")
//   recog     - type "Inference":    ("patch_flat")            -> "texts"
//   unflatten - type "Unflatten":    ("texts", "patch_index")  -> "text_unflat"
const Value &config_template() {
  // clang-format off
  static Value pipeline_template {
    {
      "pipeline", {
        {
          "tasks", {
            // tasks[0]
            {
              {"name", "warp"},
              {"type", "Task"},
              {"module", "WarpBoxes"},
              {"input", {"img", "dets"}},
              {"output", {"patches"}}
            },
            // tasks[1]
            {
              {"name", "flatten"},
              {"type", "Flatten"},
              {"input", {"patches"}},
              {"output", {"patch_flat", "patch_index"}},
            },
            // tasks[2]: "model" is only a placeholder here ("TBD").
            {
              {"name", "recog"},
              {"type", "Inference"},
              {"params", {{"model", "TBD"},{"batch_size", 1}}},
              {"input", {"patch_flat"}},
              {"output", {"texts"}}
            },
            // tasks[3]
            {
              {"name", "unflatten"},
              {"type", "Unflatten"},
              {"input", {"texts", "patch_index"}},
              {"output", {"text_unflat"}},
            }
          }
        },
        {"input", {"img", "dets"}},
        {"output", {"text_unflat"}}
      }
    }
  };
  // clang-format on
  return pipeline_template;
}
template <class ModelType>
int mmdeploy_text_recognizer_create_impl(ModelType &&m, const char *device_name, int device_id,
mm_handle_t *handle) {
try {
auto value = config_template();
value["pipeline"]["tasks"][2]["params"]["model"] = std::forward<ModelType>(m);
auto recognizer = std::make_unique<Handle>(device_name, device_id, std::move(value));
*handle = recognizer.release();
return MM_SUCCESS;
} catch (const std::exception &e) {
MMDEPLOY_ERROR("exception caught: {}", e.what());
} catch (...) {
MMDEPLOY_ERROR("unknown exception caught");
}
return MM_E_FAIL;
}
} // namespace
// Creates a text recognizer from an already loaded model.
//
// Parameters:
//   model        model object; it is read as a `Model`. Must not be null.
//   device_name  device name, forwarded to the shared create implementation.
//   device_id    device id, forwarded to the shared create implementation.
//   handle       out-parameter receiving the new recognizer; must not be null.
//
// Returns MM_E_INVALID_ARG when `model` or `handle` is null; otherwise the status returned by
// `mmdeploy_text_recognizer_create_impl`.
int mmdeploy_text_recognizer_create(mm_model_t model, const char *device_name, int device_id,
                                    mm_handle_t *handle) {
  // `model` is dereferenced right below, so a null value must be rejected before the cast.
  if (model == nullptr || handle == nullptr) {
    return MM_E_INVALID_ARG;
  }
  return mmdeploy_text_recognizer_create_impl(*static_cast<Model *>(model), device_name, device_id,
                                              handle);
}
int mmdeploy_text_recognizer_create_by_path(const char *model_path, const char *device_name,
int device_id, mm_handle_t *handle) {
return mmdeploy_text_recognizer_create_impl(model_path, device_name, device_id, handle);
}
// Runs recognition on `count` images without any text boxes.
//
// This is `mmdeploy_text_recognizer_apply_bbox` called with null `bboxes` and null
// `bbox_count`; its status code is returned unchanged.
int mmdeploy_text_recognizer_apply(mm_handle_t handle, const mm_mat_t *images, int count,
                                   mm_text_recognize_t **results) {
  const mm_text_detect_t *const no_bboxes = nullptr;
  const int *const no_bbox_count = nullptr;
  const int status = mmdeploy_text_recognizer_apply_bbox(handle, images, count, no_bboxes,
                                                         no_bbox_count, results);
  return status;
}
// Runs text recognition on a batch of images, optionally restricted to given text boxes.
//
// Parameters:
//   handle       recognizer handle; it is used as a `Handle`. Must not be null.
//   images       array of `image_count` images. Must not be null.
//   image_count  number of images; must be positive.
//   bboxes       optional. Boxes of all images stored back to back, image by image.
//   bbox_count   optional. `bbox_count[i]` is the number of boxes that belong to `images[i]`;
//                every entry must be non-negative.
//                Boxes are used only when BOTH `bboxes` and `bbox_count` are non-null; otherwise
//                one result slot per image is allocated.
//   results      out-parameter. On success receives a newly allocated array holding one entry
//                per box (or one per image when no boxes are used). Release it with
//                `mmdeploy_text_recognizer_release_result`, passing the same total count.
//
// Returns MM_SUCCESS on success, MM_E_INVALID_ARG for invalid arguments, and MM_E_FAIL when the
// pipeline throws or returns a result set that does not fit the requested layout. `*results` is
// written only on success.
int mmdeploy_text_recognizer_apply_bbox(mm_handle_t handle, const mm_mat_t *images, int image_count,
                                        const mm_text_detect_t *bboxes, const int *bbox_count,
                                        mm_text_recognize_t **results) {
  // `<= 0` rather than `== 0`: a negative count would later be used to build iterator ranges.
  if (handle == nullptr || images == nullptr || image_count <= 0 || results == nullptr) {
    return MM_E_INVALID_ARG;
  }
  const bool use_boxes = bboxes != nullptr && bbox_count != nullptr;
  if (use_boxes) {
    // A negative per-image count would move the box cursor backwards and corrupt the total.
    for (int i = 0; i < image_count; ++i) {
      if (bbox_count[i] < 0) {
        return MM_E_INVALID_ARG;
      }
    }
  }
  try {
    auto recognizer = static_cast<Handle *>(handle);
    // input[0] collects the images, input[1] the per-image boxes (or null entries).
    Value input{Value::kArray, Value::kArray};
    auto image_boxes = bboxes;  // first box of the image currently being processed
    std::vector<int> counts;    // number of result slots reserved for each image
    for (int i = 0; i < image_count; ++i) {
      // Every field, including the data type, must come from image i (not from images[0]).
      mmdeploy::Mat _mat{images[i].height,         images[i].width, PixelFormat(images[i].format),
                         DataType(images[i].type), images[i].data,  Device{"cpu"}};
      input[0].push_back({{"ori_img", _mat}});
      if (use_boxes) {
        Value boxes(Value::kArray);
        for (int j = 0; j < bbox_count[i]; ++j) {
          // Each box is flattened to x0, y0, x1, y1, ... in the order of its points.
          Value box;
          for (const auto &p : image_boxes[j].bbox) {
            box.push_back(p.x);
            box.push_back(p.y);
          }
          boxes.push_back(std::move(box));
        }
        image_boxes += bbox_count[i];
        counts.push_back(bbox_count[i]);
        input[1].push_back({{"boxes", boxes}});
      } else {
        input[1].push_back(Value::kNull);
        counts.push_back(1);
      }
    }

    auto output = recognizer->Run(std::move(input)).value().front();
    auto recognizer_outputs =
        from_value<std::vector<std::vector<mmocr::TextRecognizerOutput>>>(output);
    // The loop below indexes one output list per image; make sure they all exist.
    if (static_cast<int>(recognizer_outputs.size()) < image_count) {
      MMDEPLOY_ERROR("text recognizer returned results for fewer images than were given");
      return MM_E_FAIL;
    }

    // offsets[i] is the index of the first result slot of image i; offsets.back() is the total.
    std::vector<int> offsets{0};
    std::partial_sum(std::begin(counts), std::end(counts), std::back_inserter(offsets));
    const int result_count = offsets.back();

    // Owns the partially filled array so that any early exit or exception frees it completely.
    // The array is value-initialised, so untouched slots hold null pointers that are safe to
    // release.
    auto deleter = [result_count](mm_text_recognize_t *p) {
      mmdeploy_text_recognizer_release_result(p, result_count);
    };
    std::unique_ptr<mm_text_recognize_t[], decltype(deleter)> _results(
        new mm_text_recognize_t[result_count]{}, deleter);

    for (int i = 0; i < image_count; ++i) {
      const auto &recog_output = recognizer_outputs[i];
      const int produced = static_cast<int>(recog_output.size());
      // More entries than reserved slots would write past this image's slice of the array.
      if (produced > counts[i]) {
        MMDEPLOY_ERROR("text recognizer returned more results than requested for an image");
        return MM_E_FAIL;
      }
      for (int j = 0; j < produced; ++j) {
        auto &res = _results[offsets[i] + j];
        const auto &box_result = recog_output[j];
        const auto &score = box_result.score;
        res.length = static_cast<int>(score.size());
        res.score = new float[score.size()];
        std::copy_n(score.data(), score.size(), res.score);
        const auto &text = box_result.text;
        // +1 copies the terminating null character as well.
        res.text = new char[text.length() + 1];
        std::copy_n(text.data(), text.length() + 1, res.text);
      }
    }
    *results = _results.release();
    return MM_SUCCESS;
  } catch (const std::exception &e) {
    MMDEPLOY_ERROR("exception caught: {}", e.what());
  } catch (...) {
    MMDEPLOY_ERROR("unknown exception caught");
  }
  return MM_E_FAIL;
}
// Frees a result array together with the `score` and `text` buffers of each entry.
//
// Parameters:
//   results  array to free; a null pointer is accepted and ignored.
//   count    number of entries in `results` whose buffers are freed.
//
// Entries whose `score` / `text` are null are handled correctly, because `delete[]` on a null
// pointer does nothing.
void mmdeploy_text_recognizer_release_result(mm_text_recognize_t *results, int count) {
  // Without this guard a null array combined with a positive count would be dereferenced.
  if (results == nullptr) {
    return;
  }
  for (int i = 0; i < count; ++i) {
    delete[] results[i].score;
    delete[] results[i].text;
  }
  delete[] results;
}
// Destroys a recognizer handle by deleting it as a `Handle`.
// Passing a null handle is harmless because deleting a null pointer does nothing.
void mmdeploy_text_recognizer_destroy(mm_handle_t handle) {
  auto *recognizer = static_cast<Handle *>(handle);
  delete recognizer;
}