mmdeploy/csrc/codebase/mmdet/instance_segmentation.cpp

101 lines
3.7 KiB
C++

// Copyright (c) OpenMMLab. All rights reserved.
#include "core/registry.h"
#include "experimental/module_adapter.h"
#include "object_detection.h"
#include "opencv2/imgproc/imgproc.hpp"
#include "preprocess/cpu/opencv_utils.h"
#include "preprocess/transform/transform_utils.h"
namespace mmdeploy::mmdet {
class ResizeInstanceMask : public ResizeBBox {
public:
explicit ResizeInstanceMask(const Value& cfg) : ResizeBBox(cfg) {
if (cfg.contains("params")) {
mask_thr_binary_ = cfg["params"].value("mask_thr_binary", mask_thr_binary_);
}
}
Result<Value> operator()(const Value& prep_res, const Value& infer_res) {
DEBUG("prep_res: {}\ninfer_res: {}", prep_res, infer_res);
try {
assert(prep_res.contains("img_metas"));
// Value res = prep_res;
auto dets = infer_res["dets"].get<Tensor>();
auto labels = infer_res["labels"].get<Tensor>();
auto masks = infer_res["masks"].get<Tensor>();
DEBUG("dets.shape: {}", dets.shape());
DEBUG("labels.shape: {}", labels.shape());
DEBUG("masks.shape: {}", masks.shape());
// `dets` is supposed to have 3 dims. They are 'batch', 'bboxes_number'
// and 'channels' respectively
assert(dets.shape().size() == 3);
assert(dets.data_type() == DataType::kFLOAT);
assert(masks.data_type() == DataType::kFLOAT);
// `labels` is supposed to have 2 dims, which are 'batch' and
// 'bboxes_number'
assert(labels.shape().size() == 2);
OUTCOME_TRY(auto _dets, MakeAvailableOnDevice(dets, kHost, stream()));
OUTCOME_TRY(auto _labels, MakeAvailableOnDevice(labels, kHost, stream()));
OUTCOME_TRY(auto _masks, MakeAvailableOnDevice(masks, kHost, stream()));
OUTCOME_TRY(stream().Wait());
OUTCOME_TRY(auto result, DispatchGetBBoxes(prep_res["img_metas"], _dets, _labels));
auto ori_w = prep_res["img_metas"]["ori_shape"][2].get<int>();
auto ori_h = prep_res["img_metas"]["ori_shape"][1].get<int>();
ProcessMasks(result, _masks, ori_w, ori_h);
return to_value(result);
} catch (const std::exception& e) {
ERROR("{}", e.what());
return Status(eFail);
}
}
protected:
void ProcessMasks(DetectorOutput& result, Tensor cpu_masks, int img_w, int img_h) const {
auto shape = TensorShape{cpu_masks.shape(1), cpu_masks.shape(2), cpu_masks.shape(3)};
cpu_masks.Reshape(shape);
for (auto& det : result.detections) {
auto mask = cpu_masks.Slice(det.index);
cv::Mat mask_mat(mask.shape(1), mask.shape(2), CV_32F, mask.data<float>());
cv::Mat warped_mask;
auto& bbox = det.bbox;
// same as mmdet with skip_empty = True
auto x0 = std::max(std::floor(bbox[0]) - 1, 0.f);
auto y0 = std::max(std::floor(bbox[1]) - 1, 0.f);
auto x1 = std::min(std::ceil(bbox[2]) + 1, (float)img_w);
auto y1 = std::min(std::ceil(bbox[3]) + 1, (float)img_h);
auto width = static_cast<int>(x1 - x0);
auto height = static_cast<int>(y1 - y0);
// params align_corners = False
auto fx = (float)mask_mat.cols / (bbox[2] - bbox[0]);
auto fy = (float)mask_mat.rows / (bbox[3] - bbox[1]);
auto tx = (x0 + .5f - bbox[0]) * fx - .5f;
auto ty = (y0 + .5f - bbox[1]) * fy - .5f;
cv::Mat m = (cv::Mat_<float>(2, 3) << fx, 0, tx, 0, fy, ty);
cv::warpAffine(mask_mat, warped_mask, m, cv::Size{width, height},
cv::INTER_LINEAR | cv::WARP_INVERSE_MAP);
warped_mask = warped_mask > mask_thr_binary_;
det.mask = cpu::CVMat2Mat(warped_mask, PixelFormat::kGRAYSCALE);
}
}
float mask_thr_binary_{.5f};
};
REGISTER_CODEBASE_COMPONENT(MMDetection, ResizeInstanceMask);
} // namespace mmdeploy::mmdet