通过 templateMatch(即 OpenCV 的 matchTemplate)算法,可以得到目标图像与原图像中每个等大子图像之间的归一化相关系数。这个归一化相关系数可以近似看作对应位置匹配成功的概率(严格来说它并不是概率),因此可以设定一个阈值,把相关系数大于该阈值的坐标都筛选出来。但是,在一个成功匹配的坐标附近,往往还存在许多相关性稍小、却同样大于阈值的坐标,我们无法区分这些坐标对应的图像是同一个目标还是其他目标,于是问题就转化为如何去除这些副产物。有 CV 经验的读者应该很快会想到 NMS(非极大值抑制)算法,可参考知乎文章《非极大值抑制(NMS)算法讲解|理论+代码》(zhihu.com)。想了解的同学可以去看看,下面只提供代码实现。
需要注意的是,部分算法(SURF)来自 opencv_contrib 中 nonfree 的 xfeatures2d 模块,使用时请留意其专利与许可限制,以避免纠纷;同时需要使用者在编译 OpenCV 时手动打开 nonfree 编译开关(OPENCV_ENABLE_NONFREE)。相关代码改编自 OpenCV 官方教程《Features2D + Homography to find a known object》。
// Export decoration used on the DLL side: C linkage plus MSVC dllexport.
#define LIBMATCH_API extern "C" __declspec(dllexport)
struct objectEx
cv::Rect_<float> rect;
float prob;
struct objectEx2
cv::Point2f dots[4];
static void qsort_descent_inplace(std::vector<objectEx>& objects)
if (objects.empty())
std::sort(objects.begin(), objects.end(), [](const objectEx& a, const objectEx& b) {return a.prob > b.prob; });
static inline float intersection_area(const objectEx& a, const objectEx& b)
cv::Rect_<float> inter = a.rect & b.rect;
return inter.area();
static void nms_sorted_bboxes(const std::vector<objectEx>& faceobjects, std::vector<int>& picked, float nms_threshold)
const int n = faceobjects.size();
std::vector<float> areas(n);
for (int i = 0; i < n; i++)
areas[i] = faceobjects[i].rect.area();
for (int i = 0; i < n; i++)
const objectEx& a = faceobjects[i];
int keep = 1;
for (int j = 0; j < (int)picked.size(); j++)
const objectEx& b = faceobjects[picked[j]];
// intersection over union
float inter_area = intersection_area(a, b);
float union_area = areas[i] + areas[picked[j]] - inter_area;
// float IoU = inter_area / union_area
if (inter_area / union_area > nms_threshold)
keep = 0;
if (keep)
// Library version number returned by match_get_version().
// NOTE(review): the value looks like a YYMMDD build date — confirm.
const int version = 230622;
// Import decoration used on the consumer side: C linkage plus MSVC dllimport.
#define LIBMATCH_API extern "C" __declspec(dllimport)
// One template-match result as seen by library consumers: a plain-float
// rectangle plus its matching score (no OpenCV types required).
struct objectEx
{
    struct Rect {
        float x, y, width, height;  // top-left corner and size of the match
    } rect;
    float prob;                     // matching score of this result
};
// Feature-match result as seen by library consumers: the four corner points
// of the located object, each stored as a pair of floats.
struct objectEx2
{
    struct {
        float x, y;
    } dots[4];
};
// Returns the library version number.
LIBMATCH_API int match_get_version();
// Template matching: locates occurrences of the target image inside the source image.
//
//   src_img_data / src_img_size       - encoded source image bytes and their length.
//   target_img_data / target_img_size - encoded target (template) image bytes and their length.
//   prob_threshold - minimum matching score for a position to be reported.
//   nms_threshold  - overlap (IoU) threshold used to suppress duplicate detections.
//   RetObejectArr  - caller-allocated output array that receives the results.
//   maxRetCount    - capacity of RetObejectArr, in elements.
//   MaskColor      - colour of the target image to ignore while matching; masking is
//                    disabled when any bit of the top byte is set.
//
// Returns the number of matches found, which may be larger than maxRetCount
// (at most maxRetCount entries are written), or (size_t)-1 when an image cannot be decoded.
LIBMATCH_API size_t match_scan(
    uint8_t* src_img_data,
    const size_t src_img_size,
    uint8_t* target_img_data,
    const size_t target_img_size,
    const float prob_threshold,
    const float nms_threshold,
    objectEx* RetObejectArr,
    const size_t maxRetCount,
    const uint32_t MaskColor //Just For BGR,if high 2bit isn`t zero,mask will be disabled
);
// Feature-based matching: locates the target image inside the source image and
// reports the four corners of the located region.
//
//   src_img_data / src_img_size       - encoded source image bytes and their length.
//   target_img_data / target_img_size - encoded target image bytes and their length.
//   result - receives the four corner points on success.
//
// Returns true when the target was located, false otherwise.
LIBMATCH_API bool match_feat(
    uint8_t* src_img_data,
    const size_t src_img_size,
    uint8_t* target_img_data,
    const size_t target_img_size,
    objectEx2 &result
);
// libmatch.cpp : 定义 DLL 的导出函数。
#include "pch.h"
#include "framework.h"
#include "libmatch.h"
// Returns the library version constant.
LIBMATCH_API int match_get_version()
{
    return version;
}
// Finds occurrences of a template image inside a source image using normalized
// cross-correlation (cv::TM_CCOEFF_NORMED) followed by non-maximum suppression.
//
//   src_img_data / src_img_size       - encoded source image bytes, decoded with cv::imdecode.
//   target_img_data / target_img_size - encoded template image bytes.
//   prob_threshold - minimum correlation score for a position to become a candidate.
//   nms_threshold  - IoU above which a lower-scoring overlapping candidate is discarded.
//   RetObejectArr  - caller-provided output buffer; may be null if no results are wanted.
//   maxRetCount    - capacity of RetObejectArr in elements.
//   MaskColor      - template colour to ignore, compared against (B << 16) | (G << 8) | R
//                    of each template pixel; masking is disabled when any bit of the
//                    top byte is set.
//
// Returns the number of matches that survived NMS (this may exceed maxRetCount; only the
// first maxRetCount, best score first, are copied), (size_t)-1 if either image cannot be
// decoded, or 0 if the template is larger than the source.
LIBMATCH_API size_t match_scan(
    uint8_t* src_img_data,
    const size_t src_img_size,
    uint8_t* target_img_data,
    const size_t target_img_size,
    const float prob_threshold,
    const float nms_threshold,
    objectEx* RetObejectArr,
    const size_t maxRetCount,
    const uint32_t MaskColor //Just For BGR,if high 2bit isn`t zero,mask will be disabled
)
{
    //Read and Process img Start
    cv::_InputArray src_img_arr(src_img_data, src_img_size);
    cv::Mat src_mat = cv::imdecode(src_img_arr, cv::IMREAD_GRAYSCALE);
    if (src_mat.empty())
    {
        std::cout << "[Match] Err Can`t Read src_img" << std::endl;
        return static_cast<size_t>(-1);
    }

    cv::_InputArray target_img_arr(target_img_data, target_img_size);
    cv::Mat target_mat = cv::imdecode(target_img_arr, cv::IMREAD_GRAYSCALE);
    if (target_mat.empty())
    {
        std::cout << "[Match] Err Can`t Read target_img" << std::endl;
        return static_cast<size_t>(-1);
    }

    if (target_mat.cols > src_mat.cols || target_mat.rows > src_mat.rows)
    {
        std::cout << "[Match]ERR Target is too large" << std::endl;
        return 0;  // same value the previous `return false` produced
    }
    //Read Over

    //Template Match Start
    // matchTemplate allocates the score map itself, so no pre-sizing is needed.
    cv::Mat result;
    const bool mask_disabled = (MaskColor & 0xff000000) != 0;
    if (mask_disabled)
    {
        cv::matchTemplate(src_mat, target_mat, result, cv::TM_CCOEFF_NORMED);
    }
    else
    {
        // Build a mask that is 255 wherever the colour template differs from MaskColor.
        cv::Mat temp_target_mat = cv::imdecode(target_img_arr, cv::IMREAD_COLOR);
        cv::Mat maks_mat = cv::Mat::zeros(target_mat.rows, target_mat.cols, CV_8U);
        for (int i = 0; i < temp_target_mat.rows; i++)
        {
            for (int j = 0; j < temp_target_mat.cols; j++)
            {
                const cv::Vec3b temp_color = temp_target_mat.at<cv::Vec3b>(i, j);
                const uint32_t packed = (static_cast<uint32_t>(temp_color[0]) << 16)
                                      | (static_cast<uint32_t>(temp_color[1]) << 8)
                                      | static_cast<uint32_t>(temp_color[2]);
                if (packed != MaskColor)
                {
                    maks_mat.at<uint8_t>(i, j) = 255;
                }
            }
        }
        cv::matchTemplate(src_mat, target_mat, result, cv::TM_CCOEFF_NORMED, maks_mat);
    }
    //Template Match Over

    //BackEnd Process
    // Every position whose score reaches the threshold becomes a candidate box
    // with the template's size.
    std::vector<objectEx> proposals;
    for (int i = 0; i < result.rows; ++i)
    {
        for (int j = 0; j < result.cols; ++j)
        {
            const float score = result.at<float>(i, j);
            if (score >= prob_threshold)
            {
                objectEx buf;
                buf.prob = score;
                buf.rect.x = static_cast<float>(j);
                buf.rect.y = static_cast<float>(i);
                buf.rect.height = static_cast<float>(target_mat.rows);
                buf.rect.width = static_cast<float>(target_mat.cols);
                proposals.push_back(buf);
            }
        }
    }

    // NMS keeps the earliest box of each overlapping cluster, so the candidates
    // must be ordered best-first or a weaker neighbour would win.
    qsort_descent_inplace(proposals);

    std::vector<int> picked;
    nms_sorted_bboxes(proposals, picked, nms_threshold);

    std::vector<objectEx> objects;
    objects.reserve(picked.size());
    for (const int idx : picked)
    {
        objects.push_back(proposals[idx]);
    }
    //BackEnd Over

    // Copy only what fits, and never touch a null or zero-capacity buffer.
    const size_t copy_count = std::min(objects.size(), maxRetCount);
    if (RetObejectArr != nullptr && copy_count > 0)
    {
        memcpy(RetObejectArr, objects.data(), sizeof(objectEx) * copy_count);
    }
    return objects.size();
}
// Locates the target image inside the source image with SURF features, a FLANN
// matcher and a RANSAC homography, and writes the four projected corners of the
// target (top-left, top-right, bottom-right, bottom-left) into result.dots.
//
//   src_img_data / src_img_size       - encoded source (scene) image bytes.
//   target_img_data / target_img_size - encoded target (object) image bytes.
//   result - receives the four corner points in source-image coordinates on success;
//            left untouched on failure.
//
// Returns true on success; false if an image cannot be decoded, too few features or
// good matches are available, or no homography could be estimated.
LIBMATCH_API bool match_feat(
    uint8_t* src_img_data,
    const size_t src_img_size,
    uint8_t* target_img_data,
    const size_t target_img_size,
    objectEx2 &result
)
{
    //Read and Process img Start
    cv::_InputArray src_img_arr(src_img_data, src_img_size);
    cv::Mat src_mat = cv::imdecode(src_img_arr, cv::IMREAD_GRAYSCALE);
    if (src_mat.empty())
    {
        std::cout << "[Match] Err Can`t Read src_img" << std::endl;
        return false;
    }

    cv::_InputArray target_img_arr(target_img_data, target_img_size);
    cv::Mat target_mat = cv::imdecode(target_img_arr, cv::IMREAD_GRAYSCALE);
    if (target_mat.empty())
    {
        std::cout << "[Match] Err Can`t Read target_img" << std::endl;
        return false;
    }
    //Read Over

    //-- Step 1: Detect the keypoints using SURF Detector, compute the descriptors
    int minHessian = 400;
    cv::Ptr<cv::xfeatures2d::SURF> detector = cv::xfeatures2d::SURF::create(minHessian);
    std::vector<cv::KeyPoint> keypoints_object, keypoints_scene;
    cv::Mat descriptors_object, descriptors_scene;
    detector->detectAndCompute(target_mat, cv::noArray(), keypoints_object, descriptors_object);
    detector->detectAndCompute(src_mat, cv::noArray(), keypoints_scene, descriptors_scene);

    // A 2-nearest-neighbour search needs query descriptors and at least two
    // scene descriptors; featureless images cannot be matched.
    if (descriptors_object.empty() || descriptors_scene.rows < 2)
    {
        return false;
    }

    //-- Step 2: Matching descriptor vectors with a FLANN based matcher
    // Since SURF is a floating-point descriptor NORM_L2 is used
    cv::Ptr<cv::DescriptorMatcher> matcher = cv::DescriptorMatcher::create(cv::DescriptorMatcher::FLANNBASED);
    std::vector< std::vector<cv::DMatch> > knn_matches;
    matcher->knnMatch(descriptors_object, descriptors_scene, knn_matches, 2);

    //-- Filter matches using the Lowe's ratio test
    const float ratio_thresh = 0.75f;
    std::vector<cv::DMatch> good_matches;
    for (size_t i = 0; i < knn_matches.size(); i++)
    {
        // The ratio test needs both neighbours; skip incomplete results.
        if (knn_matches[i].size() < 2)
        {
            continue;
        }
        if (knn_matches[i][0].distance < ratio_thresh * knn_matches[i][1].distance)
        {
            good_matches.push_back(knn_matches[i][0]);
        }
    }

    // A homography has 8 degrees of freedom, so at least 4 point pairs are required.
    if (good_matches.size() < 4)
    {
        return false;
    }

    //-- Localize the object
    std::vector<cv::Point2f> obj;
    std::vector<cv::Point2f> scene;
    obj.reserve(good_matches.size());
    scene.reserve(good_matches.size());
    for (size_t i = 0; i < good_matches.size(); i++)
    {
        //-- Get the keypoints from the good matches
        obj.push_back(keypoints_object[good_matches[i].queryIdx].pt);
        scene.push_back(keypoints_scene[good_matches[i].trainIdx].pt);
    }

    cv::Mat H = cv::findHomography(obj, scene, cv::RANSAC);
    if (H.empty())
    {
        // No consistent transform was found; perspectiveTransform would fail on an empty matrix.
        return false;
    }

    //-- Get the corners from the image_1 ( the object to be "detected" )
    std::vector<cv::Point2f> obj_corners(4);
    obj_corners[0] = cv::Point2f(0, 0);
    obj_corners[1] = cv::Point2f((float)target_mat.cols, 0);
    obj_corners[2] = cv::Point2f((float)target_mat.cols, (float)target_mat.rows);
    obj_corners[3] = cv::Point2f(0, (float)target_mat.rows);

    std::vector<cv::Point2f> buf_corners(4);
    cv::perspectiveTransform(obj_corners, buf_corners, H);
    memcpy(result.dots, buf_corners.data(), buf_corners.size() * sizeof(cv::Point2f));
    return true;
}