// Mirror of https://github.com/opencv/opencv.git
// Synced 2024-11-25 03:30:34 +08:00
// 156 lines, 5.2 KiB, C++
#include "opencv2/highgui/highgui.hpp"
|
|
#include "opencv2/core/core.hpp"
|
|
#include "opencv2/imgproc/imgproc.hpp"
|
|
#include "opencv2/features2d/features2d.hpp"
|
|
#include "opencv2/objdetect/objdetect.hpp"
|
|
#include "opencv2/legacy/legacy.hpp"
|
|
|
|
#include <algorithm>
|
|
#include <iostream>
|
|
#include <vector>
|
|
#include <stdio.h>
|
|
|
|
using namespace cv;
|
|
// Prints a short description of this sample and its command-line usage to stdout.
static void help()
{
    printf( "This program shows the use of the \"fern\" planar PlanarObjectDetector point\n"
            "descriptor classifier\n"
            "Usage:\n"
            "./find_obj_ferns <object_filename> <scene_filename>, default: box.png and box_in_scene.png\n\n");
}
|
|
|
|
|
|
int main(int argc, char** argv)
|
|
{
|
|
int i;
|
|
|
|
const char* object_filename = argc > 1 ? argv[1] : "box.png";
|
|
const char* scene_filename = argc > 2 ? argv[2] : "box_in_scene.png";
|
|
|
|
help();
|
|
|
|
Mat object = imread( object_filename, CV_LOAD_IMAGE_GRAYSCALE );
|
|
Mat scene = imread( scene_filename, CV_LOAD_IMAGE_GRAYSCALE );
|
|
|
|
if( !object.data || !scene.data )
|
|
{
|
|
fprintf( stderr, "Can not load %s and/or %s\n",
|
|
object_filename, scene_filename );
|
|
exit(-1);
|
|
}
|
|
|
|
double imgscale = 1;
|
|
Mat image;
|
|
|
|
resize(scene, image, Size(), 1./imgscale, 1./imgscale, INTER_CUBIC);
|
|
|
|
cvNamedWindow("Object", 1);
|
|
cvNamedWindow("Image", 1);
|
|
cvNamedWindow("Object Correspondence", 1);
|
|
|
|
Size patchSize(32, 32);
|
|
LDetector ldetector(7, 20, 2, 2000, patchSize.width, 2);
|
|
ldetector.setVerbose(true);
|
|
PlanarObjectDetector detector;
|
|
|
|
vector<Mat> objpyr, imgpyr;
|
|
int blurKSize = 3;
|
|
double sigma = 0;
|
|
GaussianBlur(object, object, Size(blurKSize, blurKSize), sigma, sigma);
|
|
GaussianBlur(image, image, Size(blurKSize, blurKSize), sigma, sigma);
|
|
buildPyramid(object, objpyr, ldetector.nOctaves-1);
|
|
buildPyramid(image, imgpyr, ldetector.nOctaves-1);
|
|
|
|
vector<KeyPoint> objKeypoints, imgKeypoints;
|
|
PatchGenerator gen(0,256,5,true,0.8,1.2,-CV_PI/2,CV_PI/2,-CV_PI/2,CV_PI/2);
|
|
|
|
string model_filename = format("%s_model.xml.gz", object_filename);
|
|
printf("Trying to load %s ...\n", model_filename.c_str());
|
|
FileStorage fs(model_filename, FileStorage::READ);
|
|
if( fs.isOpened() )
|
|
{
|
|
detector.read(fs.getFirstTopLevelNode());
|
|
printf("Successfully loaded %s.\n", model_filename.c_str());
|
|
}
|
|
else
|
|
{
|
|
printf("The file not found and can not be read. Let's train the model.\n");
|
|
printf("Step 1. Finding the robust keypoints ...\n");
|
|
ldetector.setVerbose(true);
|
|
ldetector.getMostStable2D(object, objKeypoints, 100, gen);
|
|
printf("Done.\nStep 2. Training ferns-based planar object detector ...\n");
|
|
detector.setVerbose(true);
|
|
|
|
detector.train(objpyr, objKeypoints, patchSize.width, 100, 11, 10000, ldetector, gen);
|
|
printf("Done.\nStep 3. Saving the model to %s ...\n", model_filename.c_str());
|
|
if( fs.open(model_filename, FileStorage::WRITE) )
|
|
detector.write(fs, "ferns_model");
|
|
}
|
|
printf("Now find the keypoints in the image, try recognize them and compute the homography matrix\n");
|
|
fs.release();
|
|
|
|
vector<Point2f> dst_corners;
|
|
Mat correspond( object.rows + image.rows, std::max(object.cols, image.cols), CV_8UC3);
|
|
correspond = Scalar(0.);
|
|
Mat part(correspond, Rect(0, 0, object.cols, object.rows));
|
|
cvtColor(object, part, CV_GRAY2BGR);
|
|
part = Mat(correspond, Rect(0, object.rows, image.cols, image.rows));
|
|
cvtColor(image, part, CV_GRAY2BGR);
|
|
|
|
vector<int> pairs;
|
|
Mat H;
|
|
|
|
double t = (double)getTickCount();
|
|
objKeypoints = detector.getModelPoints();
|
|
ldetector(imgpyr, imgKeypoints, 300);
|
|
|
|
std::cout << "Object keypoints: " << objKeypoints.size() << "\n";
|
|
std::cout << "Image keypoints: " << imgKeypoints.size() << "\n";
|
|
bool found = detector(imgpyr, imgKeypoints, H, dst_corners, &pairs);
|
|
t = (double)getTickCount() - t;
|
|
printf("%gms\n", t*1000/getTickFrequency());
|
|
|
|
if( found )
|
|
{
|
|
for( i = 0; i < 4; i++ )
|
|
{
|
|
Point r1 = dst_corners[i%4];
|
|
Point r2 = dst_corners[(i+1)%4];
|
|
line( correspond, Point(r1.x, r1.y+object.rows),
|
|
Point(r2.x, r2.y+object.rows), Scalar(0,0,255) );
|
|
}
|
|
}
|
|
|
|
for( i = 0; i < (int)pairs.size(); i += 2 )
|
|
{
|
|
line( correspond, objKeypoints[pairs[i]].pt,
|
|
imgKeypoints[pairs[i+1]].pt + Point2f(0,(float)object.rows),
|
|
Scalar(0,255,0) );
|
|
}
|
|
|
|
imshow( "Object Correspondence", correspond );
|
|
Mat objectColor;
|
|
cvtColor(object, objectColor, CV_GRAY2BGR);
|
|
for( i = 0; i < (int)objKeypoints.size(); i++ )
|
|
{
|
|
circle( objectColor, objKeypoints[i].pt, 2, Scalar(0,0,255), -1 );
|
|
circle( objectColor, objKeypoints[i].pt, (1 << objKeypoints[i].octave)*15, Scalar(0,255,0), 1 );
|
|
}
|
|
Mat imageColor;
|
|
cvtColor(image, imageColor, CV_GRAY2BGR);
|
|
for( i = 0; i < (int)imgKeypoints.size(); i++ )
|
|
{
|
|
circle( imageColor, imgKeypoints[i].pt, 2, Scalar(0,0,255), -1 );
|
|
circle( imageColor, imgKeypoints[i].pt, (1 << imgKeypoints[i].octave)*15, Scalar(0,255,0), 1 );
|
|
}
|
|
|
|
imwrite("correspond.png", correspond );
|
|
imshow( "Object", objectColor );
|
|
imshow( "Image", imageColor );
|
|
|
|
waitKey(0);
|
|
|
|
return 0;
|
|
}
|