2010-05-12 01:44:00 +08:00
|
|
|
/*M///////////////////////////////////////////////////////////////////////////////////////
|
|
|
|
//
|
|
|
|
// IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING.
|
|
|
|
//
|
|
|
|
// By downloading, copying, installing or using the software you agree to this license.
|
|
|
|
// If you do not agree to this license, do not download, install,
|
|
|
|
// copy or use the software.
|
|
|
|
//
|
|
|
|
//
|
2014-07-30 03:54:23 +08:00
|
|
|
// License Agreement
|
|
|
|
// For Open Source Computer Vision Library
|
2010-05-12 01:44:00 +08:00
|
|
|
//
|
|
|
|
// Copyright (C) 2000, Intel Corporation, all rights reserved.
|
2014-07-30 03:54:23 +08:00
|
|
|
// Copyright (C) 2014, Itseez Inc, all rights reserved.
|
2010-05-12 01:44:00 +08:00
|
|
|
// Third party copyrights are property of their respective owners.
|
|
|
|
//
|
|
|
|
// Redistribution and use in source and binary forms, with or without modification,
|
|
|
|
// are permitted provided that the following conditions are met:
|
|
|
|
//
|
|
|
|
// * Redistribution's of source code must retain the above copyright notice,
|
|
|
|
// this list of conditions and the following disclaimer.
|
|
|
|
//
|
|
|
|
// * Redistribution's in binary form must reproduce the above copyright notice,
|
|
|
|
// this list of conditions and the following disclaimer in the documentation
|
|
|
|
// and/or other materials provided with the distribution.
|
|
|
|
//
|
2014-07-30 03:54:23 +08:00
|
|
|
// * The name of the copyright holders may not be used to endorse or promote products
|
2010-05-12 01:44:00 +08:00
|
|
|
// derived from this software without specific prior written permission.
|
|
|
|
//
|
|
|
|
// This software is provided by the copyright holders and contributors "as is" and
|
|
|
|
// any express or implied warranties, including, but not limited to, the implied
|
|
|
|
// warranties of merchantability and fitness for a particular purpose are disclaimed.
|
|
|
|
// In no event shall the Intel Corporation or contributors be liable for any direct,
|
|
|
|
// indirect, incidental, special, exemplary, or consequential damages
|
|
|
|
// (including, but not limited to, procurement of substitute goods or services;
|
|
|
|
// loss of use, data, or profits; or business interruption) however caused
|
|
|
|
// and on any theory of liability, whether in contract, strict liability,
|
|
|
|
// or tort (including negligence or otherwise) arising in any way out of
|
|
|
|
// the use of this software, even if advised of the possibility of such damage.
|
|
|
|
//
|
|
|
|
//M*/
|
|
|
|
|
|
|
|
#include "precomp.hpp"
|
|
|
|
|
|
|
|
/****************************************************************************************\
|
2014-07-30 03:54:23 +08:00
|
|
|
* K-Nearest Neighbors Classifier *
|
2010-05-12 01:44:00 +08:00
|
|
|
\****************************************************************************************/
|
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
namespace cv {
|
|
|
|
namespace ml {
|
2010-05-12 01:44:00 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
class KNearestImpl : public KNearest
|
2010-05-12 01:44:00 +08:00
|
|
|
{
|
2014-07-30 03:54:23 +08:00
|
|
|
public:
|
|
|
|
KNearestImpl(bool __isClassifier=true)
|
2010-05-12 01:44:00 +08:00
|
|
|
{
|
2014-07-30 03:54:23 +08:00
|
|
|
defaultK = 3;
|
|
|
|
_isClassifier = __isClassifier;
|
2010-05-12 01:44:00 +08:00
|
|
|
}
|
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
// Virtual destructor; the body is intentionally empty.
virtual ~KNearestImpl()
{
}
|
2010-05-12 01:44:00 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
// Returns the classifier/regressor flag the model was created (or loaded) with.
bool isClassifier() const
{
    return _isClassifier;
}
|
|
|
|
// The model counts as trained when the stored sample matrix is non-empty.
bool isTrained() const
{
    const bool noStoredSamples = samples.empty();
    return !noStoredSamples;
}
|
2010-05-12 01:44:00 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
// Name under which this model type identifies itself.
String getDefaultModelName() const
{
    return String("opencv_ml_knn");
}
|
2010-05-12 01:44:00 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
void clear()
|
2010-05-12 01:44:00 +08:00
|
|
|
{
|
2014-07-30 03:54:23 +08:00
|
|
|
samples.release();
|
|
|
|
responses.release();
|
2010-05-12 01:44:00 +08:00
|
|
|
}
|
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
// Number of variables per sample, i.e. the column count of the stored sample matrix.
int getVarCount() const
{
    return samples.cols;
}
|
2010-05-12 01:44:00 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
bool train( const Ptr<TrainData>& data, int flags )
|
|
|
|
{
|
|
|
|
Mat new_samples = data->getTrainSamples(ROW_SAMPLE);
|
|
|
|
Mat new_responses;
|
|
|
|
data->getTrainResponses().convertTo(new_responses, CV_32F);
|
|
|
|
bool update = (flags & UPDATE_MODEL) != 0 && !samples.empty();
|
|
|
|
|
|
|
|
CV_Assert( new_samples.type() == CV_32F );
|
2010-05-12 01:44:00 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
if( !update )
|
|
|
|
{
|
|
|
|
clear();
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
CV_Assert( new_samples.cols == samples.cols &&
|
|
|
|
new_responses.cols == responses.cols );
|
|
|
|
}
|
2010-05-12 01:44:00 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
samples.push_back(new_samples);
|
|
|
|
responses.push_back(new_responses);
|
2012-06-15 21:04:17 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
return true;
|
|
|
|
}
|
2010-05-12 01:44:00 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
void findNearestCore( const Mat& _samples, int k0, const Range& range,
|
|
|
|
Mat* results, Mat* neighbor_responses,
|
|
|
|
Mat* dists, float* presult ) const
|
|
|
|
{
|
|
|
|
int testidx, baseidx, i, j, d = samples.cols, nsamples = samples.rows;
|
|
|
|
int testcount = range.end - range.start;
|
|
|
|
int k = std::min(k0, nsamples);
|
2010-05-12 01:44:00 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
AutoBuffer<float> buf(testcount*k*2);
|
|
|
|
float* dbuf = buf;
|
|
|
|
float* rbuf = dbuf + testcount*k;
|
2010-05-12 01:44:00 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
const float* rptr = responses.ptr<float>();
|
2010-05-12 01:44:00 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
for( testidx = 0; testidx < testcount; testidx++ )
|
|
|
|
{
|
|
|
|
for( i = 0; i < k; i++ )
|
|
|
|
{
|
|
|
|
dbuf[testidx*k + i] = FLT_MAX;
|
|
|
|
rbuf[testidx*k + i] = 0.f;
|
|
|
|
}
|
|
|
|
}
|
2010-05-12 01:44:00 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
for( baseidx = 0; baseidx < nsamples; baseidx++ )
|
2010-05-12 01:44:00 +08:00
|
|
|
{
|
2014-07-30 03:54:23 +08:00
|
|
|
for( testidx = 0; testidx < testcount; testidx++ )
|
2010-05-12 01:44:00 +08:00
|
|
|
{
|
2014-07-30 03:54:23 +08:00
|
|
|
const float* v = samples.ptr<float>(baseidx);
|
|
|
|
const float* u = _samples.ptr<float>(testidx + range.start);
|
|
|
|
|
|
|
|
float s = 0;
|
|
|
|
for( i = 0; i <= d - 4; i += 4 )
|
2010-05-12 01:44:00 +08:00
|
|
|
{
|
2014-07-30 03:54:23 +08:00
|
|
|
float t0 = u[i] - v[i], t1 = u[i+1] - v[i+1];
|
|
|
|
float t2 = u[i+2] - v[i+2], t3 = u[i+3] - v[i+3];
|
|
|
|
s += t0*t0 + t1*t1 + t2*t2 + t3*t3;
|
2010-05-12 01:44:00 +08:00
|
|
|
}
|
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
for( ; i < d; i++ )
|
2010-05-12 01:44:00 +08:00
|
|
|
{
|
2014-07-30 03:54:23 +08:00
|
|
|
float t0 = u[i] - v[i];
|
|
|
|
s += t0*t0;
|
2010-05-12 01:44:00 +08:00
|
|
|
}
|
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
Cv32suf si;
|
|
|
|
si.f = (float)s;
|
|
|
|
Cv32suf* dd = (Cv32suf*)(&dbuf[testidx*k]);
|
|
|
|
float* nr = &rbuf[testidx*k];
|
|
|
|
|
|
|
|
for( i = k; i > 0; i-- )
|
|
|
|
if( si.i >= dd[i-1].i )
|
2010-05-12 01:44:00 +08:00
|
|
|
break;
|
2014-07-30 03:54:23 +08:00
|
|
|
if( i >= k )
|
2010-05-12 01:44:00 +08:00
|
|
|
continue;
|
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
for( j = k-2; j >= i; j-- )
|
2010-05-12 01:44:00 +08:00
|
|
|
{
|
2014-07-30 03:54:23 +08:00
|
|
|
dd[j+1].i = dd[j].i;
|
|
|
|
nr[j+1] = nr[j];
|
2010-05-12 01:44:00 +08:00
|
|
|
}
|
2014-07-30 03:54:23 +08:00
|
|
|
dd[i].i = si.i;
|
|
|
|
nr[i] = rptr[baseidx];
|
2010-05-12 01:44:00 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
float result = 0.f;
|
|
|
|
float inv_scale = 1./k;
|
2010-05-12 01:44:00 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
for( testidx = 0; testidx < testcount; testidx++ )
|
2010-05-12 01:44:00 +08:00
|
|
|
{
|
2014-07-30 03:54:23 +08:00
|
|
|
if( neighbor_responses )
|
2010-05-12 01:44:00 +08:00
|
|
|
{
|
2014-07-30 03:54:23 +08:00
|
|
|
float* nr = neighbor_responses->ptr<float>(testidx + range.start);
|
|
|
|
for( j = 0; j < k; j++ )
|
|
|
|
nr[j] = rbuf[testidx*k + j];
|
|
|
|
for( ; j < k0; j++ )
|
|
|
|
nr[j] = 0.f;
|
2010-05-12 01:44:00 +08:00
|
|
|
}
|
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
if( dists )
|
|
|
|
{
|
|
|
|
float* dptr = dists->ptr<float>(testidx + range.start);
|
|
|
|
for( j = 0; j < k; j++ )
|
|
|
|
dptr[j] = dbuf[testidx*k + j];
|
|
|
|
for( ; j < k0; j++ )
|
|
|
|
dptr[j] = 0.f;
|
|
|
|
}
|
2010-05-12 01:44:00 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
if( results || testidx+range.start == 0 )
|
|
|
|
{
|
|
|
|
if( !_isClassifier || k == 1 )
|
2010-05-12 01:44:00 +08:00
|
|
|
{
|
2014-07-30 03:54:23 +08:00
|
|
|
float s = 0.f;
|
|
|
|
for( j = 0; j < k; j++ )
|
|
|
|
s += rbuf[testidx*k + j];
|
|
|
|
result = (float)(s*inv_scale);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
float* rp = rbuf + testidx*k;
|
|
|
|
for( j = k-1; j > 0; j-- )
|
|
|
|
{
|
|
|
|
bool swap_fl = false;
|
|
|
|
for( i = 0; i < j; i++ )
|
2010-05-12 01:44:00 +08:00
|
|
|
{
|
2014-07-30 03:54:23 +08:00
|
|
|
if( rp[i] > rp[i+1] )
|
|
|
|
{
|
|
|
|
std::swap(rp[i], rp[i+1]);
|
|
|
|
swap_fl = true;
|
|
|
|
}
|
2010-05-12 01:44:00 +08:00
|
|
|
}
|
2014-07-30 03:54:23 +08:00
|
|
|
if( !swap_fl )
|
|
|
|
break;
|
|
|
|
}
|
2010-05-12 01:44:00 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
result = rp[0];
|
|
|
|
int prev_start = 0;
|
|
|
|
int best_count = 0;
|
|
|
|
for( j = 1; j <= k; j++ )
|
2010-05-12 01:44:00 +08:00
|
|
|
{
|
2014-07-30 03:54:23 +08:00
|
|
|
if( j == k || rp[j] != rp[j-1] )
|
2010-05-12 01:44:00 +08:00
|
|
|
{
|
2014-07-30 03:54:23 +08:00
|
|
|
int count = j - prev_start;
|
|
|
|
if( best_count < count )
|
|
|
|
{
|
|
|
|
best_count = count;
|
|
|
|
result = rp[j-1];
|
|
|
|
}
|
|
|
|
prev_start = j;
|
2010-05-12 01:44:00 +08:00
|
|
|
}
|
|
|
|
}
|
2014-07-30 03:54:23 +08:00
|
|
|
}
|
|
|
|
if( results )
|
|
|
|
results->at<float>(testidx + range.start) = result;
|
|
|
|
if( presult && testidx+range.start == 0 )
|
|
|
|
*presult = result;
|
2010-05-12 01:44:00 +08:00
|
|
|
}
|
|
|
|
}
|
2014-07-30 03:54:23 +08:00
|
|
|
}
|
2010-05-12 01:44:00 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
struct findKNearestInvoker : public ParallelLoopBody
|
|
|
|
{
|
|
|
|
findKNearestInvoker(const KNearestImpl* _p, int _k, const Mat& __samples,
|
|
|
|
Mat* __results, Mat* __neighbor_responses, Mat* __dists, float* _presult)
|
2010-05-12 01:44:00 +08:00
|
|
|
{
|
2014-07-30 03:54:23 +08:00
|
|
|
p = _p;
|
|
|
|
k = _k;
|
|
|
|
_samples = &__samples;
|
|
|
|
_results = __results;
|
|
|
|
_neighbor_responses = __neighbor_responses;
|
|
|
|
_dists = __dists;
|
|
|
|
presult = _presult;
|
2010-05-12 01:44:00 +08:00
|
|
|
}
|
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
void operator()( const Range& range ) const
|
2010-05-12 01:44:00 +08:00
|
|
|
{
|
2014-07-30 03:54:23 +08:00
|
|
|
int delta = std::min(range.end - range.start, 256);
|
|
|
|
for( int start = range.start; start < range.end; start += delta )
|
|
|
|
{
|
|
|
|
p->findNearestCore( *_samples, k, Range(start, std::min(start + delta, range.end)),
|
|
|
|
_results, _neighbor_responses, _dists, presult );
|
|
|
|
}
|
2010-05-12 01:44:00 +08:00
|
|
|
}
|
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
const KNearestImpl* p;
|
|
|
|
int k;
|
|
|
|
const Mat* _samples;
|
|
|
|
Mat* _results;
|
|
|
|
Mat* _neighbor_responses;
|
|
|
|
Mat* _dists;
|
|
|
|
float* presult;
|
|
|
|
};
|
|
|
|
|
|
|
|
// Finds the k nearest stored samples for every row of `_samples`.
//   _samples           - CV_32F query matrix with as many columns as the stored samples.
//   k                  - requested neighbour count, must be positive.
//   _results           - if needed: (rows x 1) CV_32F predictions.
//   _neighborResponses - if needed: (rows x k) CV_32F neighbour responses.
//   _dists             - if needed: (rows x k) CV_32F neighbour distances.
// Returns the prediction for the first query row, or 0 when there are no
// query rows (in which case all three outputs are released).
float findNearest( InputArray _samples, int k,
                   OutputArray _results,
                   OutputArray _neighborResponses,
                   OutputArray _dists ) const
{
    CV_Assert( 0 < k );

    Mat queries = _samples.getMat();
    CV_Assert( queries.type() == CV_32F && queries.cols == samples.cols );

    const int queryCount = queries.rows;
    if( queryCount == 0 )
    {
        _results.release();
        _neighborResponses.release();
        _dists.release();
        return 0.f;
    }

    // Each output is only allocated, and only handed to the worker,
    // when the caller actually asked for it.
    Mat resultsMat, responsesMat, distsMat;
    Mat* resultsPtr = 0;
    Mat* responsesPtr = 0;
    Mat* distsPtr = 0;

    if( _results.needed() )
    {
        _results.create(queryCount, 1, CV_32F);
        resultsMat = _results.getMat();
        resultsPtr = &resultsMat;
    }
    if( _neighborResponses.needed() )
    {
        _neighborResponses.create(queryCount, k, CV_32F);
        responsesMat = _neighborResponses.getMat();
        responsesPtr = &responsesMat;
    }
    if( _dists.needed() )
    {
        _dists.create(queryCount, k, CV_32F);
        distsMat = _dists.getMat();
        distsPtr = &distsMat;
    }

    // The worker handling query row 0 writes its prediction here.
    float firstPrediction = 0.f;
    findKNearestInvoker invoker(this, k, queries, resultsPtr, responsesPtr, distsPtr,
                                &firstPrediction);
    parallel_for_(Range(0, queryCount), invoker);

    return firstPrediction;
}
|
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
// Predicts responses for `inputs` with the default neighbour count.
// Neighbour responses and distances are not requested; the unnamed flags
// argument is ignored. Returns whatever findNearest() returns.
float predict(InputArray inputs, OutputArray outputs, int) const
{
    const int neighbourCount = defaultK;
    return findNearest( inputs, neighbourCount, outputs, noArray(), noArray() );
}
|
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
// Serialises the model: the classifier flag (as an integer), the stored
// samples and the stored responses. defaultK is not written.
void write( FileStorage& fs ) const
{
    const int classifierFlag = _isClassifier ? 1 : 0;

    fs << "is_classifier" << classifierFlag;
    fs << "samples" << samples;
    fs << "responses" << responses;
}
|
2012-06-15 21:04:17 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
void read( const FileNode& fn )
|
2010-05-12 01:44:00 +08:00
|
|
|
{
|
2014-07-30 03:54:23 +08:00
|
|
|
clear();
|
|
|
|
_isClassifier = (int)fn["is_classifier"] != 0;
|
|
|
|
|
|
|
|
fn["samples"] >> samples;
|
|
|
|
fn["responses"] >> responses;
|
2010-05-12 01:44:00 +08:00
|
|
|
}
|
2012-06-15 21:04:17 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
// Sets the neighbour count used by predict(); the value is stored as given.
void setDefaultK(int _k)
{
    defaultK = _k;
}
|
|
|
|
// Neighbour count currently used by predict().
int getDefaultK() const
{
    return defaultK;
}
|
2010-05-12 01:44:00 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
// Stored training samples, one sample per row (filled by train() and read()).
Mat samples;
|
|
|
|
// Stored responses (train() converts them to CV_32F); findNearestCore reads
// entry i as the response of sample row i.
Mat responses;
|
|
|
|
// Classifier/regressor flag set by the constructor and by read().
bool _isClassifier;
|
|
|
|
// Neighbour count used by predict(); initialised to 3 by the constructor.
int defaultK;
|
|
|
|
};
|
2010-11-03 01:58:22 +08:00
|
|
|
|
2014-07-30 03:54:23 +08:00
|
|
|
// Factory: builds the concrete KNearestImpl and returns it through the
// KNearest interface. `isClassifier` is forwarded to the implementation's
// constructor.
Ptr<KNearest> KNearest::create(bool isClassifier)
{
    Ptr<KNearest> model = makePtr<KNearestImpl>(isClassifier);
    return model;
}
|
|
|
|
|
|
|
|
}
|
2010-11-03 01:58:22 +08:00
|
|
|
}
|
|
|
|
|
2010-05-12 01:44:00 +08:00
|
|
|
/* End of file */
|