mirror of
https://github.com/opencv/opencv.git
synced 2024-12-17 19:08:01 +08:00
ed86bd34b1
cuda_canny : multi stream safety (#11483) * CUDA_ImgProc/Canny Asynchronous test * cuda_canny : multi stream safety (1/3) - Convert global variable canny::counter to class local variable * cuda_canny : multi stream safety (2/3) - Use texture objects rather than texture references for cc >= 3.0, since a texture reference must be declared as a static global variable, which results in a race condition when run concurrently * cuda_canny : multi stream safety (3/3) - Refrain from using global variables in row_filter and column_filter (converts column_filter::c_kernel and row_filter::c_kernel to local variables) * Fixes #11193
161 lines
5.7 KiB
C++
161 lines
5.7 KiB
C++
/*M///////////////////////////////////////////////////////////////////////////////////////
|
|
//
|
|
// IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING.
|
|
//
|
|
// By downloading, copying, installing or using the software you agree to this license.
|
|
// If you do not agree to this license, do not download, install,
|
|
// copy or use the software.
|
|
//
|
|
//
|
|
// License Agreement
|
|
// For Open Source Computer Vision Library
|
|
//
|
|
// Copyright (C) 2000-2008, Intel Corporation, all rights reserved.
|
|
// Copyright (C) 2009, Willow Garage Inc., all rights reserved.
|
|
// Third party copyrights are property of their respective owners.
|
|
//
|
|
// Redistribution and use in source and binary forms, with or without modification,
|
|
// are permitted provided that the following conditions are met:
|
|
//
|
|
// * Redistribution's of source code must retain the above copyright notice,
|
|
// this list of conditions and the following disclaimer.
|
|
//
|
|
// * Redistribution's in binary form must reproduce the above copyright notice,
|
|
// this list of conditions and the following disclaimer in the documentation
|
|
// and/or other materials provided with the distribution.
|
|
//
|
|
// * The name of the copyright holders may not be used to endorse or promote products
|
|
// derived from this software without specific prior written permission.
|
|
//
|
|
// This software is provided by the copyright holders and contributors "as is" and
|
|
// any express or implied warranties, including, but not limited to, the implied
|
|
// warranties of merchantability and fitness for a particular purpose are disclaimed.
|
|
// In no event shall the Intel Corporation or contributors be liable for any direct,
|
|
// indirect, incidental, special, exemplary, or consequential damages
|
|
// (including, but not limited to, procurement of substitute goods or services;
|
|
// loss of use, data, or profits; or business interruption) however caused
|
|
// and on any theory of liability, whether in contract, strict liability,
|
|
// or tort (including negligence or otherwise) arising in any way out of
|
|
// the use of this software, even if advised of the possibility of such damage.
|
|
//
|
|
//M*/
|
|
|
|
#include "test_precomp.hpp"
|
|
|
|
#ifdef HAVE_CUDA
|
|
|
|
namespace opencv_test { namespace {
|
|
|
|
////////////////////////////////////////////////////////
|
|
// Canny
|
|
|
|
namespace
|
|
{
|
|
IMPLEMENT_PARAM_CLASS(AppertureSize, int)
|
|
IMPLEMENT_PARAM_CLASS(L2gradient, bool)
|
|
}
|
|
|
|
// Fixture shared by the CUDA Canny tests. It is parameterized over
// (device, aperture size, L2-gradient flag, ROI flag), in that order.
PARAM_TEST_CASE(Canny, cv::cuda::DeviceInfo, AppertureSize, L2gradient, UseRoi)
{
    cv::cuda::DeviceInfo devInfo;   // device the test runs on
    int apperture_size;             // aperture size passed to the detectors
    bool useL2gradient;             // L2-gradient flag passed to the detectors
    bool useRoi;                    // forwarded to loadMat() when uploading the input

    // Unpacks the test parameters into the members above and makes the
    // requested device current.
    virtual void SetUp()
    {
        devInfo = GET_PARAM(0);
        cv::cuda::setDevice(devInfo.deviceID());

        apperture_size = GET_PARAM(1);
        useL2gradient = GET_PARAM(2);
        useRoi = GET_PARAM(3);
    }
};
|
|
|
|
// Runs the CUDA Canny detector and cv::Canny on the same image with the same
// settings and expects the two edge maps to be similar.
CUDA_TEST_P(Canny, Accuracy)
{
    cv::Mat src = readImage("stereobm/aloe-L.png", cv::IMREAD_GRAYSCALE);
    ASSERT_FALSE(src.empty());

    double low_thresh = 50.0;
    double high_thresh = 100.0;

    // Result from the CUDA implementation.
    cv::Ptr<cv::cuda::CannyEdgeDetector> detector =
        cv::cuda::createCannyEdgeDetector(low_thresh, high_thresh, apperture_size, useL2gradient);

    cv::cuda::GpuMat d_edges;
    detector->detect(loadMat(src, useRoi), d_edges);

    // Reference result from cv::Canny.
    cv::Mat reference;
    cv::Canny(src, reference, low_thresh, high_thresh, apperture_size, useL2gradient);

    // The check is a similarity comparison with a 2e-2 threshold, not an exact match.
    EXPECT_MAT_SIMILAR(reference, d_edges, 2e-2);
}
|
|
|
|
class CannyAsyncParallelLoopBody : public cv::ParallelLoopBody
|
|
{
|
|
public:
|
|
CannyAsyncParallelLoopBody(const cv::cuda::GpuMat& d_img_, cv::cuda::GpuMat* edges_, double low_thresh_, double high_thresh_, int apperture_size_, bool useL2gradient_)
|
|
: d_img(d_img_), edges(edges_), low_thresh(low_thresh_), high_thresh(high_thresh_), apperture_size(apperture_size_), useL2gradient(useL2gradient_) {}
|
|
~CannyAsyncParallelLoopBody() {};
|
|
void operator()(const cv::Range& r) const
|
|
{
|
|
for (int i = r.start; i < r.end; i++) {
|
|
cv::cuda::Stream stream;
|
|
cv::Ptr<cv::cuda::CannyEdgeDetector> canny = cv::cuda::createCannyEdgeDetector(low_thresh, high_thresh, apperture_size, useL2gradient);
|
|
canny->detect(d_img, edges[i], stream);
|
|
stream.waitForCompletion();
|
|
}
|
|
}
|
|
protected:
|
|
const cv::cuda::GpuMat& d_img;
|
|
cv::cuda::GpuMat* edges;
|
|
double low_thresh;
|
|
double high_thresh;
|
|
int apperture_size;
|
|
bool useL2gradient;
|
|
};
|
|
|
|
// Number of loop iterations (each with its own stream and output buffer) that the Canny Async test runs.
#define NUM_STREAMS 64
|
|
|
|
// Runs Canny once without an explicit stream, then NUM_STREAMS more times
// through cv::parallel_for_ (one stream per run), and expects every
// stream-based result to match the first one exactly.
CUDA_TEST_P(Canny, Async)
{
    // Skip when the device lacks FEATURE_SET_COMPUTE_30; the skip message
    // ties this requirement to texture-object support.
    if (!supportFeature(devInfo, cv::cuda::FEATURE_SET_COMPUTE_30))
    {
        throw SkipTestException("CUDA device doesn't support texture objects");
    }

    const cv::Mat src = readImage("stereobm/aloe-L.png", cv::IMREAD_GRAYSCALE);
    ASSERT_FALSE(src.empty());

    const cv::cuda::GpuMat d_src = loadMat(src, useRoi);

    double low_thresh = 50.0;
    double high_thresh = 100.0;

    // Synchronous call: produces the reference edge map.
    cv::Ptr<cv::cuda::CannyEdgeDetector> detector =
        cv::cuda::createCannyEdgeDetector(low_thresh, high_thresh, apperture_size, useL2gradient);
    cv::cuda::GpuMat d_expected;
    detector->detect(d_src, d_expected);

    // Asynchronous calls: one output buffer per loop index.
    cv::cuda::GpuMat d_results[NUM_STREAMS];
    cv::parallel_for_(cv::Range(0, NUM_STREAMS),
                      CannyAsyncParallelLoopBody(d_src, d_results, low_thresh, high_thresh, apperture_size, useL2gradient));

    // Each stream-based result must equal the synchronous one (tolerance 0.0).
    for (int idx = 0; idx < NUM_STREAMS; ++idx)
    {
        EXPECT_MAT_NEAR(d_expected, d_results[idx], 0.0);
    }
}
|
|
|
|
// Instantiates the Canny tests for every combination of device,
// aperture size (3, 5, 7), L2-gradient flag (off, on) and the WHOLE_SUBMAT
// ROI parameter set.
INSTANTIATE_TEST_CASE_P(
    CUDA_ImgProc,
    Canny,
    testing::Combine(
        ALL_DEVICES,
        testing::Values(AppertureSize(3), AppertureSize(5), AppertureSize(7)),
        testing::Values(L2gradient(false), L2gradient(true)),
        WHOLE_SUBMAT));
|
|
|
|
|
|
}} // namespace
|
|
#endif // HAVE_CUDA
|