mirror of
https://github.com/opencv/opencv.git
synced 2024-11-25 11:40:44 +08:00
C.C. Labeling: added stream support
This commit is contained in:
parent
350621057f
commit
51433a9331
@ -918,7 +918,7 @@ CV_EXPORTS void graphcut(GpuMat& terminals, GpuMat& leftTransp, GpuMat& rightTra
|
|||||||
GpuMat& buf, Stream& stream = Stream::Null());
|
GpuMat& buf, Stream& stream = Stream::Null());
|
||||||
|
|
||||||
//! performs connected componnents labeling.
|
//! performs connected componnents labeling.
|
||||||
CV_EXPORTS void labelComponents(const GpuMat& image, GpuMat& mask, GpuMat& components, const cv::Scalar& lo, const cv::Scalar& hi);
|
CV_EXPORTS void labelComponents(const GpuMat& image, GpuMat& mask, GpuMat& components, const cv::Scalar& lo, const cv::Scalar& hi, Stream& stream = Stream::Null());
|
||||||
|
|
||||||
////////////////////////////////// Histograms //////////////////////////////////
|
////////////////////////////////// Histograms //////////////////////////////////
|
||||||
|
|
||||||
|
@ -83,7 +83,7 @@ namespace cv { namespace gpu { namespace device
|
|||||||
};
|
};
|
||||||
|
|
||||||
template<typename F>
|
template<typename F>
|
||||||
__global__ void computeComponents(const DevMem2D image, DevMem2D components, F connected)
|
__global__ void computeConnectivity(const DevMem2D image, DevMem2D components, F connected)
|
||||||
{
|
{
|
||||||
int x = threadIdx.x + blockIdx.x * blockDim.x;
|
int x = threadIdx.x + blockIdx.x * blockDim.x;
|
||||||
int y = threadIdx.y + blockIdx.y * blockDim.y;
|
int y = threadIdx.y + blockIdx.y * blockDim.y;
|
||||||
@ -108,15 +108,16 @@ namespace cv { namespace gpu { namespace device
|
|||||||
components(y, x) = c;
|
components(y, x) = c;
|
||||||
}
|
}
|
||||||
|
|
||||||
void computeEdges(const DevMem2D& image, DevMem2D components, const int lo, const int hi)
|
void computeEdges(const DevMem2D& image, DevMem2D edges, const int lo, const int hi, cudaStream_t stream)
|
||||||
{
|
{
|
||||||
dim3 block(CTA_SIZE_X, CTA_SIZE_Y);
|
dim3 block(CTA_SIZE_X, CTA_SIZE_Y);
|
||||||
dim3 grid(divUp(image.cols, block.x), divUp(image.rows, block.y));
|
dim3 grid(divUp(image.cols, block.x), divUp(image.rows, block.y));
|
||||||
InInterval<int> inInt(lo, hi);
|
InInterval<int> inInt(lo, hi);
|
||||||
computeComponents<InInterval<int> ><<<grid, block>>>(image, components, inInt);
|
computeConnectivity<InInterval<int> ><<<grid, block, 0, stream>>>(image, edges, inInt);
|
||||||
|
|
||||||
cudaSafeCall( cudaGetLastError() );
|
cudaSafeCall( cudaGetLastError() );
|
||||||
cudaSafeCall( cudaDeviceSynchronize() );
|
if (stream == 0)
|
||||||
|
cudaSafeCall( cudaDeviceSynchronize() );
|
||||||
}
|
}
|
||||||
|
|
||||||
__global__ void lableTiles(const DevMem2D edges, DevMem2Di comps)
|
__global__ void lableTiles(const DevMem2D edges, DevMem2Di comps)
|
||||||
@ -384,25 +385,25 @@ namespace cv { namespace gpu { namespace device
|
|||||||
comps(y, x) = root(comps, comps(y, x));
|
comps(y, x) = root(comps, comps(y, x));
|
||||||
}
|
}
|
||||||
|
|
||||||
void labelComponents(const DevMem2D& edges, DevMem2Di comps)
|
void labelComponents(const DevMem2D& edges, DevMem2Di comps, cudaStream_t stream)
|
||||||
{
|
{
|
||||||
dim3 block(CTA_SIZE_X, CTA_SIZE_Y);
|
dim3 block(CTA_SIZE_X, CTA_SIZE_Y);
|
||||||
dim3 grid(divUp(edges.cols, TILE_COLS), divUp(edges.rows, TILE_ROWS));
|
dim3 grid(divUp(edges.cols, TILE_COLS), divUp(edges.rows, TILE_ROWS));
|
||||||
|
|
||||||
lableTiles<<<grid, block>>>(edges, comps);
|
lableTiles<<<grid, block, 0, stream>>>(edges, comps);
|
||||||
cudaSafeCall( cudaGetLastError() );
|
cudaSafeCall( cudaGetLastError() );
|
||||||
|
|
||||||
int tileSizeX = TILE_COLS, tileSizeY = TILE_ROWS;
|
int tileSizeX = TILE_COLS, tileSizeY = TILE_ROWS;
|
||||||
|
|
||||||
cudaSafeCall( cudaGetLastError() );
|
cudaSafeCall( cudaGetLastError() );
|
||||||
cudaSafeCall( cudaDeviceSynchronize() );
|
// cudaSafeCall( cudaDeviceSynchronize() );
|
||||||
|
|
||||||
while (grid.x > 1 || grid.y > 1)
|
while (grid.x > 1 || grid.y > 1)
|
||||||
{
|
{
|
||||||
dim3 mergeGrid(ceilf(grid.x / 2.0), ceilf(grid.y / 2.0));
|
dim3 mergeGrid(ceilf(grid.x / 2.0), ceilf(grid.y / 2.0));
|
||||||
dim3 mergeBlock(STA_SIZE_MARGE_X, STA_SIZE_MARGE_Y);
|
dim3 mergeBlock(STA_SIZE_MARGE_X, STA_SIZE_MARGE_Y);
|
||||||
std::cout << "merging: " << grid.y << " x " << grid.x << " ---> " << mergeGrid.y << " x " << mergeGrid.x << " for tiles: " << tileSizeY << " x " << tileSizeX << std::endl;
|
std::cout << "merging: " << grid.y << " x " << grid.x << " ---> " << mergeGrid.y << " x " << mergeGrid.x << " for tiles: " << tileSizeY << " x " << tileSizeX << std::endl;
|
||||||
crossMerge<<<mergeGrid, mergeBlock>>>(2, 2, tileSizeY, tileSizeX, edges, comps, ceilf(grid.y / 2.0) - grid.y / 2, ceilf(grid.x / 2.0) - grid.x / 2);
|
crossMerge<<<mergeGrid, mergeBlock, 0, stream>>>(2, 2, tileSizeY, tileSizeX, edges, comps, ceilf(grid.y / 2.0) - grid.y / 2, ceilf(grid.x / 2.0) - grid.x / 2);
|
||||||
tileSizeX <<= 1;
|
tileSizeX <<= 1;
|
||||||
tileSizeY <<= 1;
|
tileSizeY <<= 1;
|
||||||
grid = mergeGrid;
|
grid = mergeGrid;
|
||||||
@ -412,9 +413,10 @@ namespace cv { namespace gpu { namespace device
|
|||||||
|
|
||||||
grid.x = divUp(edges.cols, block.x);
|
grid.x = divUp(edges.cols, block.x);
|
||||||
grid.y = divUp(edges.rows, block.y);
|
grid.y = divUp(edges.rows, block.y);
|
||||||
flatten<<<grid, block>>>(edges, comps);
|
flatten<<<grid, block, 0, stream>>>(edges, comps);
|
||||||
cudaSafeCall( cudaGetLastError() );
|
cudaSafeCall( cudaGetLastError() );
|
||||||
cudaSafeCall( cudaDeviceSynchronize() );
|
if (stream == 0)
|
||||||
|
cudaSafeCall( cudaDeviceSynchronize() );
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
} } }
|
} } }
|
@ -47,7 +47,7 @@
|
|||||||
void cv::gpu::graphcut(GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, Stream&) { throw_nogpu(); }
|
void cv::gpu::graphcut(GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, Stream&) { throw_nogpu(); }
|
||||||
void cv::gpu::graphcut(GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, Stream&) { throw_nogpu(); }
|
void cv::gpu::graphcut(GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, GpuMat&, Stream&) { throw_nogpu(); }
|
||||||
|
|
||||||
void cv::gpu::labelComponents(const GpuMat& image, GpuMat& mask, GpuMat& components, const cv::Scalar& lo, const cv::Scalar& hi) { throw_nogpu(); }
|
void cv::gpu::labelComponents(const GpuMat&, GpuMat&, GpuMat&, const cv::Scalar&, const cv::Scalar&, Stream&) { throw_nogpu(); }
|
||||||
|
|
||||||
#else /* !defined (HAVE_CUDA) */
|
#else /* !defined (HAVE_CUDA) */
|
||||||
|
|
||||||
@ -55,15 +55,28 @@ namespace cv { namespace gpu { namespace device
|
|||||||
{
|
{
|
||||||
namespace ccl
|
namespace ccl
|
||||||
{
|
{
|
||||||
void labelComponents(const DevMem2D& edges, DevMem2Di comps);
|
void labelComponents(const DevMem2D& edges, DevMem2Di comps, cudaStream_t stream);
|
||||||
void computeEdges(const DevMem2D& image, DevMem2D edges, const int lo, const int hi);
|
void computeEdges(const DevMem2D& image, DevMem2D edges, const int lo, const int hi, cudaStream_t stream);
|
||||||
}
|
}
|
||||||
}}}
|
}}}
|
||||||
|
|
||||||
void cv::gpu::labelComponents(const GpuMat& image, GpuMat& mask, GpuMat& components, const cv::Scalar& lo, const cv::Scalar& hi)
|
void cv::gpu::labelComponents(const GpuMat& image, GpuMat& mask, GpuMat& components, const cv::Scalar& lo, const cv::Scalar& hi, Stream& s)
|
||||||
{
|
{
|
||||||
device::ccl::computeEdges(image, mask, lo[0], hi[0]);
|
CV_Assert(!image.empty());
|
||||||
device::ccl::labelComponents(mask, components);
|
|
||||||
|
int type = image.type();
|
||||||
|
CV_Assert(type == CV_8UC1);
|
||||||
|
|
||||||
|
if (image.size() != mask.size() || mask.type() != CV_8UC1)
|
||||||
|
mask.create(image.size(), CV_8UC1);
|
||||||
|
|
||||||
|
if (image.size() != components.size() || components.type() != CV_32SC1)
|
||||||
|
components.create(image.size(), CV_32SC1);
|
||||||
|
|
||||||
|
cudaStream_t stream = StreamAccessor::getStream(s);
|
||||||
|
|
||||||
|
device::ccl::computeEdges(image, mask, lo[0], hi[0], stream);
|
||||||
|
device::ccl::labelComponents(mask, components, stream);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
@ -63,9 +63,6 @@ TEST_P(Labeling, ConnectedComponents)
|
|||||||
{
|
{
|
||||||
cv::Mat image;
|
cv::Mat image;
|
||||||
cvtColor(loat_image(), image, CV_BGR2GRAY);
|
cvtColor(loat_image(), image, CV_BGR2GRAY);
|
||||||
cv::Mat image_cpu = image.clone();
|
|
||||||
|
|
||||||
// cv::floodFill(image, cv::Point(1,1),cv::Scalar::all(64), 0, cv::Scalar::all(0), cv::Scalar::all(256));
|
|
||||||
|
|
||||||
cv::gpu::GpuMat mask;
|
cv::gpu::GpuMat mask;
|
||||||
mask.create(image.rows, image.cols, CV_8UC1);
|
mask.create(image.rows, image.cols, CV_8UC1);
|
||||||
@ -73,21 +70,8 @@ TEST_P(Labeling, ConnectedComponents)
|
|||||||
cv::gpu::GpuMat components;
|
cv::gpu::GpuMat components;
|
||||||
components.create(image.rows, image.cols, CV_32SC1);
|
components.create(image.rows, image.cols, CV_32SC1);
|
||||||
|
|
||||||
std::cout << "summary: " << image.cols << " " << image.rows << " "
|
|
||||||
<< cv::gpu::GpuMat(image).cols << " " << cv::gpu::GpuMat(image).rows<< " "
|
|
||||||
<< mask.cols << " " << mask.rows<< " "
|
|
||||||
<< components.cols << " " << components.rows<< std::endl;
|
|
||||||
|
|
||||||
|
|
||||||
cv::gpu::labelComponents(cv::gpu::GpuMat(image), mask, components, cv::Scalar::all(0), cv::Scalar::all(2));
|
cv::gpu::labelComponents(cv::gpu::GpuMat(image), mask, components, cv::Scalar::all(0), cv::Scalar::all(2));
|
||||||
|
|
||||||
// // for(int i = 0; i + 32 < image.rows; i += 32)
|
|
||||||
// // for(int j = 0; j + 32 < image.cols; j += 32)
|
|
||||||
// // {
|
|
||||||
// // std::cout << cv::Mat(cv::Mat(mask), cv::Rect(j, i, 32, 32 ))<< std::endl;
|
|
||||||
// // std::cout << cv::Mat(cv::Mat(components), cv::Rect(j, i, 32, 32 )) << std::endl;
|
|
||||||
// // }
|
|
||||||
|
|
||||||
// std::cout << cv::Mat(components) << std::endl;
|
// std::cout << cv::Mat(components) << std::endl;
|
||||||
// cv::imshow("test", image);
|
// cv::imshow("test", image);
|
||||||
// cv::waitKey(0);
|
// cv::waitKey(0);
|
||||||
@ -102,7 +86,6 @@ TEST_P(Labeling, ConnectedComponents)
|
|||||||
cv::waitKey(0);
|
cv::waitKey(0);
|
||||||
cv::imshow("test", cv::Mat(components) * 2);
|
cv::imshow("test", cv::Mat(components) * 2);
|
||||||
cv::waitKey(0);
|
cv::waitKey(0);
|
||||||
std::cout << "test! " << image.cols << std::endl;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
INSTANTIATE_TEST_CASE_P(ConnectedComponents, Labeling, ALL_DEVICES);
|
INSTANTIATE_TEST_CASE_P(ConnectedComponents, Labeling, ALL_DEVICES);
|
Loading…
Reference in New Issue
Block a user