2010-07-14 23:55:16 +08:00
|
|
|
/*M///////////////////////////////////////////////////////////////////////////////////////
|
|
|
|
//
|
|
|
|
// IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING.
|
|
|
|
//
|
|
|
|
// By downloading, copying, installing or using the software you agree to this license.
|
|
|
|
// If you do not agree to this license, do not download, install,
|
|
|
|
// copy or use the software.
|
|
|
|
//
|
|
|
|
//
|
|
|
|
// License Agreement
|
|
|
|
// For Open Source Computer Vision Library
|
|
|
|
//
|
|
|
|
// Copyright (C) 2000-2008, Intel Corporation, all rights reserved.
|
|
|
|
// Copyright (C) 2009, Willow Garage Inc., all rights reserved.
|
|
|
|
// Third party copyrights are property of their respective owners.
|
|
|
|
//
|
|
|
|
// Redistribution and use in source and binary forms, with or without modification,
|
|
|
|
// are permitted provided that the following conditions are met:
|
|
|
|
//
|
|
|
|
// * Redistribution's of source code must retain the above copyright notice,
|
|
|
|
// this list of conditions and the following disclaimer.
|
|
|
|
//
|
|
|
|
// * Redistribution's in binary form must reproduce the above copyright notice,
|
|
|
|
// this list of conditions and the following disclaimer in the documentation
|
|
|
|
// and/or other materials provided with the distribution.
|
|
|
|
//
|
|
|
|
// * The name of the copyright holders may not be used to endorse or promote products
|
|
|
|
// derived from this software without specific prior written permission.
|
|
|
|
//
|
|
|
|
// This software is provided by the copyright holders and contributors "as is" and
|
|
|
|
// any express or implied warranties, including, but not limited to, the implied
|
|
|
|
// warranties of merchantability and fitness for a particular purpose are disclaimed.
|
|
|
|
// In no event shall the Intel Corporation or contributors be liable for any direct,
|
|
|
|
// indirect, incidental, special, exemplary, or consequential damages
|
|
|
|
// (including, but not limited to, procurement of substitute goods or services;
|
|
|
|
// loss of use, data, or profits; or business interruption) however caused
|
|
|
|
// and on any theory of liability, whether in contract, strict liability,
|
|
|
|
// or tort (including negligence or otherwise) arising in any way out of
|
|
|
|
// the use of this software, even if advised of the possibility of such damage.
|
|
|
|
//
|
|
|
|
//M*/
|
|
|
|
|
2010-12-07 00:37:32 +08:00
|
|
|
#ifndef __OPENCV_internal_shared_HPP__
|
|
|
|
#define __OPENCV_internal_shared_HPP__
|
2010-07-14 23:55:16 +08:00
|
|
|
|
|
|
|
#include "opencv2/gpu/devmem2d.hpp"
|
2010-07-26 23:04:56 +08:00
|
|
|
#include "safe_call.hpp"
|
2010-11-11 20:05:48 +08:00
|
|
|
#include "cuda_runtime.h"
|
2011-05-31 16:31:10 +08:00
|
|
|
#include "npp.h"
|
|
|
|
#include "NPP_staging.hpp"
|
2010-07-14 23:55:16 +08:00
|
|
|
|
2011-06-30 22:39:48 +08:00
|
|
|
// Single-precision pi.
// Defined only when CV_PI_F has not been provided already: taken from CV_PI (cast to float)
// if that macro is visible at this point, otherwise from a float literal.
#if !defined(CV_PI_F)
#  if defined(CV_PI)
#    define CV_PI_F ((float)CV_PI)
#  else
#    define CV_PI_F 3.14159265f
#  endif
#endif
|
|
|
|
|
2010-07-14 23:55:16 +08:00
|
|
|
namespace cv
|
|
|
|
{
|
|
|
|
namespace gpu
|
2010-07-19 18:49:35 +08:00
|
|
|
{
|
2010-07-14 23:55:16 +08:00
|
|
|
// Shorthand aliases for the built-in integer types.
typedef unsigned char  uchar;
typedef signed char    schar;
typedef unsigned short ushort;
typedef unsigned int   uint;
|
|
|
|
|
|
|
|
// GPU-internal border extrapolation modes.
// Values are spelled out explicitly; they are the same numbers the implicit
// enumeration starting at 0 produces.
enum
{
    BORDER_REFLECT101_GPU = 0,
    BORDER_REPLICATE_GPU  = 1,
    BORDER_CONSTANT_GPU   = 2
};
|
2011-01-13 21:04:00 +08:00
|
|
|
|
2010-12-07 00:37:32 +08:00
|
|
|
// Maps a CPU border extrapolation mode onto its GPU-internal counterpart.
//   cpuBorderType - border mode as used on the CPU side.
//   gpuBorderType - receives the corresponding GPU-internal mode.
// Returns true when a GPU counterpart exists and false when it does not.
bool tryConvertToGpuBorderType(int cpuBorderType, int& gpuBorderType);
|
|
|
|
|
2010-10-31 21:23:25 +08:00
|
|
|
// Ceiling division: the number of 'grain'-sized chunks needed to cover 'total' items.
//   total - item count, expected to be >= 0.
//   grain - chunk size, expected to be > 0.
// Uses quotient plus a remainder correction rather than (total + grain - 1) / grain,
// because that sum overflows int when 'total' is close to INT_MAX. For non-negative
// 'total' and positive 'grain' the result equals the old formula wherever the old
// formula did not overflow.
static inline int divUp(int total, int grain)
{
    return total / grain + (total % grain > 0 ? 1 : 0);
}
|
2010-07-19 18:49:35 +08:00
|
|
|
|
2010-11-11 01:05:36 +08:00
|
|
|
// Copies sizeof(T) bytes of 'value' into the device symbol identified by 'name'
// using cudaMemcpyToSymbol. The call is wrapped in cudaSafeCall.
template<class T> static inline void uploadConstant(const char* name, const T& value)
{
    const T* const src = &value;
    cudaSafeCall( cudaMemcpyToSymbol(name, src, sizeof(T)) );
}
|
|
|
|
|
|
|
|
template<class T> static inline void uploadConstant(const char* name, const T& value, cudaStream_t stream)
|
2010-11-16 15:40:37 +08:00
|
|
|
{
|
|
|
|
cudaSafeCall( cudaMemcpyToSymbolAsync(name, &value, sizeof(T), 0, cudaMemcpyHostToDevice, stream) );
|
2010-11-11 01:05:36 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
template<class T> static inline void bindTexture(const char* name, const DevMem2D_<T>& img/*, bool normalized = false,
|
|
|
|
enum cudaTextureFilterMode filterMode = cudaFilterModePoint, enum cudaTextureAddressMode addrMode = cudaAddressModeClamp*/)
|
|
|
|
{
|
|
|
|
//!!!! const_cast is disabled!
|
|
|
|
//!!!! Please use constructor of 'class texture' instead.
|
|
|
|
|
|
|
|
//textureReference* tex;
|
|
|
|
//cudaSafeCall( cudaGetTextureReference((const textureReference**)&tex, name) );
|
|
|
|
//tex->normalized = normalized;
|
|
|
|
//tex->filterMode = filterMode;
|
|
|
|
//tex->addressMode[0] = addrMode;
|
|
|
|
//tex->addressMode[1] = addrMode;
|
|
|
|
|
|
|
|
const textureReference* tex;
|
|
|
|
cudaSafeCall( cudaGetTextureReference(&tex, name) );
|
|
|
|
|
|
|
|
cudaChannelFormatDesc desc = cudaCreateChannelDesc<T>();
|
|
|
|
cudaSafeCall( cudaBindTexture2D(0, tex, img.ptr(), &desc, img.cols, img.rows, img.step) );
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void unbindTexture(const char *name)
|
|
|
|
{
|
|
|
|
const textureReference* tex;
|
|
|
|
cudaSafeCall( cudaGetTextureReference(&tex, name) );
|
|
|
|
cudaSafeCall( cudaUnbindTexture(tex) );
|
2011-05-23 15:59:20 +08:00
|
|
|
}
|
2011-05-31 16:31:10 +08:00
|
|
|
|
2011-08-10 19:32:48 +08:00
|
|
|
class TextureBinder
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
TextureBinder() : tex_(0) {}
|
|
|
|
template <typename T> TextureBinder(const textureReference* tex, const DevMem2D_<T>& img) : tex_(0)
|
|
|
|
{
|
|
|
|
bind(tex, img);
|
|
|
|
}
|
|
|
|
template <typename T> TextureBinder(const char* tex_name, const DevMem2D_<T>& img) : tex_(0)
|
|
|
|
{
|
|
|
|
bind(tex_name, img);
|
|
|
|
}
|
|
|
|
~TextureBinder() { unbind(); }
|
|
|
|
|
|
|
|
template <typename T> void bind(const textureReference* tex, const DevMem2D_<T>& img)
|
|
|
|
{
|
|
|
|
unbind();
|
|
|
|
|
|
|
|
cudaChannelFormatDesc desc = cudaCreateChannelDesc<T>();
|
|
|
|
cudaSafeCall( cudaBindTexture2D(0, tex, img.ptr(), &desc, img.cols, img.rows, img.step) );
|
|
|
|
|
|
|
|
tex_ = tex;
|
|
|
|
}
|
|
|
|
template <typename T> void bind(const char* tex_name, const DevMem2D_<T>& img)
|
|
|
|
{
|
|
|
|
const textureReference* tex;
|
|
|
|
cudaSafeCall( cudaGetTextureReference(&tex, tex_name) );
|
|
|
|
bind(tex, img);
|
|
|
|
}
|
|
|
|
|
|
|
|
void unbind()
|
|
|
|
{
|
|
|
|
if (tex_)
|
|
|
|
{
|
|
|
|
cudaUnbindTexture(tex_);
|
|
|
|
tex_ = 0;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
|
|
|
const textureReference* tex_;
|
|
|
|
};
|
|
|
|
|
2011-05-31 16:31:10 +08:00
|
|
|
class NppStreamHandler
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
inline explicit NppStreamHandler(cudaStream_t newStream = 0)
|
|
|
|
{
|
|
|
|
oldStream = nppGetStream();
|
|
|
|
nppSetStream(newStream);
|
|
|
|
}
|
|
|
|
|
|
|
|
inline ~NppStreamHandler()
|
|
|
|
{
|
|
|
|
nppSetStream(oldStream);
|
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
|
|
|
cudaStream_t oldStream;
|
|
|
|
};
|
|
|
|
|
|
|
|
class NppStStreamHandler
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
inline explicit NppStStreamHandler(cudaStream_t newStream = 0)
|
|
|
|
{
|
|
|
|
oldStream = nppStSetActiveCUDAstream(newStream);
|
|
|
|
}
|
|
|
|
|
|
|
|
inline ~NppStStreamHandler()
|
|
|
|
{
|
|
|
|
nppStSetActiveCUDAstream(oldStream);
|
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
|
|
|
cudaStream_t oldStream;
|
|
|
|
};
|
2010-07-14 23:55:16 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2010-07-19 17:31:12 +08:00
|
|
|
|
2010-12-07 00:37:32 +08:00
|
|
|
#endif /* __OPENCV_internal_shared_HPP__ */
|