mirror of
https://github.com/opencv/opencv.git
synced 2025-01-07 19:54:18 +08:00
120 lines
4.7 KiB
Common Lisp
120 lines
4.7 KiB
Common Lisp
/*M///////////////////////////////////////////////////////////////////////////////////////
|
|
//
|
|
// IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING.
|
|
//
|
|
// By downloading, copying, installing or using the software you agree to this license.
|
|
// If you do not agree to this license, do not download, install,
|
|
// copy or use the software.
|
|
//
|
|
//
|
|
// License Agreement
|
|
// For Open Source Computer Vision Library
|
|
//
|
|
// Copyright (c) 2016-2017 Fabian David Tschopp, all rights reserved.
|
|
// Third party copyrights are property of their respective owners.
|
|
//
|
|
// Redistribution and use in source and binary forms, with or without modification,
|
|
// are permitted provided that the following conditions are met:
|
|
//
|
|
// * Redistribution's of source code must retain the above copyright notice,
|
|
// this list of conditions and the following disclaimer.
|
|
//
|
|
// * Redistribution's in binary form must reproduce the above copyright notice,
|
|
// this list of conditions and the following disclaimer in the documentation
|
|
// and/or other materials provided with the distribution.
|
|
//
|
|
// * The name of the copyright holders may not be used to endorse or promote products
|
|
// derived from this software without specific prior written permission.
|
|
//
|
|
// This software is provided by the copyright holders and contributors "as is" and
|
|
// any express or implied warranties, including, but not limited to, the implied
|
|
// warranties of merchantability and fitness for a particular purpose are disclaimed.
|
|
// In no event shall the Intel Corporation or contributors be liable for any direct,
|
|
// indirect, incidental, special, exemplary, or consequential damages
|
|
// (including, but not limited to, procurement of substitute goods or services;
|
|
// loss of use, data, or profits; or business interruption) however caused
|
|
// and on any theory of liability, whether in contract, strict liability,
|
|
// or tort (including negligence or otherwise) arising in any way out of
|
|
// the use of this software, even if advised of the possibility of such damage.
|
|
//
|
|
//M*/
|
|
|
|
// Turn on the cl_khr_fp16 extension only when the compiler defines cl_khr_fp16.
#if defined(cl_khr_fp16)
|
|
#pragma OPENCL EXTENSION cl_khr_fp16 : enable
|
|
#endif
|
|
|
|
// Writes boxes into dst as packed (xmin, ymin, xmax, ymax) 4-vectors.
//
// Each work-item starts at its global id and advances by the global size
// while the index stays below nthreads. An index is split into a column
// (index % _layerWidth) and a row (index / _layerWidth). For that cell,
// widths_size * offsetsX_size boxes are stored, beginning at
// dst + index * 4 * offsetsX_size * widths_size: for every
// (_widths[i], _heights[i]) pair, one box per (_offsetsX[j], _offsetsY[j]) pair.
//
// The box centre is ((column + offsetX) * stepX, (row + offsetY) * stepY);
// the corners are centre -/+ half the box size, with x values divided by
// imgWidth and y values divided by imgHeight.
//
// _offsetsY is indexed over the same range as _offsetsX (offsetsX_size) and
// _heights over the same range as _widths (widths_size).
// _layerHeight is accepted but never read here.
//
// NOTE(review): Dtype and Dtype4 are not defined in this part of the file;
// presumably they are supplied when the program is built - confirm.
__kernel void prior_box(const int nthreads,
                        const float stepX,
                        const float stepY,
                        __global const float* _offsetsX,
                        __global const float* _offsetsY,
                        const int offsetsX_size,
                        __global const float* _widths,
                        __global const float* _heights,
                        const int widths_size,
                        __global Dtype* dst,
                        const int _layerHeight,
                        const int _layerWidth,
                        const int imgHeight,
                        const int imgWidth)
{
    // The steps are used in Dtype precision for every box; convert them once.
    const Dtype step_x = (Dtype)stepX;
    const Dtype step_y = (Dtype)stepY;

    for (int cell = get_global_id(0); cell < nthreads; cell += get_global_size(0))
    {
        const int col = cell % _layerWidth;
        const int row = cell / _layerWidth;

        // Start of this cell's output region (4 values per box).
        __global Dtype* const cell_out = dst + cell * 4 * offsetsX_size * widths_size;

        // Running box number inside the cell; vstore4 scales it by 4 elements.
        int box = 0;

        for (int s = 0; s < widths_size; ++s)
        {
            const float half_w = _widths[s] * 0.5f;
            const float half_h = _heights[s] * 0.5f;

            for (int o = 0; o < offsetsX_size; ++o)
            {
                const Dtype cx = (col + _offsetsX[o]) * step_x;
                const Dtype cy = (row + _offsetsY[o]) * step_y;

                const Dtype xmin = (cx - half_w) / imgWidth;
                const Dtype ymin = (cy - half_h) / imgHeight;
                const Dtype xmax = (cx + half_w) / imgWidth;
                const Dtype ymax = (cy + half_h) / imgHeight;

                vstore4((Dtype4)(xmin, ymin, xmax, ymax), box, cell_out);
                ++box;
            }
        }
    }
}
|
|
|
|
// Stores one 4-component variance vector per index into dst.
//
// Each work-item starts at its global id and advances by the global size
// while the index stays below nthreads. The vector for an index is written
// to dst + offset + index * 4.
//
// When variance_size is 1, variance[0] is replicated into all four
// components. For any other variance_size, the first four floats of
// variance are loaded and passed through convert_T.
//
// NOTE(review): Dtype, Dtype4 and convert_T are not defined in this part of
// the file; presumably they are supplied when the program is built - confirm.
__kernel void set_variance(const int nthreads,
                           const int offset,
                           const int variance_size,
                           __global const float* variance,
                           __global Dtype* dst)
{
    for (int item = get_global_id(0); item < nthreads; item += get_global_size(0))
    {
        Dtype4 value;

        if (variance_size != 1)
        {
            // Use the first four entries of variance, one per component.
            value = convert_T(vload4(0, variance));
        }
        else
        {
            // Single value: broadcast it to every component.
            value = (Dtype4)(variance[0]);
        }

        __global Dtype* const out = dst + offset + item * 4;
        vstore4(value, 0, out);
    }
}
|
|
|
|
// Clamps dst in place to the range [0, 1], four elements at a time.
//
// Each work-item starts at its global id and advances by the global size
// while the index stays below nthreads. For every index, the 4-vector at
// dst + index * 4 is loaded, clamped component-wise, and written back to
// the same location.
//
// NOTE(review): Dtype and Dtype4 are not defined in this part of the file;
// presumably they are supplied when the program is built - confirm.
__kernel void clip(const int nthreads,
                   __global Dtype* dst)
{
    const Dtype lower = (Dtype)0.0f;
    const Dtype upper = (Dtype)1.0f;

    for (int item = get_global_id(0); item < nthreads; item += get_global_size(0))
    {
        const Dtype4 loaded = vload4(item, dst);
        const Dtype4 limited = clamp(loaded, lower, upper);
        vstore4(limited, item, dst);
    }
}
|