Open Source Computer Vision Library
https://opencv.org/
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
199 lines
7.6 KiB
199 lines
7.6 KiB
/*M/////////////////////////////////////////////////////////////////////////////////////// |
|
// |
|
// IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING. |
|
// |
|
// By downloading, copying, installing or using the software you agree to this license. |
|
// If you do not agree to this license, do not download, install, |
|
// copy or use the software. |
|
// |
|
// |
|
// License Agreement |
|
// For Open Source Computer Vision Library |
|
// |
|
// Copyright (c) 2016-2017 Fabian David Tschopp, all rights reserved. |
|
// Third party copyrights are property of their respective owners. |
|
// |
|
// Redistribution and use in source and binary forms, with or without modification, |
|
// are permitted provided that the following conditions are met: |
|
// |
|
// * Redistribution's of source code must retain the above copyright notice, |
|
// this list of conditions and the following disclaimer. |
|
// |
|
// * Redistribution's in binary form must reproduce the above copyright notice, |
|
// this list of conditions and the following disclaimer in the documentation |
|
// and/or other materials provided with the distribution. |
|
// |
|
// * The name of the copyright holders may not be used to endorse or promote products |
|
// derived from this software without specific prior written permission. |
|
// |
|
// This software is provided by the copyright holders and contributors "as is" and |
|
// any express or implied warranties, including, but not limited to, the implied |
|
// warranties of merchantability and fitness for a particular purpose are disclaimed. |
|
// In no event shall the Intel Corporation or contributors be liable for any direct, |
|
// indirect, incidental, special, exemplary, or consequential damages |
|
// (including, but not limited to, procurement of substitute goods or services; |
|
// loss of use, data, or profits; or business interruption) however caused |
|
// and on any theory of liability, whether in contract, strict liability, |
|
// or tort (including negligence or otherwise) arising in any way out of |
|
// the use of this software, even if advised of the possibility of such damage. |
|
// |
|
//M*/ |
|
|
|
#define Dtype float |
|
#define Dtype4 float4 |
|
|
|
__kernel void DecodeBBoxesCORNER(const int nthreads, |
|
__global const Dtype* loc_data, |
|
__global const Dtype* prior_data, |
|
const int variance_encoded_in_target, |
|
const int num_priors, |
|
const int share_location, |
|
const int num_loc_classes, |
|
const int background_label_id, |
|
const int clip_bbox, |
|
const int locPredTransposed, |
|
__global Dtype* bbox_data) |
|
{ |
|
for (int index = get_global_id(0); index < nthreads; index += get_global_size(0)) |
|
{ |
|
Dtype bbox_xmin, bbox_ymin, bbox_xmax, bbox_ymax; |
|
const int i = index % 4; |
|
const int p = ((index / 4 / num_loc_classes) % num_priors) * 4; |
|
|
|
const int c = (index / 4) % num_loc_classes; |
|
int label = share_location ? -1 : c; |
|
if (label == background_label_id) |
|
return; // Ignore background class. |
|
|
|
Dtype4 loc_vec = vload4(0, loc_data + index - i); |
|
Dtype4 bbox_vec, prior_variance; |
|
if (variance_encoded_in_target) |
|
{ |
|
bbox_vec = loc_vec; |
|
} else { |
|
const int start_index = num_priors * 4 + p; |
|
prior_variance = vload4(0, prior_data + start_index); |
|
bbox_vec = loc_vec * prior_variance; |
|
} |
|
|
|
if (locPredTransposed) |
|
{ |
|
bbox_ymin = bbox_vec.x; |
|
bbox_xmin = bbox_vec.y; |
|
bbox_ymax = bbox_vec.z; |
|
bbox_xmax = bbox_vec.w; |
|
} else { |
|
bbox_xmin = bbox_vec.x; |
|
bbox_ymin = bbox_vec.y; |
|
bbox_xmax = bbox_vec.z; |
|
bbox_ymax = bbox_vec.w; |
|
} |
|
|
|
Dtype4 prior_vec = vload4(0, prior_data + p); |
|
Dtype val; |
|
switch (i) |
|
{ |
|
case 0: |
|
val = prior_vec.x + bbox_xmin; |
|
break; |
|
case 1: |
|
val = prior_vec.y + bbox_ymin; |
|
break; |
|
case 2: |
|
val = prior_vec.z + bbox_xmax; |
|
break; |
|
case 3: |
|
val = prior_vec.w + bbox_ymax; |
|
break; |
|
} |
|
|
|
if (clip_bbox) |
|
val = max(min(val, (Dtype)1.), (Dtype)0.); |
|
|
|
bbox_data[index] = val; |
|
} |
|
} |
|
|
|
__kernel void DecodeBBoxesCENTER_SIZE(const int nthreads, |
|
__global const Dtype* loc_data, |
|
__global const Dtype* prior_data, |
|
const int variance_encoded_in_target, |
|
const int num_priors, |
|
const int share_location, |
|
const int num_loc_classes, |
|
const int background_label_id, |
|
const int clip_bbox, |
|
const int locPredTransposed, |
|
__global Dtype* bbox_data) |
|
{ |
|
for (int index = get_global_id(0); index < nthreads; index += get_global_size(0)) |
|
{ |
|
Dtype bbox_xmin, bbox_ymin, bbox_xmax, bbox_ymax; |
|
const int i = index % 4; |
|
const int p = ((index / 4 / num_loc_classes) % num_priors) * 4; |
|
|
|
const int c = (index / 4) % num_loc_classes; |
|
int label = share_location ? -1 : c; |
|
if (label == background_label_id) |
|
return; // Ignore background class. |
|
|
|
Dtype4 loc_vec = vload4(0, loc_data + index - i); |
|
Dtype4 bbox_vec, prior_variance; |
|
if (variance_encoded_in_target) |
|
{ |
|
bbox_vec = loc_vec; |
|
} else { |
|
const int start_index = num_priors * 4 + p; |
|
prior_variance = vload4(0, prior_data + start_index); |
|
bbox_vec = loc_vec * prior_variance; |
|
} |
|
|
|
if (locPredTransposed) |
|
{ |
|
bbox_ymin = bbox_vec.x; |
|
bbox_xmin = bbox_vec.y; |
|
bbox_ymax = bbox_vec.z; |
|
bbox_xmax = bbox_vec.w; |
|
} else { |
|
bbox_xmin = bbox_vec.x; |
|
bbox_ymin = bbox_vec.y; |
|
bbox_xmax = bbox_vec.z; |
|
bbox_ymax = bbox_vec.w; |
|
} |
|
|
|
Dtype4 prior_vec = vload4(0, prior_data + p); |
|
Dtype prior_width = prior_vec.z - prior_vec.x; |
|
Dtype prior_height = prior_vec.w - prior_vec.y; |
|
Dtype prior_center_x = (prior_vec.x + prior_vec.z) * .5; |
|
Dtype prior_center_y = (prior_vec.y + prior_vec.w) * .5; |
|
|
|
Dtype decode_bbox_center_x, decode_bbox_center_y; |
|
Dtype decode_bbox_width, decode_bbox_height; |
|
decode_bbox_center_x = bbox_xmin * prior_width + prior_center_x; |
|
decode_bbox_center_y = bbox_ymin * prior_height + prior_center_y; |
|
decode_bbox_width = exp(bbox_xmax) * prior_width; |
|
decode_bbox_height = exp(bbox_ymax) * prior_height; |
|
|
|
Dtype val; |
|
switch (i) |
|
{ |
|
case 0: |
|
val = decode_bbox_center_x - decode_bbox_width * .5; |
|
break; |
|
case 1: |
|
val = decode_bbox_center_y - decode_bbox_height * .5; |
|
break; |
|
case 2: |
|
val = decode_bbox_center_x + decode_bbox_width * .5; |
|
break; |
|
case 3: |
|
val = decode_bbox_center_y + decode_bbox_height * .5; |
|
break; |
|
} |
|
|
|
if (clip_bbox) |
|
val = max(min(val, (Dtype)1.), (Dtype)0.); |
|
|
|
bbox_data[index] = val; |
|
} |
|
}
|
|
|