kmeans_kernel.cl 3.73 KB
Newer Older
wester committed
1 2 3 4 5 6 7 8 9 10 11 12 13
/*M///////////////////////////////////////////////////////////////////////////////////////
//
//  IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING.
//
//  By downloading, copying, installing or using the software you agree to this license.
//  If you do not agree to this license, do not download, install,
//  copy or use the software.
//
//
//                           License Agreement
//                For Open Source Computer Vision Library
//
// Copyright (C) 2010-2012, Multicoreware, Inc., all rights reserved.
wester committed
14
// Copyright (C) 2010,2014, Advanced Micro Devices, Inc., all rights reserved.
wester committed
15 16 17
// Third party copyrights are property of their respective owners.
//
// @Authors
wester committed
18 19
//    Xiaopeng Fu, fuxiaopeng2222@163.com
//    Peng Xiao, pengxiao@outlook.com
wester committed
20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46
//
// Redistribution and use in source and binary forms, with or without modification,
// are permitted provided that the following conditions are met:
//
//   * Redistribution's of source code must retain the above copyright notice,
//     this list of conditions and the following disclaimer.
//
//   * Redistribution's in binary form must reproduce the above copyright notice,
//     this list of conditions and the following disclaimer in the documentation
//     and/or other materials provided with the distribution.
//
//   * The name of the copyright holders may not be used to endorse or promote products
//     derived from this software without specific prior written permission.
//
// This software is provided by the copyright holders and contributors as is and
// any express or implied warranties, including, but not limited to, the implied
// warranties of merchantability and fitness for a particular purpose are disclaimed.
// In no event shall the Intel Corporation or contributors be liable for any direct,
// indirect, incidental, special, exemplary, or consequential damages
// (including, but not limited to, procurement of substitute goods or services;
// loss of use, data, or profits; or business interruption) however caused
// and on any theory of liability, whether in contract, strict liability,
// or tort (including negligence or otherwise) arising in any way out of
// the use of this software, even if advised of the possibility of such damage.
//
//M*/

wester committed
47 48 49 50 51
float distance_(__global const float * center, __global const float * src, int feature_length)
{
    float res = 0;
    float4 v0, v1, v2;
    int i = 0;
wester committed
52

wester committed
53 54 55
#ifdef L1_DIST
    float4 sum = (float4)(0.0f);
#endif
wester committed
56

wester committed
57
    for ( ; i <= feature_length - 4; i += 4)
wester committed
58
    {
wester committed
59 60 61 62 63 64 65 66 67
        v0 = vload4(0, center + i);
        v1 = vload4(0, src + i);
        v2 = v1 - v0;
#ifdef L1_DIST
        v0 = fabs(v2);
        sum += v0;
#else
        res += dot(v2, v2);
#endif
wester committed
68 69
    }

wester committed
70 71 72
#ifdef L1_DIST
    res = sum.x + sum.y + sum.z + sum.w;
#endif
wester committed
73

wester committed
74 75 76 77 78 79 80 81 82 83 84
    for ( ; i < feature_length; ++i)
    {
        float t0 = src[i];
        float t1 = center[i];
#ifdef L1_DIST
        res += fabs(t0 - t1);
#else
        float t2 = t0 - t1;
        res += t2 * t2;
#endif
    }
wester committed
85

wester committed
86 87
    return res;
}
wester committed
88

wester committed
89 90 91 92 93 94 95
__kernel void distanceToCenters(__global const float * src, __global const float * centers,
                                __global float * dists, int feature_length,
                                int src_step, int centers_step,
                                int features_count, int centers_count,
                                int src_offset, int centers_offset)
{
    int gid = get_global_id(0);
wester committed
96

wester committed
97 98 99 100
    if (gid < (features_count * centers_count))
    {
        int feature_index = gid / centers_count;
        int center_index = gid % centers_count;
wester committed
101

wester committed
102 103
        int center_idx = mad24(center_index, centers_step, centers_offset);
        int src_idx = mad24(feature_index, src_step, src_offset);
wester committed
104

wester committed
105 106 107
        dists[gid] = distance_(centers + center_idx, src + src_idx, feature_length);
    }
}