1 /*
2 * By downloading, copying, installing or using the software you agree to this license.
3 * If you do not agree to this license, do not download, install,
4 * copy or use the software.
5 *
6 *
7 * License Agreement
8 * For Open Source Computer Vision Library
9 * (3-clause BSD License)
10 *
11 * Copyright (C) 2014-2015, NVIDIA Corporation, all rights reserved.
12 * Third party copyrights are property of their respective owners.
13 *
14 * Redistribution and use in source and binary forms, with or without modification,
15 * are permitted provided that the following conditions are met:
16 *
17 * * Redistributions of source code must retain the above copyright notice,
18 * this list of conditions and the following disclaimer.
19 *
20 * * Redistributions in binary form must reproduce the above copyright notice,
21 * this list of conditions and the following disclaimer in the documentation
22 * and/or other materials provided with the distribution.
23 *
24 * * Neither the names of the copyright holders nor the names of the contributors
25 * may be used to endorse or promote products derived from this software
26 * without specific prior written permission.
27 *
28 * This software is provided by the copyright holders and contributors "as is" and
29 * any express or implied warranties, including, but not limited to, the implied
30 * warranties of merchantability and fitness for a particular purpose are disclaimed.
31 * In no event shall copyright holders or contributors be liable for any direct,
32 * indirect, incidental, special, exemplary, or consequential damages
33 * (including, but not limited to, procurement of substitute goods or services;
34 * loss of use, data, or profits; or business interruption) however caused
35 * and on any theory of liability, whether in contract, strict liability,
36 * or tort (including negligence or otherwise) arising in any way out of
37 * the use of this software, even if advised of the possibility of such damage.
38 */
39
40 #include <algorithm>
41
42 #include "common.hpp"
43 #include "vtransform.hpp"
44
45 namespace CAROTENE_NS {
46
47 #ifdef CAROTENE_NEON
48
49 namespace {
50
51 template <typename T>
52 struct AbsDiff
53 {
54 typedef T type;
55
operator ()CAROTENE_NS::__anon6d3cc1a20111::AbsDiff56 void operator() (const typename internal::VecTraits<T>::vec128 & v_src0,
57 const typename internal::VecTraits<T>::vec128 & v_src1,
58 typename internal::VecTraits<T>::vec128 & v_dst) const
59 {
60 v_dst = internal::vabdq(v_src0, v_src1);
61 }
62
operator ()CAROTENE_NS::__anon6d3cc1a20111::AbsDiff63 void operator() (const typename internal::VecTraits<T>::vec64 & v_src0,
64 const typename internal::VecTraits<T>::vec64 & v_src1,
65 typename internal::VecTraits<T>::vec64 & v_dst) const
66 {
67 v_dst = internal::vabd(v_src0, v_src1);
68 }
69
operator ()CAROTENE_NS::__anon6d3cc1a20111::AbsDiff70 void operator() (const T * src0, const T * src1, T * dst) const
71 {
72 dst[0] = src0[0] >= src1[0] ? src0[0] - src1[0] : src1[0] - src0[0];
73 }
74 };
75
76 template <typename T>
77 struct AbsDiffSigned
78 {
79 typedef T type;
80
operator ()CAROTENE_NS::__anon6d3cc1a20111::AbsDiffSigned81 void operator() (const typename internal::VecTraits<T>::vec128 & v_src0,
82 const typename internal::VecTraits<T>::vec128 & v_src1,
83 typename internal::VecTraits<T>::vec128 & v_dst) const
84 {
85 typename internal::VecTraits<T>::vec128 v_min = internal::vminq(v_src0, v_src1);
86 typename internal::VecTraits<T>::vec128 v_max = internal::vmaxq(v_src0, v_src1);
87 v_dst = internal::vqsubq(v_max, v_min);
88 }
89
operator ()CAROTENE_NS::__anon6d3cc1a20111::AbsDiffSigned90 void operator() (const typename internal::VecTraits<T>::vec64 & v_src0,
91 const typename internal::VecTraits<T>::vec64 & v_src1,
92 typename internal::VecTraits<T>::vec64 & v_dst) const
93 {
94 typename internal::VecTraits<T>::vec64 v_min = internal::vmin(v_src0, v_src1);
95 typename internal::VecTraits<T>::vec64 v_max = internal::vmax(v_src0, v_src1);
96 v_dst = internal::vqsub(v_max, v_min);
97 }
98
operator ()CAROTENE_NS::__anon6d3cc1a20111::AbsDiffSigned99 void operator() (const T * src0, const T * src1, T * dst) const
100 {
101 dst[0] = internal::saturate_cast<T>(src0[0] >= src1[0] ? (s64)src0[0] - src1[0] : (s64)src1[0] - src0[0]);
102 }
103 };
104
105 } // namespace
106
107 #endif
108
absDiff(const Size2D & size,const u8 * src0Base,ptrdiff_t src0Stride,const u8 * src1Base,ptrdiff_t src1Stride,u8 * dstBase,ptrdiff_t dstStride)109 void absDiff(const Size2D &size,
110 const u8 *src0Base, ptrdiff_t src0Stride,
111 const u8 *src1Base, ptrdiff_t src1Stride,
112 u8 *dstBase, ptrdiff_t dstStride)
113 {
114 internal::assertSupportedConfiguration();
115 #ifdef CAROTENE_NEON
116 internal::vtransform(size,
117 src0Base, src0Stride,
118 src1Base, src1Stride,
119 dstBase, dstStride, AbsDiff<u8>());
120 #else
121 (void)size;
122 (void)src0Base;
123 (void)src0Stride;
124 (void)src1Base;
125 (void)src1Stride;
126 (void)dstBase;
127 (void)dstStride;
128 #endif
129 }
130
absDiff(const Size2D & size,const u16 * src0Base,ptrdiff_t src0Stride,const u16 * src1Base,ptrdiff_t src1Stride,u16 * dstBase,ptrdiff_t dstStride)131 void absDiff(const Size2D &size,
132 const u16 *src0Base, ptrdiff_t src0Stride,
133 const u16 *src1Base, ptrdiff_t src1Stride,
134 u16 *dstBase, ptrdiff_t dstStride)
135 {
136 internal::assertSupportedConfiguration();
137 #ifdef CAROTENE_NEON
138 internal::vtransform(size,
139 src0Base, src0Stride,
140 src1Base, src1Stride,
141 dstBase, dstStride, AbsDiff<u16>());
142 #else
143 (void)size;
144 (void)src0Base;
145 (void)src0Stride;
146 (void)src1Base;
147 (void)src1Stride;
148 (void)dstBase;
149 (void)dstStride;
150 #endif
151 }
152
absDiff(const Size2D & size,const s8 * src0Base,ptrdiff_t src0Stride,const s8 * src1Base,ptrdiff_t src1Stride,s8 * dstBase,ptrdiff_t dstStride)153 void absDiff(const Size2D &size,
154 const s8 *src0Base, ptrdiff_t src0Stride,
155 const s8 *src1Base, ptrdiff_t src1Stride,
156 s8 *dstBase, ptrdiff_t dstStride)
157 {
158 internal::assertSupportedConfiguration();
159 #ifdef CAROTENE_NEON
160 internal::vtransform(size,
161 src0Base, src0Stride,
162 src1Base, src1Stride,
163 dstBase, dstStride, AbsDiffSigned<s8>());
164 #else
165 (void)size;
166 (void)src0Base;
167 (void)src0Stride;
168 (void)src1Base;
169 (void)src1Stride;
170 (void)dstBase;
171 (void)dstStride;
172 #endif
173 }
174
absDiff(const Size2D & size,const s16 * src0Base,ptrdiff_t src0Stride,const s16 * src1Base,ptrdiff_t src1Stride,s16 * dstBase,ptrdiff_t dstStride)175 void absDiff(const Size2D &size,
176 const s16 *src0Base, ptrdiff_t src0Stride,
177 const s16 *src1Base, ptrdiff_t src1Stride,
178 s16 *dstBase, ptrdiff_t dstStride)
179 {
180 internal::assertSupportedConfiguration();
181 #ifdef CAROTENE_NEON
182 internal::vtransform(size,
183 src0Base, src0Stride,
184 src1Base, src1Stride,
185 dstBase, dstStride, AbsDiffSigned<s16>());
186 #else
187 (void)size;
188 (void)src0Base;
189 (void)src0Stride;
190 (void)src1Base;
191 (void)src1Stride;
192 (void)dstBase;
193 (void)dstStride;
194 #endif
195 }
196
absDiff(const Size2D & size,const s32 * src0Base,ptrdiff_t src0Stride,const s32 * src1Base,ptrdiff_t src1Stride,s32 * dstBase,ptrdiff_t dstStride)197 void absDiff(const Size2D &size,
198 const s32 *src0Base, ptrdiff_t src0Stride,
199 const s32 *src1Base, ptrdiff_t src1Stride,
200 s32 *dstBase, ptrdiff_t dstStride)
201 {
202 internal::assertSupportedConfiguration();
203 #ifdef CAROTENE_NEON
204 internal::vtransform(size,
205 src0Base, src0Stride,
206 src1Base, src1Stride,
207 dstBase, dstStride, AbsDiffSigned<s32>());
208 #else
209 (void)size;
210 (void)src0Base;
211 (void)src0Stride;
212 (void)src1Base;
213 (void)src1Stride;
214 (void)dstBase;
215 (void)dstStride;
216 #endif
217 }
218
absDiff(const Size2D & size,const f32 * src0Base,ptrdiff_t src0Stride,const f32 * src1Base,ptrdiff_t src1Stride,f32 * dstBase,ptrdiff_t dstStride)219 void absDiff(const Size2D &size,
220 const f32 * src0Base, ptrdiff_t src0Stride,
221 const f32 * src1Base, ptrdiff_t src1Stride,
222 f32 * dstBase, ptrdiff_t dstStride)
223 {
224 internal::assertSupportedConfiguration();
225 #ifdef CAROTENE_NEON
226 internal::vtransform(size,
227 src0Base, src0Stride,
228 src1Base, src1Stride,
229 dstBase, dstStride, AbsDiff<f32>());
230 #else
231 (void)size;
232 (void)src0Base;
233 (void)src0Stride;
234 (void)src1Base;
235 (void)src1Stride;
236 (void)dstBase;
237 (void)dstStride;
238 #endif
239 }
240
241 } // namespace CAROTENE_NS
242