/dports/graphics/opencv/opencv-4.5.3/3rdparty/carotene/src/ |
H A D | bitwise.cpp | 51 void operator() (const uint8x16_t & v_src0, const uint8x16_t & v_src1, in operator ()() 54 v_dst = vandq_u8(v_src0, v_src1); in operator ()() 57 void operator() (const uint8x8_t & v_src0, const uint8x8_t & v_src1, in operator ()() 60 v_dst = vand_u8(v_src0, v_src1); in operator ()() 73 void operator() (const uint8x16_t & v_src0, const uint8x16_t & v_src1, in operator ()() 76 v_dst = vorrq_u8(v_src0, v_src1); in operator ()() 79 void operator() (const uint8x8_t & v_src0, const uint8x8_t & v_src1, in operator ()() 82 v_dst = vorr_u8(v_src0, v_src1); in operator ()() 98 v_dst = veorq_u8(v_src0, v_src1); in operator ()() 101 void operator() (const uint8x8_t & v_src0, const uint8x8_t & v_src1, in operator ()() [all …]
|
H A D | magnitude.cpp | 55 void operator() (const int16x8_t & v_src0, const int16x8_t & v_src1, in operator ()() 58 int16x4_t v_src0_p = vget_low_s16(v_src0), v_src1_p = vget_low_s16(v_src1); in operator ()() 61 v_src0_p = vget_high_s16(v_src0); in operator ()() 72 void operator() (const int16x4_t & v_src0, const int16x4_t & v_src1, in operator ()() 75 float32x4_t v_tmp = vaddq_f32(vcvtq_f32_s32(vmull_s16(v_src0, v_src0)), in operator ()() 92 void operator() (const float32x4_t & v_src0, const float32x4_t & v_src1, in operator ()() 95 … v_dst = internal::vsqrtq_f32(vaddq_f32(vmulq_f32(v_src0, v_src0), vmulq_f32(v_src1, v_src1))); in operator ()() 98 void operator() (const float32x2_t & v_src0, const float32x2_t & v_src1, in operator ()() 101 v_dst = internal::vsqrt_f32(vadd_f32(vmul_f32(v_src0, v_src0), vmul_f32(v_src1, v_src1))); in operator ()()
|
H A D | cmp.cpp | 80 vec128 v_src0, v_src1; in compare() local 83 v_src0 = internal::vld1q(src0 + x); in compare() 85 op(v_src0, v_src1, v_dst); in compare() 105 vec128 v_src0, v_src1; in compare() local 108 v_src0 = internal::vld1q(src0 + x); in compare() 110 op(v_src0, v_src1, v_dst); in compare() 116 vec64 v_src0, v_src1; in compare() local 119 v_src0 = internal::vld1(src0 + x); in compare() 121 op(v_src0, v_src1, v_dst); in compare() 194 v_dst = internal::vceq(v_src0, v_src1); in operator ()() [all …]
|
H A D | add_weighted.cpp | 71 void operator() (const typename VecTraits<T>::vec128 & v_src0, in operator ()() 82 void operator() (const typename VecTraits<T>::vec64 & v_src0, in operator ()() 87 wideAdd(vmovl(v_src0), vmovl(v_src1), vr); in operator ()() 112 void operator() (const typename VecTraits<s32>::vec128 & v_src0, in operator ()() 116 float32x4_t vs1 = vcvtq_f32_s32(v_src0); in operator ()() 124 void operator() (const typename VecTraits<s32>::vec64 & v_src0, in operator ()() 128 float32x2_t vs1 = vcvt_f32_s32(v_src0); in operator ()() 160 float32x4_t vs1 = vcvtq_f32_u32(v_src0); in operator ()() 168 void operator() (const typename VecTraits<u32>::vec64 & v_src0, in operator ()() 172 float32x2_t vs1 = vcvt_f32_u32(v_src0); in operator ()() [all …]
|
H A D | min_max.cpp | 56 void operator() (const typename internal::VecTraits<T>::vec128 & v_src0, in operator ()() 60 v_dst = internal::vminq(v_src0, v_src1); in operator ()() 63 void operator() (const typename internal::VecTraits<T>::vec64 & v_src0, in operator ()() 67 v_dst = internal::vmin(v_src0, v_src1); in operator ()() 81 void operator() (const typename internal::VecTraits<T>::vec128 & v_src0, in operator ()() 85 v_dst = internal::vmaxq(v_src0, v_src1); in operator ()() 88 void operator() (const typename internal::VecTraits<T>::vec64 & v_src0, in operator ()() 92 v_dst = internal::vmax(v_src0, v_src1); in operator ()()
|
H A D | mul.cpp | 335 uint8x16_t v_src0 = vld1q_u8(src0 + j); in mul() local 344 v_src0_p = vmovl_u8(vget_high_u8(v_src0)); in mul() 408 uint8x16_t v_src0 = vld1q_u8(src0 + j); in mul() local 417 v_src0_p = vmovl_u8(vget_high_u8(v_src0)); in mul() 567 uint8x16_t v_src0 = vld1q_u8(src0 + j); in mul() local 579 v_src0_p = vmovl_u8(vget_high_u8(v_src0)); in mul() 641 uint8x16_t v_src0 = vld1q_u8(src0 + j); in mul() local 736 uint8x16_t v_src0 = vld1q_u8(src0 + j); in mul() local 771 uint8x16_t v_src0 = vld1q_u8(src0 + j); in mul() local 818 uint8x16_t v_src0 = vld1q_u8(src0 + j); in mul() local [all …]
|
H A D | add.cpp | 58 v_dst = internal::vaddq(v_src0, v_src1); in operator ()() 61 void operator() (const typename internal::VecTraits<T>::vec64 & v_src0, in operator ()() 65 v_dst = internal::vadd(v_src0, v_src1); in operator ()() 83 v_dst = internal::vqaddq(v_src0, v_src1); in operator ()() 90 v_dst = internal::vqadd(v_src0, v_src1); in operator ()() 206 uint8x8_t v_src0 = vld1_u8(src0 + j); in add() local 208 vst1q_u16(dst + j, vaddl_u8(v_src0, v_src1)); in add() 249 uint8x16_t v_src0 = vld1q_u8(src0 + j); in add() local 262 int16x8_t v_dst = vqaddq_s16(v_src0, v_src1); in add() 275 uint8x16_t v_src0 = vld1q_u8(src0 + j); in add() local [all …]
|
H A D | absdiff.cpp | 56 void operator() (const typename internal::VecTraits<T>::vec128 & v_src0, in operator ()() 60 v_dst = internal::vabdq(v_src0, v_src1); in operator ()() 63 void operator() (const typename internal::VecTraits<T>::vec64 & v_src0, in operator ()() 67 v_dst = internal::vabd(v_src0, v_src1); in operator ()() 81 void operator() (const typename internal::VecTraits<T>::vec128 & v_src0, in operator ()() 85 typename internal::VecTraits<T>::vec128 v_min = internal::vminq(v_src0, v_src1); in operator ()() 86 typename internal::VecTraits<T>::vec128 v_max = internal::vmaxq(v_src0, v_src1); in operator ()() 90 void operator() (const typename internal::VecTraits<T>::vec64 & v_src0, in operator ()() 94 typename internal::VecTraits<T>::vec64 v_min = internal::vmin(v_src0, v_src1); in operator ()() 95 typename internal::VecTraits<T>::vec64 v_max = internal::vmax(v_src0, v_src1); in operator ()()
|
H A D | sub.cpp | 58 v_dst = internal::vsubq(v_src0, v_src1); in operator ()() 65 v_dst = internal::vsub(v_src0, v_src1); in operator ()() 83 v_dst = internal::vqsubq(v_src0, v_src1); in operator ()() 90 v_dst = internal::vqsub(v_src0, v_src1); in operator ()() 171 uint8x8_t v_src0 = vld1_u8(src0 + j); in sub() local 173 vst1q_u16(dstu16 + j, vsubl_u8(v_src0, v_src1)); in sub() 231 uint8x8_t v_src0 = vld1_u8(src0 + j); in sub() local 276 uint8x16_t v_src0 = vld1q_u8(src0 + j); in sub() local 302 uint8x16_t v_src0 = vld1q_u8(src0 + j); in sub() local 370 int16x8_t v_src0 = vld1q_s16(src0 + j); in sub() local [all …]
|
H A D | accumulate.cpp | 72 v_dst0 = vqaddq_s16(v_dst0, v_src0); in accumulate() 125 int16x4_t v_srclo = vget_low_s16(v_src0), v_srchi = vget_high_s16(v_src0); in accumulateSquareConst() 178 int16x4_t v_srclo = vget_low_s16(v_src0), v_srchi = vget_high_s16(v_src0); in accumulateSquareConst() 277 void operator() (const uint8x16_t & v_src0, const uint8x16_t & v_src1, in operator ()() 280 v_dst = vhaddq_u8(v_src0, v_src1); in operator ()() 283 void operator() (const uint8x8_t & v_src0, const uint8x8_t & v_src1, in operator ()() 286 v_dst = vhadd_u8(v_src0, v_src1); in operator ()() 309 void operator() (const uint8x16_t & v_src0, const uint8x16_t & v_src1, in operator ()() 312 uint16x8_t v_src0_p = vmovl_u8(vget_low_u8(v_src0)); in operator ()() 321 v_src0_p = vmovl_u8(vget_high_u8(v_src0)); in operator ()() [all …]
|
H A D | fill_minmaxloc.cpp | 189 uint16x8_t v_src0 = vld1q_u16(src + j), v_src1 = vld1q_u16(src + j + 8); in fillMinMaxLocs() local 191 … uint16x8_t v_mask0 = vorrq_u16(vceqq_u16(v_src0, v_maxval8), vceqq_u16(v_src0, v_minval8)); in fillMinMaxLocs() 269 int16x8_t v_src0 = vld1q_s16(src + j), v_src1 = vld1q_s16(src + j + 8); in fillMinMaxLocs() local 271 … uint16x8_t v_mask0 = vorrq_u16(vceqq_s16(v_src0, v_maxval8), vceqq_s16(v_src0, v_minval8)); in fillMinMaxLocs() 348 int32x4_t v_src0 = vld1q_s32(src + j), v_src1 = vld1q_s32(src + j + 4); in fillMinMaxLocs() local 350 … uint32x4_t v_mask0 = vorrq_u32(vceqq_s32(v_src0, v_maxval4), vceqq_s32(v_src0, v_minval4)); in fillMinMaxLocs() 407 uint32x4_t v_src0 = vld1q_u32(src + j), v_src1 = vld1q_u32(src + j + 4); in fillMinMaxLocs() local 409 … uint32x4_t v_mask0 = vorrq_u32(vceqq_u32(v_src0, v_maxval4), vceqq_u32(v_src0, v_minval4)); in fillMinMaxLocs()
|
H A D | convert_depth.cpp | 144 int16x8_t v_src0 = vshrq_n_s16(vld1q_s16(src + j), shift), in rshiftConst() local 146 uint8x16_t v_dst = vcombine_u8(vqmovun_s16(v_src0), in rshiftConst() 166 int16x8_t v_src0 = vshrq_n_s16(vld1q_s16(src + j), shift), in rshiftConst() local 168 int8x16_t v_dst = vcombine_s8(vmovn_s16(v_src0), in rshiftConst() 206 int16x8_t v_src0 = vld1q_s16(src + j), v_src1 = vld1q_s16(src + j + 8); in rshiftConst() local 207 uint8x16_t v_dst = vcombine_u8(vqmovun_s16(v_src0), vqmovun_s16(v_src1)); in rshiftConst() 226 int16x8_t v_src0 = vld1q_s16(src + j), v_src1 = vld1q_s16(src + j + 8); in rshiftConst() local 227 int8x16_t v_dst = vcombine_s8(vmovn_s16(v_src0), vmovn_s16(v_src1)); in rshiftConst() 335 int16x8_t v_src0 = vld1q_s16(src + j), v_src1 = vld1q_s16(src + j + 8); in rshift() local 336 uint8x16_t v_dst = vcombine_u8(vmovn_u16(vcltq_s16(v_src0, v_zero)), in rshift()
|
H A D | div.cpp | 190 vec128 v_src0 = internal::vld1q(src0 + j); in div() local 198 vec64 v_src0 = internal::vld1(src0 + j); in div() local 216 vec128 v_src0 = internal::vld1q(src0 + j); in div() local 224 vec64 v_src0 = internal::vld1(src0 + j); in div() local 491 float32x4_t v_src0 = vld1q_f32(src0 + j); in div() local 499 float32x2_t v_src0 = vld1_f32(src0 + j); in div() local 502 vst1_f32(dst + j, vmul_f32(v_src0, internal::vrecp_f32(v_src1))); in div() 525 float32x4_t v_src0 = vld1q_f32(src0 + j); in div() local 528 vst1q_f32(dst + j, vmulq_f32(vmulq_n_f32(v_src0, scale), in div() 534 float32x2_t v_src0 = vld1_f32(src0 + j); in div() local [all …]
|
/dports/graphics/opencv/opencv-4.5.3/modules/imgproc/src/ |
H A D | accum.simd.hpp | 350 v_src0 = v_src0 & v_mask; in acc_simd_() 447 v_src0 = v_src0 & v_mask; in acc_simd_() 671 v_src0 = v_src0 & v_mask; in acc_simd_() 824 v_src0 = v_src0 & v_mask; in acc_simd_() 1048 v_src0 = v_mul_wrap(v_src0, v_src0); in accSqr_simd_() 1074 v_src0 = v_mul_wrap(v_src0, v_src0); in accSqr_simd_() 1096 v_src0 = v_src0 & v_mask; in accSqr_simd_() 1194 v_src0 = v_src0 & v_mask0; in accSqr_simd_() 1300 v_src0 = v_src0 & v_mask0; in accSqr_simd_() 1572 v_src0 = v_src0 & v_mask; in accSqr_simd_() [all …]
|
/dports/graphics/opencv/opencv-4.5.3/modules/core/src/ |
H A D | sum.simd.hpp | 46 v_uint16 v_src0, v_src1; in operator ()() local 48 v_sum16 += v_src0 + v_src1; in operator ()() 101 v_int16 v_src0, v_src1; in operator ()() local 103 v_sum16 += v_src0 + v_src1; in operator ()() 151 v_uint32 v_src0, v_src1; in operator ()() local 152 v_expand(vx_load(src0 + x), v_src0, v_src1); in operator ()() 153 v_sum += v_src0 + v_src1; in operator ()() 190 v_int32 v_src0, v_src1; in operator ()() local 192 v_sum += v_src0 + v_src1; in operator ()() 231 v_int32 v_src0 = vx_load(src0 + x); in operator ()() local [all …]
|
/dports/lang/gcc6-aux/gcc-6-20180516/gcc/testsuite/gcc.target/powerpc/ |
H A D | pr83677.c | 86 vector unsigned char v_src0, v_src1, v_src2; in acc_simd_() local 87 v_load_deinterleave_u8((unsigned char *)(src + (x * 3)), &v_src0, &v_src1, &v_src2); in acc_simd_() 88 v_src0 = v_src0 & v_mask; in acc_simd_() 94 v_expand_u8(&v_src0, &v_src00, &v_src01); in acc_simd_()
|
/dports/lang/gcc12-devel/gcc-12-20211205/gcc/testsuite/gcc.target/powerpc/ |
H A D | pr83677.c | 85 vector unsigned char v_src0, v_src1, v_src2; in acc_simd_() local 86 v_load_deinterleave_u8((unsigned char *)(src + (x * 3)), &v_src0, &v_src1, &v_src2); in acc_simd_() 87 v_src0 = v_src0 & v_mask; in acc_simd_() 93 v_expand_u8(&v_src0, &v_src00, &v_src01); in acc_simd_()
|
/dports/devel/riscv64-none-elf-gcc/gcc-8.4.0/gcc/testsuite/gcc.target/powerpc/ |
H A D | pr83677.c | 86 vector unsigned char v_src0, v_src1, v_src2; in acc_simd_() local 87 v_load_deinterleave_u8((unsigned char *)(src + (x * 3)), &v_src0, &v_src1, &v_src2); in acc_simd_() 88 v_src0 = v_src0 & v_mask; in acc_simd_() 94 v_expand_u8(&v_src0, &v_src00, &v_src01); in acc_simd_()
|
/dports/lang/gcc10/gcc-10.3.0/gcc/testsuite/gcc.target/powerpc/ |
H A D | pr83677.c | 85 vector unsigned char v_src0, v_src1, v_src2; in acc_simd_() local 86 v_load_deinterleave_u8((unsigned char *)(src + (x * 3)), &v_src0, &v_src1, &v_src2); in acc_simd_() 87 v_src0 = v_src0 & v_mask; in acc_simd_() 93 v_expand_u8(&v_src0, &v_src00, &v_src01); in acc_simd_()
|
/dports/lang/gcc11-devel/gcc-11-20211009/gcc/testsuite/gcc.target/powerpc/ |
H A D | pr83677.c | 85 vector unsigned char v_src0, v_src1, v_src2; in acc_simd_() local 86 v_load_deinterleave_u8((unsigned char *)(src + (x * 3)), &v_src0, &v_src1, &v_src2); in acc_simd_() 87 v_src0 = v_src0 & v_mask; in acc_simd_() 93 v_expand_u8(&v_src0, &v_src00, &v_src01); in acc_simd_()
|
/dports/lang/gcc11/gcc-11.2.0/gcc/testsuite/gcc.target/powerpc/ |
H A D | pr83677.c | 85 vector unsigned char v_src0, v_src1, v_src2; in acc_simd_() local 86 v_load_deinterleave_u8((unsigned char *)(src + (x * 3)), &v_src0, &v_src1, &v_src2); in acc_simd_() 87 v_src0 = v_src0 & v_mask; in acc_simd_() 93 v_expand_u8(&v_src0, &v_src00, &v_src01); in acc_simd_()
|
/dports/devel/arm-none-eabi-gcc/gcc-8.4.0/gcc/testsuite/gcc.target/powerpc/ |
H A D | pr83677.c | 86 vector unsigned char v_src0, v_src1, v_src2; in acc_simd_() local 87 v_load_deinterleave_u8((unsigned char *)(src + (x * 3)), &v_src0, &v_src1, &v_src2); in acc_simd_() 88 v_src0 = v_src0 & v_mask; in acc_simd_() 94 v_expand_u8(&v_src0, &v_src00, &v_src01); in acc_simd_()
|
/dports/devel/riscv32-unknown-elf-gcc/gcc-8.4.0/gcc/testsuite/gcc.target/powerpc/ |
H A D | pr83677.c | 86 vector unsigned char v_src0, v_src1, v_src2; in acc_simd_() local 87 v_load_deinterleave_u8((unsigned char *)(src + (x * 3)), &v_src0, &v_src1, &v_src2); in acc_simd_() 88 v_src0 = v_src0 & v_mask; in acc_simd_() 94 v_expand_u8(&v_src0, &v_src00, &v_src01); in acc_simd_()
|
/dports/devel/aarch64-none-elf-gcc/gcc-8.4.0/gcc/testsuite/gcc.target/powerpc/ |
H A D | pr83677.c | 86 vector unsigned char v_src0, v_src1, v_src2; in acc_simd_() local 87 v_load_deinterleave_u8((unsigned char *)(src + (x * 3)), &v_src0, &v_src1, &v_src2); in acc_simd_() 88 v_src0 = v_src0 & v_mask; in acc_simd_() 94 v_expand_u8(&v_src0, &v_src00, &v_src01); in acc_simd_()
|
/dports/lang/gcc9-aux/gcc-9.1.0/gcc/testsuite/gcc.target/powerpc/ |
H A D | pr83677.c | 85 vector unsigned char v_src0, v_src1, v_src2; in acc_simd_() local 86 v_load_deinterleave_u8((unsigned char *)(src + (x * 3)), &v_src0, &v_src1, &v_src2); in acc_simd_() 87 v_src0 = v_src0 & v_mask; in acc_simd_() 93 v_expand_u8(&v_src0, &v_src00, &v_src01); in acc_simd_()
|