Home
last modified time | relevance | path

Searched refs:vsubq_f32 (Results 1 – 25 of 534) sorted by relevance

12345678910>>...22

/dports/www/qt5-webengine/qtwebengine-everywhere-src-5.15.2/src/3rdparty/chromium/third_party/webrtc/modules/audio_processing/utility/
H A Dooura_fft_neon.cc46 const float32x4_t x1v = vsubq_f32(a01v, a23v); in cft1st_128_neon()
48 const float32x4_t x3v = vsubq_f32(a45v, a67v); in cft1st_128_neon()
52 x0v = vsubq_f32(x0v, x2v); in cft1st_128_neon()
213 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftfsub_128_neon()
234 const float32x4_t a_k2_p1n = vsubq_f32(a_k2_p1, yi_); in rftfsub_128_neon()
241 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftfsub_128_neon()
243 a_j2_p.val[1] = vsubq_f32(a_j2_p.val[1], yi_); in rftfsub_128_neon()
293 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftbsub_128_neon()
314 const float32x4_t a_k2_p1n = vsubq_f32(yi_, a_k2_p1); in rftbsub_128_neon()
322 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftbsub_128_neon()
[all …]
/dports/net-im/telegram-desktop/tdesktop-3.2.5-full/Telegram/ThirdParty/libtgvoip/webrtc_dsp/modules/audio_processing/utility/
H A Dooura_fft_neon.cc48 const float32x4_t x1v = vsubq_f32(a01v, a23v); in cft1st_128_neon()
50 const float32x4_t x3v = vsubq_f32(a45v, a67v); in cft1st_128_neon()
54 x0v = vsubq_f32(x0v, x2v); in cft1st_128_neon()
215 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftfsub_128_neon()
236 const float32x4_t a_k2_p1n = vsubq_f32(a_k2_p1, yi_); in rftfsub_128_neon()
243 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftfsub_128_neon()
245 a_j2_p.val[1] = vsubq_f32(a_j2_p.val[1], yi_); in rftfsub_128_neon()
295 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftbsub_128_neon()
316 const float32x4_t a_k2_p1n = vsubq_f32(yi_, a_k2_p1); in rftbsub_128_neon()
324 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftbsub_128_neon()
[all …]
/dports/net-im/tg_owt/tg_owt-d578c76/src/common_audio/third_party/ooura/fft_size_128/
H A Dooura_fft_neon.cc46 const float32x4_t x1v = vsubq_f32(a01v, a23v); in cft1st_128_neon()
48 const float32x4_t x3v = vsubq_f32(a45v, a67v); in cft1st_128_neon()
52 x0v = vsubq_f32(x0v, x2v); in cft1st_128_neon()
213 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftfsub_128_neon()
234 const float32x4_t a_k2_p1n = vsubq_f32(a_k2_p1, yi_); in rftfsub_128_neon()
241 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftfsub_128_neon()
243 a_j2_p.val[1] = vsubq_f32(a_j2_p.val[1], yi_); in rftfsub_128_neon()
293 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftbsub_128_neon()
314 const float32x4_t a_k2_p1n = vsubq_f32(yi_, a_k2_p1); in rftbsub_128_neon()
322 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftbsub_128_neon()
[all …]
/dports/www/chromium-legacy/chromium-88.0.4324.182/third_party/webrtc/common_audio/third_party/ooura/fft_size_128/
H A Dooura_fft_neon.cc46 const float32x4_t x1v = vsubq_f32(a01v, a23v); in cft1st_128_neon()
48 const float32x4_t x3v = vsubq_f32(a45v, a67v); in cft1st_128_neon()
52 x0v = vsubq_f32(x0v, x2v); in cft1st_128_neon()
213 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftfsub_128_neon()
234 const float32x4_t a_k2_p1n = vsubq_f32(a_k2_p1, yi_); in rftfsub_128_neon()
241 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftfsub_128_neon()
243 a_j2_p.val[1] = vsubq_f32(a_j2_p.val[1], yi_); in rftfsub_128_neon()
293 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftbsub_128_neon()
314 const float32x4_t a_k2_p1n = vsubq_f32(yi_, a_k2_p1); in rftbsub_128_neon()
322 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftbsub_128_neon()
[all …]
/dports/www/firefox/firefox-99.0/third_party/libwebrtc/common_audio/third_party/ooura/fft_size_128/
H A Dooura_fft_neon.cc46 const float32x4_t x1v = vsubq_f32(a01v, a23v); in cft1st_128_neon()
48 const float32x4_t x3v = vsubq_f32(a45v, a67v); in cft1st_128_neon()
52 x0v = vsubq_f32(x0v, x2v); in cft1st_128_neon()
213 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftfsub_128_neon()
234 const float32x4_t a_k2_p1n = vsubq_f32(a_k2_p1, yi_); in rftfsub_128_neon()
241 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftfsub_128_neon()
243 a_j2_p.val[1] = vsubq_f32(a_j2_p.val[1], yi_); in rftfsub_128_neon()
293 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftbsub_128_neon()
314 const float32x4_t a_k2_p1n = vsubq_f32(yi_, a_k2_p1); in rftbsub_128_neon()
322 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftbsub_128_neon()
[all …]
/dports/net/pjsip/pjproject-2.11.1/third_party/webrtc/src/webrtc/modules/audio_processing/aec/
H A Daec_rdft_neon.c45 const float32x4_t x1v = vsubq_f32(a01v, a23v); in cft1st_128_neon()
47 const float32x4_t x3v = vsubq_f32(a45v, a67v); in cft1st_128_neon()
51 x0v = vsubq_f32(x0v, x2v); in cft1st_128_neon()
212 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftfsub_128_neon()
233 const float32x4_t a_k2_p1n = vsubq_f32(a_k2_p1, yi_); in rftfsub_128_neon()
240 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftfsub_128_neon()
242 a_j2_p.val[1] = vsubq_f32(a_j2_p.val[1], yi_); in rftfsub_128_neon()
292 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftbsub_128_neon()
313 const float32x4_t a_k2_p1n = vsubq_f32(yi_, a_k2_p1); in rftbsub_128_neon()
321 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftbsub_128_neon()
[all …]
/dports/mail/thunderbird/thunderbird-91.8.0/third_party/libwebrtc/webrtc/modules/audio_processing/utility/
H A Dooura_fft_neon.cc47 const float32x4_t x1v = vsubq_f32(a01v, a23v); in cft1st_128_neon()
49 const float32x4_t x3v = vsubq_f32(a45v, a67v); in cft1st_128_neon()
53 x0v = vsubq_f32(x0v, x2v); in cft1st_128_neon()
214 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftfsub_128_neon()
235 const float32x4_t a_k2_p1n = vsubq_f32(a_k2_p1, yi_); in rftfsub_128_neon()
242 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftfsub_128_neon()
244 a_j2_p.val[1] = vsubq_f32(a_j2_p.val[1], yi_); in rftfsub_128_neon()
294 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftbsub_128_neon()
315 const float32x4_t a_k2_p1n = vsubq_f32(yi_, a_k2_p1); in rftbsub_128_neon()
323 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftbsub_128_neon()
[all …]
/dports/lang/spidermonkey60/firefox-60.9.0/media/webrtc/trunk/webrtc/modules/audio_processing/utility/
H A Dooura_fft_neon.cc47 const float32x4_t x1v = vsubq_f32(a01v, a23v); in cft1st_128_neon()
49 const float32x4_t x3v = vsubq_f32(a45v, a67v); in cft1st_128_neon()
53 x0v = vsubq_f32(x0v, x2v); in cft1st_128_neon()
214 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftfsub_128_neon()
235 const float32x4_t a_k2_p1n = vsubq_f32(a_k2_p1, yi_); in rftfsub_128_neon()
242 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftfsub_128_neon()
244 a_j2_p.val[1] = vsubq_f32(a_j2_p.val[1], yi_); in rftfsub_128_neon()
294 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftbsub_128_neon()
315 const float32x4_t a_k2_p1n = vsubq_f32(yi_, a_k2_p1); in rftbsub_128_neon()
323 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftbsub_128_neon()
[all …]
/dports/www/firefox-legacy/firefox-52.8.0esr/media/webrtc/trunk/webrtc/modules/audio_processing/aec/
H A Daec_rdft_neon.c45 const float32x4_t x1v = vsubq_f32(a01v, a23v); in cft1st_128_neon()
47 const float32x4_t x3v = vsubq_f32(a45v, a67v); in cft1st_128_neon()
51 x0v = vsubq_f32(x0v, x2v); in cft1st_128_neon()
212 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftfsub_128_neon()
233 const float32x4_t a_k2_p1n = vsubq_f32(a_k2_p1, yi_); in rftfsub_128_neon()
240 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftfsub_128_neon()
242 a_j2_p.val[1] = vsubq_f32(a_j2_p.val[1], yi_); in rftfsub_128_neon()
292 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftbsub_128_neon()
313 const float32x4_t a_k2_p1n = vsubq_f32(yi_, a_k2_p1); in rftbsub_128_neon()
321 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftbsub_128_neon()
[all …]
/dports/www/firefox-esr/firefox-91.8.0/third_party/libwebrtc/webrtc/modules/audio_processing/utility/
H A Dooura_fft_neon.cc47 const float32x4_t x1v = vsubq_f32(a01v, a23v); in cft1st_128_neon()
49 const float32x4_t x3v = vsubq_f32(a45v, a67v); in cft1st_128_neon()
53 x0v = vsubq_f32(x0v, x2v); in cft1st_128_neon()
214 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftfsub_128_neon()
235 const float32x4_t a_k2_p1n = vsubq_f32(a_k2_p1, yi_); in rftfsub_128_neon()
242 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftfsub_128_neon()
244 a_j2_p.val[1] = vsubq_f32(a_j2_p.val[1], yi_); in rftfsub_128_neon()
294 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftbsub_128_neon()
315 const float32x4_t a_k2_p1n = vsubq_f32(yi_, a_k2_p1); in rftbsub_128_neon()
323 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftbsub_128_neon()
[all …]
/dports/audio/webrtc-audio-processing0/webrtc-audio-processing-0.3.1/webrtc/modules/audio_processing/aec/
H A Daec_rdft_neon.c45 const float32x4_t x1v = vsubq_f32(a01v, a23v); in cft1st_128_neon()
47 const float32x4_t x3v = vsubq_f32(a45v, a67v); in cft1st_128_neon()
51 x0v = vsubq_f32(x0v, x2v); in cft1st_128_neon()
212 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftfsub_128_neon()
233 const float32x4_t a_k2_p1n = vsubq_f32(a_k2_p1, yi_); in rftfsub_128_neon()
240 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftfsub_128_neon()
242 a_j2_p.val[1] = vsubq_f32(a_j2_p.val[1], yi_); in rftfsub_128_neon()
292 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftbsub_128_neon()
313 const float32x4_t a_k2_p1n = vsubq_f32(yi_, a_k2_p1); in rftbsub_128_neon()
321 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftbsub_128_neon()
[all …]
/dports/audio/webrtc-audio-processing/webrtc-audio-processing-1.0/webrtc/common_audio/third_party/ooura/fft_size_128/
H A Dooura_fft_neon.cc46 const float32x4_t x1v = vsubq_f32(a01v, a23v); in cft1st_128_neon()
48 const float32x4_t x3v = vsubq_f32(a45v, a67v); in cft1st_128_neon()
52 x0v = vsubq_f32(x0v, x2v); in cft1st_128_neon()
213 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftfsub_128_neon()
234 const float32x4_t a_k2_p1n = vsubq_f32(a_k2_p1, yi_); in rftfsub_128_neon()
241 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftfsub_128_neon()
243 a_j2_p.val[1] = vsubq_f32(a_j2_p.val[1], yi_); in rftfsub_128_neon()
293 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftbsub_128_neon()
314 const float32x4_t a_k2_p1n = vsubq_f32(yi_, a_k2_p1); in rftbsub_128_neon()
322 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftbsub_128_neon()
[all …]
/dports/lang/spidermonkey78/firefox-78.9.0/media/webrtc/trunk/webrtc/modules/audio_processing/utility/
H A Dooura_fft_neon.cc47 const float32x4_t x1v = vsubq_f32(a01v, a23v); in cft1st_128_neon()
49 const float32x4_t x3v = vsubq_f32(a45v, a67v); in cft1st_128_neon()
53 x0v = vsubq_f32(x0v, x2v); in cft1st_128_neon()
214 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftfsub_128_neon()
235 const float32x4_t a_k2_p1n = vsubq_f32(a_k2_p1, yi_); in rftfsub_128_neon()
242 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftfsub_128_neon()
244 a_j2_p.val[1] = vsubq_f32(a_j2_p.val[1], yi_); in rftfsub_128_neon()
294 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftbsub_128_neon()
315 const float32x4_t a_k2_p1n = vsubq_f32(yi_, a_k2_p1); in rftbsub_128_neon()
323 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftbsub_128_neon()
[all …]
/dports/multimedia/mswebrtc/mswebrtc-1.1.1/webrtc/webrtc/modules/audio_processing/aec/
H A Daec_rdft_neon.c45 const float32x4_t x1v = vsubq_f32(a01v, a23v); in cft1st_128_neon()
47 const float32x4_t x3v = vsubq_f32(a45v, a67v); in cft1st_128_neon()
51 x0v = vsubq_f32(x0v, x2v); in cft1st_128_neon()
212 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftfsub_128_neon()
233 const float32x4_t a_k2_p1n = vsubq_f32(a_k2_p1, yi_); in rftfsub_128_neon()
240 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftfsub_128_neon()
242 a_j2_p.val[1] = vsubq_f32(a_j2_p.val[1], yi_); in rftfsub_128_neon()
292 const float32x4_t xr_ = vsubq_f32(a_j2_p.val[0], a_k2_p0); in rftbsub_128_neon()
313 const float32x4_t a_k2_p1n = vsubq_f32(yi_, a_k2_p1); in rftbsub_128_neon()
321 a_j2_p.val[0] = vsubq_f32(a_j2_p.val[0], yr_); in rftbsub_128_neon()
[all …]
/dports/www/chromium-legacy/chromium-88.0.4324.182/third_party/blink/renderer/modules/webaudio/cpu/arm/
H A Doscillator_kernel_neon.cc27 return vsubq_f32(x, vmulq_f32(vcvtq_f32_s32(f), wave_size)); in WrapVirtualIndexVector()
110 vsubq_f32(v_virt_index, vcvtq_f32_u32(read_index_0)); in ProcessKRateVector()
112 s1_high, vmulq_f32(interpolation_factor, vsubq_f32(s2_high, s1_high))); in ProcessKRateVector()
114 s1_low, vmulq_f32(interpolation_factor, vsubq_f32(s2_low, s1_low))); in ProcessKRateVector()
117 vmulq_f32(v_table_factor, vsubq_f32(sample_lower, sample_higher))); in ProcessKRateVector()
216 const float32x4_t v_factor = vsubq_f32(v_virt_index, vcvtq_f32_u32(v_read0)); in ProcessARateVectorKernel()
221 vsubq_f32(vld1q_f32(sample2_higher), vld1q_f32(sample1_higher))); in ProcessARateVectorKernel()
226 vsubq_f32(vld1q_f32(sample2_lower), vld1q_f32(sample1_lower))); in ProcessARateVectorKernel()
232 vsubq_f32(sample_lower, sample_higher)); in ProcessARateVectorKernel()
/dports/devel/libflatarray/libflatarray-0.3.0/src/detail/
H A Dshort_vec_neon_float_32.hpp78 val1 = vsubq_f32(val1, other.val1); in operator -=()
79 val2 = vsubq_f32(val2, other.val2); in operator -=()
80 val3 = vsubq_f32(val3, other.val3); in operator -=()
81 val4 = vsubq_f32(val4, other.val4); in operator -=()
82 val5 = vsubq_f32(val5, other.val5); in operator -=()
83 val6 = vsubq_f32(val6, other.val6); in operator -=()
84 val7 = vsubq_f32(val7, other.val7); in operator -=()
92 vsubq_f32(val1, other.val1), vsubq_f32(val2, other.val2), in operator -()
93 vsubq_f32(val3, other.val3), vsubq_f32(val4, other.val4), in operator -()
94 vsubq_f32(val5, other.val5), vsubq_f32(val6, other.val6), in operator -()
[all …]
/dports/graphics/vapoursynth-waifu2x-ncnn-vulkan/vapoursynth-waifu2x-ncnn-vulkan-r4/deps/ncnn/src/layer/arm/
H A Dconvolution_3x3_pack4_bf16s.h105 … float32x4_t _tmp0m = vmlaq_n_f32(vsubq_f32(_r00, _r06), vsubq_f32(_r04, _r02), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
106 … float32x4_t _tmp7m = vmlaq_n_f32(vsubq_f32(_r07, _r01), vsubq_f32(_r03, _r05), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
120 float32x4_t _tmp2m = vsubq_f32(_tmp12a, _tmp12b); in conv3x3s1_winograd64_pack4_bf16s_neon()
178 … float32x4_t _r0tm0 = vmlaq_n_f32(vsubq_f32(_tmp00, _tmp06), vsubq_f32(_tmp04, _tmp02), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
179 … float32x4_t _r0tm7 = vmlaq_n_f32(vsubq_f32(_tmp07, _tmp01), vsubq_f32(_tmp03, _tmp05), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
1896 … float32x4_t _tmp2m = vmlaq_n_f32(vsubq_f32(_r04, _r03), vsubq_f32(_r01, _r02), 4.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1897 … float32x4_t _tmp3m = vmlsq_n_f32(vsubq_f32(_r04, _r02), vsubq_f32(_r01, _r03), 2.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1898 … float32x4_t _tmp4m = vmlaq_n_f32(vsubq_f32(_r04, _r02), vsubq_f32(_r01, _r03), 2.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1929 … float32x4_t _r0tm2 = vmlaq_n_f32(vsubq_f32(_tmp04, _tmp03), vsubq_f32(_tmp01, _tmp02), 4.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1930 … float32x4_t _r0tm3 = vmlsq_n_f32(vsubq_f32(_tmp04, _tmp02), vsubq_f32(_tmp01, _tmp03), 2.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
[all …]
/dports/graphics/waifu2x-ncnn-vulkan/waifu2x-ncnn-vulkan-20210521/src/ncnn/src/layer/arm/
H A Dconvolution_3x3_pack4_bf16s.h105 … float32x4_t _tmp0m = vmlaq_n_f32(vsubq_f32(_r00, _r06), vsubq_f32(_r04, _r02), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
106 … float32x4_t _tmp7m = vmlaq_n_f32(vsubq_f32(_r07, _r01), vsubq_f32(_r03, _r05), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
120 float32x4_t _tmp2m = vsubq_f32(_tmp12a, _tmp12b); in conv3x3s1_winograd64_pack4_bf16s_neon()
178 … float32x4_t _r0tm0 = vmlaq_n_f32(vsubq_f32(_tmp00, _tmp06), vsubq_f32(_tmp04, _tmp02), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
179 … float32x4_t _r0tm7 = vmlaq_n_f32(vsubq_f32(_tmp07, _tmp01), vsubq_f32(_tmp03, _tmp05), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
1896 … float32x4_t _tmp2m = vmlaq_n_f32(vsubq_f32(_r04, _r03), vsubq_f32(_r01, _r02), 4.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1897 … float32x4_t _tmp3m = vmlsq_n_f32(vsubq_f32(_r04, _r02), vsubq_f32(_r01, _r03), 2.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1898 … float32x4_t _tmp4m = vmlaq_n_f32(vsubq_f32(_r04, _r02), vsubq_f32(_r01, _r03), 2.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1929 … float32x4_t _r0tm2 = vmlaq_n_f32(vsubq_f32(_tmp04, _tmp03), vsubq_f32(_tmp01, _tmp02), 4.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1930 … float32x4_t _r0tm3 = vmlsq_n_f32(vsubq_f32(_tmp04, _tmp02), vsubq_f32(_tmp01, _tmp03), 2.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
[all …]
/dports/benchmarks/vkpeak/vkpeak-20210430/ncnn/src/layer/arm/
H A Dconvolution_3x3_pack4_bf16s.h105 … float32x4_t _tmp0m = vmlaq_n_f32(vsubq_f32(_r00, _r06), vsubq_f32(_r04, _r02), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
106 … float32x4_t _tmp7m = vmlaq_n_f32(vsubq_f32(_r07, _r01), vsubq_f32(_r03, _r05), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
120 float32x4_t _tmp2m = vsubq_f32(_tmp12a, _tmp12b); in conv3x3s1_winograd64_pack4_bf16s_neon()
178 … float32x4_t _r0tm0 = vmlaq_n_f32(vsubq_f32(_tmp00, _tmp06), vsubq_f32(_tmp04, _tmp02), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
179 … float32x4_t _r0tm7 = vmlaq_n_f32(vsubq_f32(_tmp07, _tmp01), vsubq_f32(_tmp03, _tmp05), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
1896 … float32x4_t _tmp2m = vmlaq_n_f32(vsubq_f32(_r04, _r03), vsubq_f32(_r01, _r02), 4.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1897 … float32x4_t _tmp3m = vmlsq_n_f32(vsubq_f32(_r04, _r02), vsubq_f32(_r01, _r03), 2.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1898 … float32x4_t _tmp4m = vmlaq_n_f32(vsubq_f32(_r04, _r02), vsubq_f32(_r01, _r03), 2.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1929 … float32x4_t _r0tm2 = vmlaq_n_f32(vsubq_f32(_tmp04, _tmp03), vsubq_f32(_tmp01, _tmp02), 4.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1930 … float32x4_t _r0tm3 = vmlsq_n_f32(vsubq_f32(_tmp04, _tmp02), vsubq_f32(_tmp01, _tmp03), 2.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
[all …]
/dports/misc/ncnn/ncnn-20211208/src/layer/arm/
H A Dconvolution_3x3_pack4_bf16s.h105 … float32x4_t _tmp0m = vmlaq_n_f32(vsubq_f32(_r00, _r06), vsubq_f32(_r04, _r02), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
106 … float32x4_t _tmp7m = vmlaq_n_f32(vsubq_f32(_r07, _r01), vsubq_f32(_r03, _r05), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
120 float32x4_t _tmp2m = vsubq_f32(_tmp12a, _tmp12b); in conv3x3s1_winograd64_pack4_bf16s_neon()
178 … float32x4_t _r0tm0 = vmlaq_n_f32(vsubq_f32(_tmp00, _tmp06), vsubq_f32(_tmp04, _tmp02), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
179 … float32x4_t _r0tm7 = vmlaq_n_f32(vsubq_f32(_tmp07, _tmp01), vsubq_f32(_tmp03, _tmp05), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
1896 … float32x4_t _tmp2m = vmlaq_n_f32(vsubq_f32(_r04, _r03), vsubq_f32(_r01, _r02), 4.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1897 … float32x4_t _tmp3m = vmlsq_n_f32(vsubq_f32(_r04, _r02), vsubq_f32(_r01, _r03), 2.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1898 … float32x4_t _tmp4m = vmlaq_n_f32(vsubq_f32(_r04, _r02), vsubq_f32(_r01, _r03), 2.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1929 … float32x4_t _r0tm2 = vmlaq_n_f32(vsubq_f32(_tmp04, _tmp03), vsubq_f32(_tmp01, _tmp02), 4.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1930 … float32x4_t _r0tm3 = vmlsq_n_f32(vsubq_f32(_tmp04, _tmp02), vsubq_f32(_tmp01, _tmp03), 2.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
[all …]
/dports/graphics/realsr-ncnn-vulkan/realsr-ncnn-vulkan-20210210/src/ncnn/src/layer/arm/
H A Dconvolution_3x3_pack4_bf16s.h105 … float32x4_t _tmp0m = vmlaq_n_f32(vsubq_f32(_r00, _r06), vsubq_f32(_r04, _r02), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
106 … float32x4_t _tmp7m = vmlaq_n_f32(vsubq_f32(_r07, _r01), vsubq_f32(_r03, _r05), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
120 float32x4_t _tmp2m = vsubq_f32(_tmp12a, _tmp12b); in conv3x3s1_winograd64_pack4_bf16s_neon()
178 … float32x4_t _r0tm0 = vmlaq_n_f32(vsubq_f32(_tmp00, _tmp06), vsubq_f32(_tmp04, _tmp02), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
179 … float32x4_t _r0tm7 = vmlaq_n_f32(vsubq_f32(_tmp07, _tmp01), vsubq_f32(_tmp03, _tmp05), 5.25f); in conv3x3s1_winograd64_pack4_bf16s_neon()
1896 … float32x4_t _tmp2m = vmlaq_n_f32(vsubq_f32(_r04, _r03), vsubq_f32(_r01, _r02), 4.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1897 … float32x4_t _tmp3m = vmlsq_n_f32(vsubq_f32(_r04, _r02), vsubq_f32(_r01, _r03), 2.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1898 … float32x4_t _tmp4m = vmlaq_n_f32(vsubq_f32(_r04, _r02), vsubq_f32(_r01, _r03), 2.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1929 … float32x4_t _r0tm2 = vmlaq_n_f32(vsubq_f32(_tmp04, _tmp03), vsubq_f32(_tmp01, _tmp02), 4.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
1930 … float32x4_t _r0tm3 = vmlsq_n_f32(vsubq_f32(_tmp04, _tmp02), vsubq_f32(_tmp01, _tmp03), 2.f); in conv3x3s1_winograd42_pack4_bf16s_neon()
[all …]
/dports/graphics/opencv/opencv-4.5.3/3rdparty/carotene/src/
H A Dsobel.cpp151 tnext = vsubq_f32(vsubq_f32(x2, x1), vsubq_f32(x1, x0)); in Sobel3x3()
155 tnext = vsubq_f32(x2, x0); in Sobel3x3()
188 t0 = vsubq_f32(vsubq_f32(t2, t1), vsubq_f32(t1, t0)); in Sobel3x3()
192 t0 = vsubq_f32(t2, t0); in Sobel3x3()
/dports/audio/madronalib/madronalib-1.6-1016-g103895f/source/DSP/
H A DMLDSPMathNEON.h88 x = vsubq_f32(x, one); in log_ps()
89 e = vsubq_f32(e, vreinterpretq_f32_u32(vandq_u32(vreinterpretq_u32_f32(one), mask))); in log_ps()
119 y = vsubq_f32(y, tmp); in log_ps()
162 fx = vsubq_f32(tmp, vreinterpretq_f32_u32(mask)); in exp_ps()
166 x = vsubq_f32(x, tmp); in exp_ps()
167 x = vsubq_f32(x, z); in exp_ps()
288 y1 = vsubq_f32(y1, vmulq_f32(z, vdupq_n_f32(0.5f))); in sincos_ps()
/dports/audio/sonic-visualiser/sonic-visualiser-4.0.1/bqvec/pommier/
H A Dneon_mathfun.h79 x = vsubq_f32(x, one); in log_ps()
80 e = vsubq_f32(e, vreinterpretq_f32_u32(vandq_u32(vreinterpretq_u32_f32(one), mask))); in log_ps()
112 y = vsubq_f32(y, tmp); in log_ps()
154 fx = vsubq_f32(tmp, vreinterpretq_f32_u32(mask)); in exp_ps()
158 x = vsubq_f32(x, tmp); in exp_ps()
159 x = vsubq_f32(x, z); in exp_ps()
278 y1 = vsubq_f32(y1, vmulq_f32(z, vdupq_n_f32(0.5f))); in sincos_ps()
/dports/audio/rubberband/rubberband-2.0.0/src/pommier/
H A Dneon_mathfun.h79 x = vsubq_f32(x, one); in log_ps()
80 e = vsubq_f32(e, vreinterpretq_f32_u32(vandq_u32(vreinterpretq_u32_f32(one), mask))); in log_ps()
112 y = vsubq_f32(y, tmp); in log_ps()
154 fx = vsubq_f32(tmp, vreinterpretq_f32_u32(mask)); in exp_ps()
158 x = vsubq_f32(x, tmp); in exp_ps()
159 x = vsubq_f32(x, z); in exp_ps()
278 y1 = vsubq_f32(y1, vmulq_f32(z, vdupq_n_f32(0.5f))); in sincos_ps()

12345678910>>...22