Home
last modified time | relevance | path

Searched defs:_sum12 (Results 1 – 25 of 35) sorted by relevance

12

/dports/graphics/vapoursynth-waifu2x-ncnn-vulkan/vapoursynth-waifu2x-ncnn-vulkan-r4/deps/ncnn/src/layer/arm/
H A Dconvolutiondepthwise_3x3_pack8_int8.h113 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local
196 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local
265 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local
416 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s2_pack8_int8_neon() local
H A Dconvolution_sgemm_pack8to4_int8.h770 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack8to4_int8_neon() local
H A Dconvolution_sgemm_pack8to1_int8.h870 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack8to1_int8_neon() local
H A Dconvolution_sgemm_pack1to4_int8.h1715 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack1to4_int8_neon() local
/dports/graphics/waifu2x-ncnn-vulkan/waifu2x-ncnn-vulkan-20210521/src/ncnn/src/layer/arm/
H A Dconvolutiondepthwise_3x3_pack8_int8.h113 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local
195 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local
261 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local
412 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s2_pack8_int8_neon() local
H A Dconvolution_sgemm_pack8to4_int8.h770 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack8to4_int8_neon() local
H A Dconvolution_sgemm_pack8to1_int8.h870 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack8to1_int8_neon() local
H A Dconvolution_sgemm_pack1to4_int8.h1715 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack1to4_int8_neon() local
/dports/benchmarks/vkpeak/vkpeak-20210430/ncnn/src/layer/arm/
H A Dconvolutiondepthwise_3x3_pack8_int8.h113 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local
195 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local
261 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local
412 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s2_pack8_int8_neon() local
H A Dconvolution_sgemm_pack8to4_int8.h770 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack8to4_int8_neon() local
H A Dconvolution_sgemm_pack8to1_int8.h870 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack8to1_int8_neon() local
H A Dconvolution_sgemm_pack1to4_int8.h1715 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack1to4_int8_neon() local
/dports/misc/ncnn/ncnn-20211208/src/layer/arm/
H A Dconvolutiondepthwise_3x3_pack8_int8.h113 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local
196 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local
265 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local
416 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s2_pack8_int8_neon() local
H A Dconvolution_sgemm_pack8to4_int8.h770 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack8to4_int8_neon() local
H A Dconvolution_sgemm_pack8to1_int8.h870 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack8to1_int8_neon() local
/dports/graphics/waifu2x-ncnn-vulkan/waifu2x-ncnn-vulkan-20210521/src/ncnn/src/layer/x86/
H A Dconvolution_3x3_pack1to8.h147 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s1_pack1to8_avx() local
684 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local
957 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local
H A Dconvolution_sgemm_pack8to4_int8.h96 __m128i _sum12 = _mm_setzero_si128(); in im2col_sgemm_pack8to4_int8_sse() local
/dports/graphics/vapoursynth-waifu2x-ncnn-vulkan/vapoursynth-waifu2x-ncnn-vulkan-r4/deps/ncnn/src/layer/x86/
H A Dconvolution_3x3_pack1to8.h147 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s1_pack1to8_avx() local
684 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local
957 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local
H A Dconvolution_sgemm_pack8to4_int8.h96 __m128i _sum12 = _mm_setzero_si128(); in im2col_sgemm_pack8to4_int8_sse() local
/dports/benchmarks/vkpeak/vkpeak-20210430/ncnn/src/layer/x86/
H A Dconvolution_3x3_pack1to8.h147 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s1_pack1to8_avx() local
684 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local
957 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local
H A Dconvolution_sgemm_pack8to4_int8.h96 __m128i _sum12 = _mm_setzero_si128(); in im2col_sgemm_pack8to4_int8_sse() local
/dports/misc/ncnn/ncnn-20211208/src/layer/x86/
H A Dconvolution_3x3_pack1to8.h147 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s1_pack1to8_avx() local
684 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local
957 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local
H A Dconvolution_sgemm_pack8to4_int8.h96 __m128i _sum12 = _mm_setzero_si128(); in im2col_sgemm_pack8to4_int8_sse() local
H A Dconvolution_3x3_pack1to4.h147 __m128 _sum12 = _mm_loadu_ps(outptr1 + 8); in conv3x3s1_pack1to4_sse() local
684 __m128 _sum12 = _mm_loadu_ps(outptr1 + 8); in conv3x3s2_pack1to4_sse() local
/dports/graphics/realsr-ncnn-vulkan/realsr-ncnn-vulkan-20210210/src/ncnn/src/layer/x86/
H A Dconvolution_3x3_pack1to8.h147 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s1_pack1to8_avx() local
684 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local
957 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local

12