/dports/graphics/vapoursynth-waifu2x-ncnn-vulkan/vapoursynth-waifu2x-ncnn-vulkan-r4/deps/ncnn/src/layer/arm/ |
H A D | convolutiondepthwise_3x3_pack8_int8.h | 113 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local 196 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local 265 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local 416 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s2_pack8_int8_neon() local
|
H A D | convolution_sgemm_pack8to4_int8.h | 770 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack8to4_int8_neon() local
|
H A D | convolution_sgemm_pack8to1_int8.h | 870 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack8to1_int8_neon() local
|
H A D | convolution_sgemm_pack1to4_int8.h | 1715 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack1to4_int8_neon() local
|
/dports/graphics/waifu2x-ncnn-vulkan/waifu2x-ncnn-vulkan-20210521/src/ncnn/src/layer/arm/ |
H A D | convolutiondepthwise_3x3_pack8_int8.h | 113 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local 195 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local 261 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local 412 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s2_pack8_int8_neon() local
|
H A D | convolution_sgemm_pack8to4_int8.h | 770 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack8to4_int8_neon() local
|
H A D | convolution_sgemm_pack8to1_int8.h | 870 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack8to1_int8_neon() local
|
H A D | convolution_sgemm_pack1to4_int8.h | 1715 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack1to4_int8_neon() local
|
/dports/benchmarks/vkpeak/vkpeak-20210430/ncnn/src/layer/arm/ |
H A D | convolutiondepthwise_3x3_pack8_int8.h | 113 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local 195 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local 261 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local 412 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s2_pack8_int8_neon() local
|
H A D | convolution_sgemm_pack8to4_int8.h | 770 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack8to4_int8_neon() local
|
H A D | convolution_sgemm_pack8to1_int8.h | 870 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack8to1_int8_neon() local
|
H A D | convolution_sgemm_pack1to4_int8.h | 1715 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack1to4_int8_neon() local
|
/dports/misc/ncnn/ncnn-20211208/src/layer/arm/ |
H A D | convolutiondepthwise_3x3_pack8_int8.h | 113 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local 196 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local 265 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s1_pack8_int8_neon() local 416 int32x4_t _sum12 = vaddl_s16(vget_low_s16(_s12), vget_low_s16(_s13)); in convdw3x3s2_pack8_int8_neon() local
|
H A D | convolution_sgemm_pack8to4_int8.h | 770 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack8to4_int8_neon() local
|
H A D | convolution_sgemm_pack8to1_int8.h | 870 int32x4_t _sum12 = vdupq_n_s32(0); in im2col_sgemm_pack8to1_int8_neon() local
|
/dports/graphics/waifu2x-ncnn-vulkan/waifu2x-ncnn-vulkan-20210521/src/ncnn/src/layer/x86/ |
H A D | convolution_3x3_pack1to8.h | 147 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s1_pack1to8_avx() local 684 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local 957 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local
|
H A D | convolution_sgemm_pack8to4_int8.h | 96 __m128i _sum12 = _mm_setzero_si128(); in im2col_sgemm_pack8to4_int8_sse() local
|
/dports/graphics/vapoursynth-waifu2x-ncnn-vulkan/vapoursynth-waifu2x-ncnn-vulkan-r4/deps/ncnn/src/layer/x86/ |
H A D | convolution_3x3_pack1to8.h | 147 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s1_pack1to8_avx() local 684 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local 957 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local
|
H A D | convolution_sgemm_pack8to4_int8.h | 96 __m128i _sum12 = _mm_setzero_si128(); in im2col_sgemm_pack8to4_int8_sse() local
|
/dports/benchmarks/vkpeak/vkpeak-20210430/ncnn/src/layer/x86/ |
H A D | convolution_3x3_pack1to8.h | 147 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s1_pack1to8_avx() local 684 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local 957 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local
|
H A D | convolution_sgemm_pack8to4_int8.h | 96 __m128i _sum12 = _mm_setzero_si128(); in im2col_sgemm_pack8to4_int8_sse() local
|
/dports/misc/ncnn/ncnn-20211208/src/layer/x86/ |
H A D | convolution_3x3_pack1to8.h | 147 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s1_pack1to8_avx() local 684 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local 957 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local
|
H A D | convolution_sgemm_pack8to4_int8.h | 96 __m128i _sum12 = _mm_setzero_si128(); in im2col_sgemm_pack8to4_int8_sse() local
|
H A D | convolution_3x3_pack1to4.h | 147 __m128 _sum12 = _mm_loadu_ps(outptr1 + 8); in conv3x3s1_pack1to4_sse() local 684 __m128 _sum12 = _mm_loadu_ps(outptr1 + 8); in conv3x3s2_pack1to4_sse() local
|
/dports/graphics/realsr-ncnn-vulkan/realsr-ncnn-vulkan-20210210/src/ncnn/src/layer/x86/ |
H A D | convolution_3x3_pack1to8.h | 147 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s1_pack1to8_avx() local 684 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local 957 __m256 _sum12 = _mm256_loadu_ps(outptr1 + 16); in conv3x3s2_pack1to8_avx() local
|