Home
last modified time | relevance | path

Searched refs:_k22 (Results 51 – 75 of 96) sorted by relevance

1234

/dports/misc/ncnn/ncnn-20211208/src/layer/riscv/
H A Dconvolutiondepthwise_3x3_packn_fp16s.h56 vfloat16m1_t _k22 = vle16_v_f16m1(k0 + packn * 8, vl); in convdw3x3s1_packn_fp16sa_rvv() local
106 _sum00 = vfmacc_vv_f16m1(_sum00, _k22, _r22, vl); in convdw3x3s1_packn_fp16sa_rvv()
109 _sum01 = vfmacc_vv_f16m1(_sum01, _k22, _r23, vl); in convdw3x3s1_packn_fp16sa_rvv()
124 _sum10 = vfmacc_vv_f16m1(_sum10, _k22, _r32, vl); in convdw3x3s1_packn_fp16sa_rvv()
127 _sum11 = vfmacc_vv_f16m1(_sum11, _k22, _r33, vl); in convdw3x3s1_packn_fp16sa_rvv()
172 _sum0 = vfmacc_vv_f16m1(_sum0, _k22, _r22, vl); in convdw3x3s1_packn_fp16sa_rvv()
183 _sum1 = vfmacc_vv_f16m1(_sum1, _k22, _r32, vl); in convdw3x3s1_packn_fp16sa_rvv()
244 _sum00 = vfmacc_vv_f16m1(_sum00, _k22, _r22, vl); in convdw3x3s1_packn_fp16sa_rvv()
284 _sum0 = vfmacc_vv_f16m1(_sum0, _k22, _r22, vl); in convdw3x3s1_packn_fp16sa_rvv()
343 vfloat16m1_t _k22 = vle16_v_f16m1(k0 + packn * 8, vl); in convdw3x3s2_packn_fp16sa_rvv() local
[all …]
H A Dconvolutiondepthwise_5x5_packn.h117 vfloat32m1_t _k22 = vle32_v_f32m1(k0 + packn * 2, vl); in convdw5x5s1_packn_rvv() local
124 _sum0 = vfmacc_vv_f32m1(_sum0, _k22, _r22, vl); in convdw5x5s1_packn_rvv()
136 _sum1 = vfmacc_vv_f32m1(_sum1, _k22, _r32, vl); in convdw5x5s1_packn_rvv()
267 vfloat32m1_t _k22 = vle32_v_f32m1(k0 + packn * 2, vl); in convdw5x5s1_packn_rvv() local
274 _sum0 = vfmacc_vv_f32m1(_sum0, _k22, _r22, vl); in convdw5x5s1_packn_rvv()
425 vfloat32m1_t _k22 = vle32_v_f32m1(k0 + packn * 2, vl); in convdw5x5s2_packn_rvv() local
432 _sum0 = vfmacc_vv_f32m1(_sum0, _k22, _r22, vl); in convdw5x5s2_packn_rvv()
H A Dconvolutiondepthwise_5x5_packn_fp16s.h117 vfloat16m1_t _k22 = vle16_v_f16m1(k0 + packn * 2, vl); in convdw5x5s1_packn_fp16sa_rvv() local
124 _sum0 = vfmacc_vv_f16m1(_sum0, _k22, _r22, vl); in convdw5x5s1_packn_fp16sa_rvv()
136 _sum1 = vfmacc_vv_f16m1(_sum1, _k22, _r32, vl); in convdw5x5s1_packn_fp16sa_rvv()
267 vfloat16m1_t _k22 = vle16_v_f16m1(k0 + packn * 2, vl); in convdw5x5s1_packn_fp16sa_rvv() local
274 _sum0 = vfmacc_vv_f16m1(_sum0, _k22, _r22, vl); in convdw5x5s1_packn_fp16sa_rvv()
425 vfloat16m1_t _k22 = vle16_v_f16m1(k0 + packn * 2, vl); in convdw5x5s2_packn_fp16sa_rvv() local
432 _sum0 = vfmacc_vv_f16m1(_sum0, _k22, _r22, vl); in convdw5x5s2_packn_fp16sa_rvv()
H A Dconvolution_7x7_pack1ton.h231 _sum0 = vfmacc_vf_f32m1(_sum0, r2[2], _k22, vl); in conv7x7s2_pack1ton_rvv()
232 _sum1 = vfmacc_vf_f32m1(_sum1, r2[4], _k22, vl); in conv7x7s2_pack1ton_rvv()
233 _sum2 = vfmacc_vf_f32m1(_sum2, r2[6], _k22, vl); in conv7x7s2_pack1ton_rvv()
234 _sum3 = vfmacc_vf_f32m1(_sum3, r2[8], _k22, vl); in conv7x7s2_pack1ton_rvv()
235 _sum4 = vfmacc_vf_f32m1(_sum4, r2[10], _k22, vl); in conv7x7s2_pack1ton_rvv()
236 _sum5 = vfmacc_vf_f32m1(_sum5, r2[12], _k22, vl); in conv7x7s2_pack1ton_rvv()
237 _sum6 = vfmacc_vf_f32m1(_sum6, r2[14], _k22, vl); in conv7x7s2_pack1ton_rvv()
238 _sum7 = vfmacc_vf_f32m1(_sum7, r2[16], _k22, vl); in conv7x7s2_pack1ton_rvv()
662 _sum0 = vfmacc_vf_f32m1(_sum0, r2[2], _k22, vl); in conv7x7s2_pack1ton_rvv()
663 _sum1 = vfmacc_vf_f32m1(_sum1, r2[4], _k22, vl); in conv7x7s2_pack1ton_rvv()
[all …]
H A Dconvolution_7x7_pack1ton_fp16s.h231 _sum0 = vfmacc_vf_f16m1(_sum0, r2[2], _k22, vl); in conv7x7s2_pack1ton_fp16sa_rvv()
232 _sum1 = vfmacc_vf_f16m1(_sum1, r2[4], _k22, vl); in conv7x7s2_pack1ton_fp16sa_rvv()
233 _sum2 = vfmacc_vf_f16m1(_sum2, r2[6], _k22, vl); in conv7x7s2_pack1ton_fp16sa_rvv()
234 _sum3 = vfmacc_vf_f16m1(_sum3, r2[8], _k22, vl); in conv7x7s2_pack1ton_fp16sa_rvv()
235 _sum4 = vfmacc_vf_f16m1(_sum4, r2[10], _k22, vl); in conv7x7s2_pack1ton_fp16sa_rvv()
236 _sum5 = vfmacc_vf_f16m1(_sum5, r2[12], _k22, vl); in conv7x7s2_pack1ton_fp16sa_rvv()
237 _sum6 = vfmacc_vf_f16m1(_sum6, r2[14], _k22, vl); in conv7x7s2_pack1ton_fp16sa_rvv()
238 _sum7 = vfmacc_vf_f16m1(_sum7, r2[16], _k22, vl); in conv7x7s2_pack1ton_fp16sa_rvv()
662 _sum0 = vfmacc_vf_f16m1(_sum0, r2[2], _k22, vl); in conv7x7s2_pack1ton_fp16sa_rvv()
663 _sum1 = vfmacc_vf_f16m1(_sum1, r2[4], _k22, vl); in conv7x7s2_pack1ton_fp16sa_rvv()
[all …]
/dports/graphics/vapoursynth-waifu2x-ncnn-vulkan/vapoursynth-waifu2x-ncnn-vulkan-r4/deps/ncnn/src/layer/arm/
H A Dconvolutiondepthwise_3x3_pack8_int8.h49 int8x8_t _k22 = vld1_s8(k0 + 64); in convdw3x3s1_pack8_int8_neon() local
102 int16x8_t _s08 = vmull_s8(vget_low_s8(_r2223), _k22); in convdw3x3s1_pack8_int8_neon()
103 int16x8_t _s18 = vmull_s8(vget_high_s8(_r2223), _k22); in convdw3x3s1_pack8_int8_neon()
104 int16x8_t _s28 = vmull_s8(vget_low_s8(_r3233), _k22); in convdw3x3s1_pack8_int8_neon()
187 int16x8_t _s08 = vmull_s8(_r22, _k22); in convdw3x3s1_pack8_int8_neon()
188 int16x8_t _s18 = vmull_s8(_r32, _k22); in convdw3x3s1_pack8_int8_neon()
306 int16x8_t _s4 = vmull_s8(_r22, _k22); in convdw3x3s1_pack8_int8_neon()
367 int8x8_t _k22 = vld1_s8(k0 + 64); in convdw3x3s2_pack8_int8_neon() local
407 int16x8_t _s08 = vmull_s8(_r22, _k22); in convdw3x3s2_pack8_int8_neon()
408 int16x8_t _s18 = vmull_s8(_r24, _k22); in convdw3x3s2_pack8_int8_neon()
[all …]
H A Dconvolutiondepthwise_5x5_pack4.h174 float32x4_t _k22 = vld1q_f32(k0 + 8); in convdw5x5s1_pack4_neon() local
202 _sum00 = vmlaq_f32(_sum00, _k22, _r22); in convdw5x5s1_pack4_neon()
207 _sum01 = vmlaq_f32(_sum01, _k22, _r23); in convdw5x5s1_pack4_neon()
212 _sum02 = vmlaq_f32(_sum02, _k22, _r24); in convdw5x5s1_pack4_neon()
217 _sum03 = vmlaq_f32(_sum03, _k22, _r25); in convdw5x5s1_pack4_neon()
239 _sum10 = vmlaq_f32(_sum10, _k22, _r32); in convdw5x5s1_pack4_neon()
244 _sum11 = vmlaq_f32(_sum11, _k22, _r33); in convdw5x5s1_pack4_neon()
462 float32x4_t _k22 = vld1q_f32(k0 + 8); in convdw5x5s1_pack4_neon() local
650 float32x4_t _k22 = vld1q_f32(k0 + 8); in convdw5x5s1_pack4_neon() local
663 _sum0 = vmlaq_f32(_sum0, _k22, _r22); in convdw5x5s1_pack4_neon()
[all …]
/dports/graphics/waifu2x-ncnn-vulkan/waifu2x-ncnn-vulkan-20210521/src/ncnn/src/layer/arm/
H A Dconvolutiondepthwise_3x3_pack8_int8.h49 int8x8_t _k22 = vld1_s8(k0 + 64); in convdw3x3s1_pack8_int8_neon() local
102 int16x8_t _s08 = vmull_s8(vget_low_s8(_r2223), _k22); in convdw3x3s1_pack8_int8_neon()
103 int16x8_t _s18 = vmull_s8(vget_high_s8(_r2223), _k22); in convdw3x3s1_pack8_int8_neon()
104 int16x8_t _s28 = vmull_s8(vget_low_s8(_r3233), _k22); in convdw3x3s1_pack8_int8_neon()
186 int16x8_t _s08 = vmull_s8(_r22, _k22); in convdw3x3s1_pack8_int8_neon()
187 int16x8_t _s18 = vmull_s8(_r32, _k22); in convdw3x3s1_pack8_int8_neon()
302 int16x8_t _s4 = vmull_s8(_r22, _k22); in convdw3x3s1_pack8_int8_neon()
363 int8x8_t _k22 = vld1_s8(k0 + 64); in convdw3x3s2_pack8_int8_neon() local
403 int16x8_t _s08 = vmull_s8(_r22, _k22); in convdw3x3s2_pack8_int8_neon()
404 int16x8_t _s18 = vmull_s8(_r24, _k22); in convdw3x3s2_pack8_int8_neon()
[all …]
H A Dconvolutiondepthwise_5x5_pack4.h174 float32x4_t _k22 = vld1q_f32(k0 + 8); in convdw5x5s1_pack4_neon() local
202 _sum00 = vmlaq_f32(_sum00, _k22, _r22); in convdw5x5s1_pack4_neon()
207 _sum01 = vmlaq_f32(_sum01, _k22, _r23); in convdw5x5s1_pack4_neon()
212 _sum02 = vmlaq_f32(_sum02, _k22, _r24); in convdw5x5s1_pack4_neon()
217 _sum03 = vmlaq_f32(_sum03, _k22, _r25); in convdw5x5s1_pack4_neon()
239 _sum10 = vmlaq_f32(_sum10, _k22, _r32); in convdw5x5s1_pack4_neon()
244 _sum11 = vmlaq_f32(_sum11, _k22, _r33); in convdw5x5s1_pack4_neon()
462 float32x4_t _k22 = vld1q_f32(k0 + 8); in convdw5x5s1_pack4_neon() local
650 float32x4_t _k22 = vld1q_f32(k0 + 8); in convdw5x5s1_pack4_neon() local
663 _sum0 = vmlaq_f32(_sum0, _k22, _r22); in convdw5x5s1_pack4_neon()
[all …]
/dports/benchmarks/vkpeak/vkpeak-20210430/ncnn/src/layer/arm/
H A Dconvolutiondepthwise_3x3_pack8_int8.h49 int8x8_t _k22 = vld1_s8(k0 + 64); in convdw3x3s1_pack8_int8_neon() local
102 int16x8_t _s08 = vmull_s8(vget_low_s8(_r2223), _k22); in convdw3x3s1_pack8_int8_neon()
103 int16x8_t _s18 = vmull_s8(vget_high_s8(_r2223), _k22); in convdw3x3s1_pack8_int8_neon()
104 int16x8_t _s28 = vmull_s8(vget_low_s8(_r3233), _k22); in convdw3x3s1_pack8_int8_neon()
186 int16x8_t _s08 = vmull_s8(_r22, _k22); in convdw3x3s1_pack8_int8_neon()
187 int16x8_t _s18 = vmull_s8(_r32, _k22); in convdw3x3s1_pack8_int8_neon()
302 int16x8_t _s4 = vmull_s8(_r22, _k22); in convdw3x3s1_pack8_int8_neon()
363 int8x8_t _k22 = vld1_s8(k0 + 64); in convdw3x3s2_pack8_int8_neon() local
403 int16x8_t _s08 = vmull_s8(_r22, _k22); in convdw3x3s2_pack8_int8_neon()
404 int16x8_t _s18 = vmull_s8(_r24, _k22); in convdw3x3s2_pack8_int8_neon()
[all …]
H A Dconvolutiondepthwise_5x5_pack4.h174 float32x4_t _k22 = vld1q_f32(k0 + 8); in convdw5x5s1_pack4_neon() local
202 _sum00 = vmlaq_f32(_sum00, _k22, _r22); in convdw5x5s1_pack4_neon()
207 _sum01 = vmlaq_f32(_sum01, _k22, _r23); in convdw5x5s1_pack4_neon()
212 _sum02 = vmlaq_f32(_sum02, _k22, _r24); in convdw5x5s1_pack4_neon()
217 _sum03 = vmlaq_f32(_sum03, _k22, _r25); in convdw5x5s1_pack4_neon()
239 _sum10 = vmlaq_f32(_sum10, _k22, _r32); in convdw5x5s1_pack4_neon()
244 _sum11 = vmlaq_f32(_sum11, _k22, _r33); in convdw5x5s1_pack4_neon()
462 float32x4_t _k22 = vld1q_f32(k0 + 8); in convdw5x5s1_pack4_neon() local
650 float32x4_t _k22 = vld1q_f32(k0 + 8); in convdw5x5s1_pack4_neon() local
663 _sum0 = vmlaq_f32(_sum0, _k22, _r22); in convdw5x5s1_pack4_neon()
[all …]
/dports/misc/ncnn/ncnn-20211208/src/layer/arm/
H A Dconvolutiondepthwise_3x3_pack8_int8.h49 int8x8_t _k22 = vld1_s8(k0 + 64); in convdw3x3s1_pack8_int8_neon() local
102 int16x8_t _s08 = vmull_s8(vget_low_s8(_r2223), _k22); in convdw3x3s1_pack8_int8_neon()
103 int16x8_t _s18 = vmull_s8(vget_high_s8(_r2223), _k22); in convdw3x3s1_pack8_int8_neon()
104 int16x8_t _s28 = vmull_s8(vget_low_s8(_r3233), _k22); in convdw3x3s1_pack8_int8_neon()
187 int16x8_t _s08 = vmull_s8(_r22, _k22); in convdw3x3s1_pack8_int8_neon()
188 int16x8_t _s18 = vmull_s8(_r32, _k22); in convdw3x3s1_pack8_int8_neon()
306 int16x8_t _s4 = vmull_s8(_r22, _k22); in convdw3x3s1_pack8_int8_neon()
367 int8x8_t _k22 = vld1_s8(k0 + 64); in convdw3x3s2_pack8_int8_neon() local
407 int16x8_t _s08 = vmull_s8(_r22, _k22); in convdw3x3s2_pack8_int8_neon()
408 int16x8_t _s18 = vmull_s8(_r24, _k22); in convdw3x3s2_pack8_int8_neon()
[all …]
H A Dconvolutiondepthwise_5x5_pack4.h174 float32x4_t _k22 = vld1q_f32(k0 + 8); in convdw5x5s1_pack4_neon() local
202 _sum00 = vmlaq_f32(_sum00, _k22, _r22); in convdw5x5s1_pack4_neon()
207 _sum01 = vmlaq_f32(_sum01, _k22, _r23); in convdw5x5s1_pack4_neon()
212 _sum02 = vmlaq_f32(_sum02, _k22, _r24); in convdw5x5s1_pack4_neon()
217 _sum03 = vmlaq_f32(_sum03, _k22, _r25); in convdw5x5s1_pack4_neon()
239 _sum10 = vmlaq_f32(_sum10, _k22, _r32); in convdw5x5s1_pack4_neon()
244 _sum11 = vmlaq_f32(_sum11, _k22, _r33); in convdw5x5s1_pack4_neon()
462 float32x4_t _k22 = vld1q_f32(k0 + 8); in convdw5x5s1_pack4_neon() local
650 float32x4_t _k22 = vld1q_f32(k0 + 8); in convdw5x5s1_pack4_neon() local
663 _sum0 = vmlaq_f32(_sum0, _k22, _r22); in convdw5x5s1_pack4_neon()
[all …]
/dports/graphics/realsr-ncnn-vulkan/realsr-ncnn-vulkan-20210210/src/ncnn/src/layer/arm/
H A Dconvolutiondepthwise_5x5_pack4.h174 float32x4_t _k22 = vld1q_f32(k0 + 8); in convdw5x5s1_pack4_neon() local
202 _sum00 = vmlaq_f32(_sum00, _k22, _r22); in convdw5x5s1_pack4_neon()
207 _sum01 = vmlaq_f32(_sum01, _k22, _r23); in convdw5x5s1_pack4_neon()
212 _sum02 = vmlaq_f32(_sum02, _k22, _r24); in convdw5x5s1_pack4_neon()
217 _sum03 = vmlaq_f32(_sum03, _k22, _r25); in convdw5x5s1_pack4_neon()
239 _sum10 = vmlaq_f32(_sum10, _k22, _r32); in convdw5x5s1_pack4_neon()
244 _sum11 = vmlaq_f32(_sum11, _k22, _r33); in convdw5x5s1_pack4_neon()
462 float32x4_t _k22 = vld1q_f32(k0 + 8); in convdw5x5s1_pack4_neon() local
650 float32x4_t _k22 = vld1q_f32(k0 + 8); in convdw5x5s1_pack4_neon() local
663 _sum0 = vmlaq_f32(_sum0, _k22, _r22); in convdw5x5s1_pack4_neon()
[all …]
/dports/graphics/vapoursynth-waifu2x-ncnn-vulkan/vapoursynth-waifu2x-ncnn-vulkan-r4/deps/ncnn/src/layer/x86/
H A Dconvolution_3x3_pack8to1.h50 __m256 _k22 = _mm256_loadu_ps(k0 + 64); in conv3x3s1_pack8to1_avx() local
84 _sum2 = _mm256_fmadd_ps(_k22, _r22, _sum2); in conv3x3s1_pack8to1_avx()
H A Dconvolutiondepthwise_5x5_pack8.h97 __m256 _k22 = _mm256_loadu_ps(k0 + 16); in convdw5x5s1_pack8_avx() local
104 _sum0 = _mm256_fmadd_ps(_k22, _r22, _sum0); in convdw5x5s1_pack8_avx()
251 __m256 _k22 = _mm256_loadu_ps(k0 + 16); in convdw5x5s2_pack8_avx() local
258 _sum0 = _mm256_fmadd_ps(_k22, _r22, _sum0); in convdw5x5s2_pack8_avx()
/dports/graphics/waifu2x-ncnn-vulkan/waifu2x-ncnn-vulkan-20210521/src/ncnn/src/layer/x86/
H A Dconvolution_3x3_pack8to1.h50 __m256 _k22 = _mm256_loadu_ps(k0 + 64); in conv3x3s1_pack8to1_avx() local
84 _sum2 = _mm256_fmadd_ps(_k22, _r22, _sum2); in conv3x3s1_pack8to1_avx()
H A Dconvolutiondepthwise_5x5_pack8.h97 __m256 _k22 = _mm256_loadu_ps(k0 + 16); in convdw5x5s1_pack8_avx() local
104 _sum0 = _mm256_fmadd_ps(_k22, _r22, _sum0); in convdw5x5s1_pack8_avx()
251 __m256 _k22 = _mm256_loadu_ps(k0 + 16); in convdw5x5s2_pack8_avx() local
258 _sum0 = _mm256_fmadd_ps(_k22, _r22, _sum0); in convdw5x5s2_pack8_avx()
/dports/benchmarks/vkpeak/vkpeak-20210430/ncnn/src/layer/x86/
H A Dconvolution_3x3_pack8to1.h50 __m256 _k22 = _mm256_loadu_ps(k0 + 64); in conv3x3s1_pack8to1_avx() local
84 _sum2 = _mm256_fmadd_ps(_k22, _r22, _sum2); in conv3x3s1_pack8to1_avx()
H A Dconvolutiondepthwise_5x5_pack8.h97 __m256 _k22 = _mm256_loadu_ps(k0 + 16); in convdw5x5s1_pack8_avx() local
104 _sum0 = _mm256_fmadd_ps(_k22, _r22, _sum0); in convdw5x5s1_pack8_avx()
251 __m256 _k22 = _mm256_loadu_ps(k0 + 16); in convdw5x5s2_pack8_avx() local
258 _sum0 = _mm256_fmadd_ps(_k22, _r22, _sum0); in convdw5x5s2_pack8_avx()
/dports/misc/ncnn/ncnn-20211208/src/layer/x86/
H A Dconvolution_3x3_pack8to1.h50 __m256 _k22 = _mm256_loadu_ps(k0 + 64); in conv3x3s1_pack8to1_avx() local
84 _sum2 = _mm256_comp_fmadd_ps(_k22, _r22, _sum2); in conv3x3s1_pack8to1_avx()
H A Dconvolutiondepthwise_5x5_pack8.h97 __m256 _k22 = _mm256_loadu_ps(k0 + 16); in convdw5x5s1_pack8_avx() local
104 _sum0 = _mm256_comp_fmadd_ps(_k22, _r22, _sum0); in convdw5x5s1_pack8_avx()
251 __m256 _k22 = _mm256_loadu_ps(k0 + 16); in convdw5x5s2_pack8_avx() local
258 _sum0 = _mm256_comp_fmadd_ps(_k22, _r22, _sum0); in convdw5x5s2_pack8_avx()
/dports/graphics/realsr-ncnn-vulkan/realsr-ncnn-vulkan-20210210/src/ncnn/src/layer/x86/
H A Dconvolution_3x3_pack8to1.h50 __m256 _k22 = _mm256_loadu_ps(k0 + 64); in conv3x3s1_pack8to1_avx() local
84 _sum2 = _mm256_fmadd_ps(_k22, _r22, _sum2); in conv3x3s1_pack8to1_avx()
H A Dconvolutiondepthwise_5x5_pack8.h97 __m256 _k22 = _mm256_loadu_ps(k0 + 16); in convdw5x5s1_pack8_avx() local
104 _sum0 = _mm256_fmadd_ps(_k22, _r22, _sum0); in convdw5x5s1_pack8_avx()
251 __m256 _k22 = _mm256_loadu_ps(k0 + 16); in convdw5x5s2_pack8_avx() local
258 _sum0 = _mm256_fmadd_ps(_k22, _r22, _sum0); in convdw5x5s2_pack8_avx()
/dports/misc/ncnn/ncnn-20211208/src/layer/mips/
H A Dconvolutiondepthwise_5x5_pack4.h123 v4f32 _k22 = (v4f32)__msa_ld_w(k0 + 4 * 2, 0); in convdw5x5s1_pack4_msa() local
130 _sum0 = __msa_fmadd_w(_sum0, _k22, _r22); in convdw5x5s1_pack4_msa()
142 _sum1 = __msa_fmadd_w(_sum1, _k22, _r32); in convdw5x5s1_pack4_msa()
281 v4f32 _k22 = (v4f32)__msa_ld_w(k0 + 4 * 2, 0); in convdw5x5s1_pack4_msa() local
288 _sum0 = __msa_fmadd_w(_sum0, _k22, _r22); in convdw5x5s1_pack4_msa()
444 v4f32 _k22 = (v4f32)__msa_ld_w(k0 + 4 * 2, 0); in convdw5x5s2_pack4_msa() local
451 _sum0 = __msa_fmadd_w(_sum0, _k22, _r22); in convdw5x5s2_pack4_msa()

1234