/dports/graphics/vapoursynth-waifu2x-ncnn-vulkan/vapoursynth-waifu2x-ncnn-vulkan-r4/deps/ncnn/src/layer/x86/ |
H A D | dequantize_x86.cpp | 69 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 90 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + i * 8); in forward() local 115 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 290 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 311 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward() local 336 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 359 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward() local 539 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 585 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 856 __m128 _bias = _mm_set1_ps(bias); in forward() local [all …]
|
H A D | scale_x86.cpp | 60 __m256 _bias = _mm256_loadu_ps(bias + i * 8); in forward_inplace() local 92 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + i * 8); in forward_inplace() local 138 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + q * 8); in forward_inplace() local 191 __m128 _bias = _mm_loadu_ps(bias + i * 4); in forward_inplace() local 223 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward_inplace() local 269 __m128 _bias = _mm_loadu_ps((const float*)bias_data + q * 4); in forward_inplace() local 334 __m256 _bias = _mm256_set1_ps(bias); in forward_inplace() local
|
H A D | convolution_7x7.h | 15 …x7s1_sse(const Mat& bottom_blob, Mat& top_blob, const Mat& _kernel, const Mat& _bias, const Option… in conv7x7s1_sse() 26 …x7s2_sse(const Mat& bottom_blob, Mat& top_blob, const Mat& _kernel, const Mat& _bias, const Option… in conv7x7s2_sse()
|
H A D | requantize_x86.cpp | 92 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 131 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + i * 8); in forward() local 194 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 302 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 407 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 725 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 752 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward() local 791 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 820 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward() local 859 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local [all …]
|
/dports/graphics/waifu2x-ncnn-vulkan/waifu2x-ncnn-vulkan-20210521/src/ncnn/src/layer/x86/ |
H A D | dequantize_x86.cpp | 69 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 90 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + i * 8); in forward() local 115 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 290 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 311 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward() local 336 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 359 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward() local 539 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 585 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 856 __m128 _bias = _mm_set1_ps(bias); in forward() local [all …]
|
H A D | scale_x86.cpp | 60 __m256 _bias = _mm256_loadu_ps(bias + i * 8); in forward_inplace() local 92 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + i * 8); in forward_inplace() local 138 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + q * 8); in forward_inplace() local 191 __m128 _bias = _mm_loadu_ps(bias + i * 4); in forward_inplace() local 223 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward_inplace() local 269 __m128 _bias = _mm_loadu_ps((const float*)bias_data + q * 4); in forward_inplace() local 334 __m256 _bias = _mm256_set1_ps(bias); in forward_inplace() local
|
H A D | convolution_7x7.h | 15 …x7s1_sse(const Mat& bottom_blob, Mat& top_blob, const Mat& _kernel, const Mat& _bias, const Option… in conv7x7s1_sse() 26 …x7s2_sse(const Mat& bottom_blob, Mat& top_blob, const Mat& _kernel, const Mat& _bias, const Option… in conv7x7s2_sse()
|
H A D | requantize_x86.cpp | 92 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 131 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + i * 8); in forward() local 194 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 302 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 407 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 725 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 752 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward() local 791 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 820 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward() local 859 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local [all …]
|
/dports/benchmarks/vkpeak/vkpeak-20210430/ncnn/src/layer/x86/ |
H A D | dequantize_x86.cpp | 69 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 90 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + i * 8); in forward() local 115 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 290 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 311 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward() local 336 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 359 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward() local 539 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 585 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 856 __m128 _bias = _mm_set1_ps(bias); in forward() local [all …]
|
H A D | scale_x86.cpp | 60 __m256 _bias = _mm256_loadu_ps(bias + i * 8); in forward_inplace() local 92 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + i * 8); in forward_inplace() local 138 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + q * 8); in forward_inplace() local 191 __m128 _bias = _mm_loadu_ps(bias + i * 4); in forward_inplace() local 223 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward_inplace() local 269 __m128 _bias = _mm_loadu_ps((const float*)bias_data + q * 4); in forward_inplace() local 334 __m256 _bias = _mm256_set1_ps(bias); in forward_inplace() local
|
H A D | convolution_7x7.h | 15 …x7s1_sse(const Mat& bottom_blob, Mat& top_blob, const Mat& _kernel, const Mat& _bias, const Option… in conv7x7s1_sse() 26 …x7s2_sse(const Mat& bottom_blob, Mat& top_blob, const Mat& _kernel, const Mat& _bias, const Option… in conv7x7s2_sse()
|
H A D | requantize_x86.cpp | 92 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 131 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + i * 8); in forward() local 194 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 302 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 407 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 725 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 752 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward() local 791 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 820 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward() local 859 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local [all …]
|
/dports/misc/ncnn/ncnn-20211208/src/layer/x86/ |
H A D | dequantize_x86.cpp | 71 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 92 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + i * 8); in forward() local 117 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 292 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 313 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward() local 338 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 361 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward() local 541 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 587 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 858 __m128 _bias = _mm_set1_ps(bias); in forward() local [all …]
|
H A D | scale_x86.cpp | 60 __m256 _bias = _mm256_loadu_ps(bias + i * 8); in forward_inplace() local 92 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + i * 8); in forward_inplace() local 138 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + q * 8); in forward_inplace() local 191 __m128 _bias = _mm_loadu_ps(bias + i * 4); in forward_inplace() local 223 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward_inplace() local 269 __m128 _bias = _mm_loadu_ps((const float*)bias_data + q * 4); in forward_inplace() local 334 __m256 _bias = _mm256_set1_ps(bias); in forward_inplace() local
|
H A D | convolution_7x7.h | 15 …x7s1_sse(const Mat& bottom_blob, Mat& top_blob, const Mat& _kernel, const Mat& _bias, const Option… in conv7x7s1_sse() 26 …x7s2_sse(const Mat& bottom_blob, Mat& top_blob, const Mat& _kernel, const Mat& _bias, const Option… in conv7x7s2_sse()
|
H A D | requantize_x86.cpp | 92 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 131 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + i * 8); in forward() local 194 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 302 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 407 __m256 _bias = _mm256_set1_ps(bias_data[0]); in forward() local 725 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 752 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward() local 791 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local 820 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward() local 859 __m128 _bias = _mm_set1_ps(bias_data[0]); in forward() local [all …]
|
/dports/graphics/vapoursynth-waifu2x-ncnn-vulkan/vapoursynth-waifu2x-ncnn-vulkan-r4/deps/ncnn/src/layer/arm/ |
H A D | dequantize_arm.cpp | 87 float32x4_t _bias = vdupq_n_f32(bias_data[0]); in forward() local 141 float32x4_t _bias = vdupq_n_f32(bias_data[0]); in forward() local 408 float32x4_t _bias = vdupq_n_f32(bias_data[0]); in forward() local 780 float32x4_t _bias = vdupq_n_f32(bias); in forward() local 869 float32x4_t _bias = vdupq_n_f32(bias); in forward() local 1509 float32x4_t _bias = vdupq_n_f32(bias); in forward_fp16s() local 1578 float32x4_t _bias = vdupq_n_f32(bias); in forward_fp16s() local 2197 float32x4_t _bias = vdupq_n_f32(bias); in forward_fp16sa() local 2266 float32x4_t _bias = vdupq_n_f32(bias); in forward_fp16sa() local 2939 float32x4_t _bias = vdupq_n_f32(bias); in forward_bf16s() local [all …]
|
H A D | scale_arm.cpp | 56 float32x4_t _bias = vld1q_f32(bias + i * 4); in forward_inplace() local 88 float32x4_t _bias = vld1q_f32((const float*)bias_data + i * 4); in forward_inplace() local 134 float32x4_t _bias = vld1q_f32((const float*)bias_data + q * 4); in forward_inplace() local 199 float32x4_t _bias = vdupq_n_f32(bias); in forward_inplace() local
|
/dports/graphics/waifu2x-ncnn-vulkan/waifu2x-ncnn-vulkan-20210521/src/ncnn/src/layer/arm/ |
H A D | dequantize_arm.cpp | 87 float32x4_t _bias = vdupq_n_f32(bias_data[0]); in forward() local 141 float32x4_t _bias = vdupq_n_f32(bias_data[0]); in forward() local 408 float32x4_t _bias = vdupq_n_f32(bias_data[0]); in forward() local 780 float32x4_t _bias = vdupq_n_f32(bias); in forward() local 869 float32x4_t _bias = vdupq_n_f32(bias); in forward() local 1509 float32x4_t _bias = vdupq_n_f32(bias); in forward_fp16s() local 1578 float32x4_t _bias = vdupq_n_f32(bias); in forward_fp16s() local 2197 float32x4_t _bias = vdupq_n_f32(bias); in forward_fp16sa() local 2266 float32x4_t _bias = vdupq_n_f32(bias); in forward_fp16sa() local 2939 float32x4_t _bias = vdupq_n_f32(bias); in forward_bf16s() local [all …]
|
H A D | scale_arm.cpp | 56 float32x4_t _bias = vld1q_f32(bias + i * 4); in forward_inplace() local 88 float32x4_t _bias = vld1q_f32((const float*)bias_data + i * 4); in forward_inplace() local 134 float32x4_t _bias = vld1q_f32((const float*)bias_data + q * 4); in forward_inplace() local 199 float32x4_t _bias = vdupq_n_f32(bias); in forward_inplace() local
|
/dports/benchmarks/vkpeak/vkpeak-20210430/ncnn/src/layer/arm/ |
H A D | dequantize_arm.cpp | 87 float32x4_t _bias = vdupq_n_f32(bias_data[0]); in forward() local 141 float32x4_t _bias = vdupq_n_f32(bias_data[0]); in forward() local 408 float32x4_t _bias = vdupq_n_f32(bias_data[0]); in forward() local 780 float32x4_t _bias = vdupq_n_f32(bias); in forward() local 869 float32x4_t _bias = vdupq_n_f32(bias); in forward() local 1509 float32x4_t _bias = vdupq_n_f32(bias); in forward_fp16s() local 1578 float32x4_t _bias = vdupq_n_f32(bias); in forward_fp16s() local 2197 float32x4_t _bias = vdupq_n_f32(bias); in forward_fp16sa() local 2266 float32x4_t _bias = vdupq_n_f32(bias); in forward_fp16sa() local 2939 float32x4_t _bias = vdupq_n_f32(bias); in forward_bf16s() local [all …]
|
H A D | scale_arm.cpp | 56 float32x4_t _bias = vld1q_f32(bias + i * 4); in forward_inplace() local 88 float32x4_t _bias = vld1q_f32((const float*)bias_data + i * 4); in forward_inplace() local 134 float32x4_t _bias = vld1q_f32((const float*)bias_data + q * 4); in forward_inplace() local 199 float32x4_t _bias = vdupq_n_f32(bias); in forward_inplace() local
|
/dports/misc/ncnn/ncnn-20211208/src/layer/arm/ |
H A D | dequantize_arm.cpp | 91 float32x4_t _bias = vdupq_n_f32(bias_data[0]); in forward() local 145 float32x4_t _bias = vdupq_n_f32(bias_data[0]); in forward() local 412 float32x4_t _bias = vdupq_n_f32(bias_data[0]); in forward() local 784 float32x4_t _bias = vdupq_n_f32(bias); in forward() local 873 float32x4_t _bias = vdupq_n_f32(bias); in forward() local 1513 float32x4_t _bias = vdupq_n_f32(bias); in forward_fp16s() local 1582 float32x4_t _bias = vdupq_n_f32(bias); in forward_fp16s() local 2201 float32x4_t _bias = vdupq_n_f32(bias); in forward_fp16sa() local 2270 float32x4_t _bias = vdupq_n_f32(bias); in forward_fp16sa() local 2944 float32x4_t _bias = vdupq_n_f32(bias); in forward_bf16s() local [all …]
|
/dports/graphics/realsr-ncnn-vulkan/realsr-ncnn-vulkan-20210210/src/ncnn/src/layer/x86/ |
H A D | scale_x86.cpp | 60 __m256 _bias = _mm256_loadu_ps(bias + i * 8); in forward_inplace() local 92 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + i * 8); in forward_inplace() local 138 __m256 _bias = _mm256_loadu_ps((const float*)bias_data + q * 8); in forward_inplace() local 191 __m128 _bias = _mm_loadu_ps(bias + i * 4); in forward_inplace() local 223 __m128 _bias = _mm_loadu_ps((const float*)bias_data + i * 4); in forward_inplace() local 269 __m128 _bias = _mm_loadu_ps((const float*)bias_data + q * 4); in forward_inplace() local 334 __m256 _bias = _mm256_set1_ps(bias); in forward_inplace() local
|
H A D | convolution_7x7.h | 15 …x7s1_sse(const Mat& bottom_blob, Mat& top_blob, const Mat& _kernel, const Mat& _bias, const Option… in conv7x7s1_sse() 26 …x7s2_sse(const Mat& bottom_blob, Mat& top_blob, const Mat& _kernel, const Mat& _bias, const Option… in conv7x7s2_sse()
|