Home
last modified time | relevance | path

Searched refs:__msa_ld_w (Results 1 – 25 of 142) sorted by relevance

123456

/dports/misc/ncnn/ncnn-20211208/src/layer/mips/
H A Dconvolutiondepthwise_5x5_pack4.h65 v4f32 _r00 = (v4f32)__msa_ld_w(r0, 0); in convdw5x5s1_pack4_msa()
71 v4f32 _k00 = (v4f32)__msa_ld_w(k0, 0); in convdw5x5s1_pack4_msa()
84 v4f32 _r10 = (v4f32)__msa_ld_w(r1, 0); in convdw5x5s1_pack4_msa()
96 v4f32 _k10 = (v4f32)__msa_ld_w(k0, 0); in convdw5x5s1_pack4_msa()
109 v4f32 _r20 = (v4f32)__msa_ld_w(r2, 0); in convdw5x5s1_pack4_msa()
121 v4f32 _k20 = (v4f32)__msa_ld_w(k0, 0); in convdw5x5s1_pack4_msa()
134 v4f32 _r30 = (v4f32)__msa_ld_w(r3, 0); in convdw5x5s1_pack4_msa()
146 v4f32 _k30 = (v4f32)__msa_ld_w(k0, 0); in convdw5x5s1_pack4_msa()
159 v4f32 _r40 = (v4f32)__msa_ld_w(r4, 0); in convdw5x5s1_pack4_msa()
171 v4f32 _k40 = (v4f32)__msa_ld_w(k0, 0); in convdw5x5s1_pack4_msa()
[all …]
H A Dconvolutiondepthwise_3x3_pack4.h45 v4f32 _k00 = (v4f32)__msa_ld_w(k0, 0); in convdw3x3s1_pack4_msa()
46 v4f32 _k01 = (v4f32)__msa_ld_w(k0 + 4, 0); in convdw3x3s1_pack4_msa()
47 v4f32 _k02 = (v4f32)__msa_ld_w(k0 + 4 * 2, 0); in convdw3x3s1_pack4_msa()
48 v4f32 _k10 = (v4f32)__msa_ld_w(k0 + 4 * 3, 0); in convdw3x3s1_pack4_msa()
49 v4f32 _k11 = (v4f32)__msa_ld_w(k0 + 4 * 4, 0); in convdw3x3s1_pack4_msa()
50 v4f32 _k12 = (v4f32)__msa_ld_w(k0 + 4 * 5, 0); in convdw3x3s1_pack4_msa()
51 v4f32 _k20 = (v4f32)__msa_ld_w(k0 + 4 * 6, 0); in convdw3x3s1_pack4_msa()
52 v4f32 _k21 = (v4f32)__msa_ld_w(k0 + 4 * 7, 0); in convdw3x3s1_pack4_msa()
53 v4f32 _k22 = (v4f32)__msa_ld_w(k0 + 4 * 8, 0); in convdw3x3s1_pack4_msa()
347 v4f32 _k00 = (v4f32)__msa_ld_w(k0, 0); in convdw3x3s2_pack4_msa()
[all …]
H A Dconvolution_7x7_pack1to4.h74 v4i32 _r0 = __msa_ld_w(r0, 0); in conv7x7s2_pack1to4_msa()
131 v4i32 _r1 = __msa_ld_w(r1, 0); in conv7x7s2_pack1to4_msa()
188 v4i32 _r2 = __msa_ld_w(r2, 0); in conv7x7s2_pack1to4_msa()
245 v4i32 _r3 = __msa_ld_w(r3, 0); in conv7x7s2_pack1to4_msa()
302 v4i32 _r4 = __msa_ld_w(r4, 0); in conv7x7s2_pack1to4_msa()
359 v4i32 _r5 = __msa_ld_w(r5, 0); in conv7x7s2_pack1to4_msa()
416 v4i32 _r6 = __msa_ld_w(r6, 0); in conv7x7s2_pack1to4_msa()
492 v4i32 _r0 = __msa_ld_w(r0, 0); in conv7x7s2_pack1to4_msa()
513 v4i32 _r1 = __msa_ld_w(r1, 0); in conv7x7s2_pack1to4_msa()
534 v4i32 _r2 = __msa_ld_w(r2, 0); in conv7x7s2_pack1to4_msa()
[all …]
H A Dinterp_bicubic_pack4.h62 v4f32 _S30 = (v4f32)__msa_ld_w(S3p - 4, 0); in resize_bicubic_image_pack4()
63 v4f32 _S31 = (v4f32)__msa_ld_w(S3p + 0, 0); in resize_bicubic_image_pack4()
64 v4f32 _S32 = (v4f32)__msa_ld_w(S3p + 4, 0); in resize_bicubic_image_pack4()
65 v4f32 _S33 = (v4f32)__msa_ld_w(S3p + 8, 0); in resize_bicubic_image_pack4()
101 v4f32 _S20 = (v4f32)__msa_ld_w(S2p - 4, 0); in resize_bicubic_image_pack4()
102 v4f32 _S21 = (v4f32)__msa_ld_w(S2p + 0, 0); in resize_bicubic_image_pack4()
103 v4f32 _S22 = (v4f32)__msa_ld_w(S2p + 4, 0); in resize_bicubic_image_pack4()
267 v4f32 _rows0 = (v4f32)__msa_ld_w(rows0p, 0); in resize_bicubic_image_pack4()
268 v4f32 _rows1 = (v4f32)__msa_ld_w(rows1p, 0); in resize_bicubic_image_pack4()
269 v4f32 _rows2 = (v4f32)__msa_ld_w(rows2p, 0); in resize_bicubic_image_pack4()
[all …]
H A Dconvolution_3x3_pack1to4.h45 v4f32 _k00 = (v4f32)__msa_ld_w(k0, 0); in conv3x3s1_pack1to4_msa()
46 v4f32 _k01 = (v4f32)__msa_ld_w(k0 + 4, 0); in conv3x3s1_pack1to4_msa()
70 v4i32 _r0 = __msa_ld_w(r0, 0); in conv3x3s1_pack1to4_msa()
110 v4i32 _r1 = __msa_ld_w(r1, 0); in conv3x3s1_pack1to4_msa()
150 v4i32 _r2 = __msa_ld_w(r2, 0); in conv3x3s1_pack1to4_msa()
212 v4i32 _r0 = __msa_ld_w(r0, 0); in conv3x3s1_pack1to4_msa()
235 v4i32 _r1 = __msa_ld_w(r1, 0); in conv3x3s1_pack1to4_msa()
258 v4i32 _r2 = __msa_ld_w(r2, 0); in conv3x3s1_pack1to4_msa()
297 v4i32 _r0 = __msa_ld_w(r0, 0); in conv3x3s1_pack1to4_msa()
310 v4i32 _r1 = __msa_ld_w(r1, 0); in conv3x3s1_pack1to4_msa()
[all …]
H A Dconvolution_3x3_pack4.h333 v4f32 _r0 = (v4f32)__msa_ld_w(r0, 0); in conv3x3s1_winograd64_pack4_msa()
399 v4f32 _r0 = (v4f32)__msa_ld_w(r0, 0); in conv3x3s1_winograd64_pack4_msa()
449 v4f32 _r0 = (v4f32)__msa_ld_w(r0, 0); in conv3x3s1_winograd64_pack4_msa()
483 v4f32 _r0 = (v4f32)__msa_ld_w(r0, 0); in conv3x3s1_winograd64_pack4_msa()
506 v4f32 _val = (v4f32)__msa_ld_w(r0, 0); in conv3x3s1_winograd64_pack4_msa()
556 v4i32 _val0123 = __msa_ld_w(r0, 0); in conv3x3s1_winograd64_pack4_msa()
612 v4i32 _val0123 = __msa_ld_w(r0, 0); in conv3x3s1_winograd64_pack4_msa()
1147 v4f32 _r0 = (v4f32)__msa_ld_w(r0, 0); in conv3x3s1_winograd42_pack4_msa()
1213 v4f32 _r0 = (v4f32)__msa_ld_w(r0, 0); in conv3x3s1_winograd42_pack4_msa()
1263 v4f32 _r0 = (v4f32)__msa_ld_w(r0, 0); in conv3x3s1_winograd42_pack4_msa()
[all …]
H A Deltwise_mips.cpp62 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward()
63 v4f32 _p1 = (v4f32)__msa_ld_w(ptr1, 0); in forward()
207 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward()
208 v4f32 _p1 = (v4f32)__msa_ld_w(ptr1, 0); in forward()
260 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward()
261 v4f32 _p1 = (v4f32)__msa_ld_w(ptr1, 0); in forward()
294 v4f32 _p1 = (v4f32)__msa_ld_w(ptr, 0); in forward()
329 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward()
402 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward()
475 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward()
[all …]
H A Dpadding_pack4.h39 __msa_st_w(__msa_ld_w(ptr, 0), outptr, 0); in padding_constant_pack4_msa()
66 v4f32 _p = (v4f32)__msa_ld_w(ptr0, 0); in padding_replicate_pack4_msa()
74 _p = (v4f32)__msa_ld_w(ptr0, 0); in padding_replicate_pack4_msa()
88 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in padding_replicate_pack4_msa()
96 _p = (v4f32)__msa_ld_w(ptr, 0); in padding_replicate_pack4_msa()
112 v4f32 _p = (v4f32)__msa_ld_w(ptr0, 0); in padding_replicate_pack4_msa()
120 _p = (v4f32)__msa_ld_w(ptr0, 0); in padding_replicate_pack4_msa()
151 v4f32 _p = (v4f32)__msa_ld_w(ptr0, 0); in padding_reflect_pack4_msa()
175 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in padding_reflect_pack4_msa()
182 v4f32 _p = (v4f32)__msa_ld_w(ptr - 8 - x * 4, 0); in padding_reflect_pack4_msa()
[all …]
H A Dconvolution_sgemm_pack4.h57 v4f32 _r0 = (v4f32)__msa_ld_w(img0, 0); in im2col_sgemm_pack4_msa()
131 v4f32 _r0 = (v4f32)__msa_ld_w(img0, 0); in im2col_sgemm_pack4_msa()
189 v4f32 _r0 = (v4f32)__msa_ld_w(img0, 0); in im2col_sgemm_pack4_msa()
299 v4i32 _val0123 = __msa_ld_w(tmpptr, 0); in im2col_sgemm_pack4_msa()
302 v4f32 _w0 = (v4f32)__msa_ld_w(kptr0, 0); in im2col_sgemm_pack4_msa()
355 v4i32 _val0123 = __msa_ld_w(tmpptr, 0); in im2col_sgemm_pack4_msa()
357 v4f32 _w0 = (v4f32)__msa_ld_w(kptr0, 0); in im2col_sgemm_pack4_msa()
398 v4i32 _val0123 = __msa_ld_w(tmpptr, 0); in im2col_sgemm_pack4_msa()
399 v4f32 _w0 = (v4f32)__msa_ld_w(kptr0, 0); in im2col_sgemm_pack4_msa()
432 v4f32 _w0 = (v4f32)__msa_ld_w(kptr0, 0); in im2col_sgemm_pack4_msa()
[all …]
H A Dconvolution_sgemm_pack4to1.h54 v4f32 _r0 = (v4f32)__msa_ld_w(img0, 0); in im2col_sgemm_pack4to1_msa()
128 v4f32 _r0 = (v4f32)__msa_ld_w(img0, 0); in im2col_sgemm_pack4to1_msa()
258 v4i32 _bias = __msa_ld_w(biasptr, 0); in im2col_sgemm_pack4to1_msa()
279 v4i32 _w0123 = __msa_ld_w(kptr0, 0); in im2col_sgemm_pack4to1_msa()
322 v4i32 _bias = __msa_ld_w(biasptr, 0); in im2col_sgemm_pack4to1_msa()
338 v4i32 _w0123 = __msa_ld_w(kptr0, 0); in im2col_sgemm_pack4to1_msa()
373 v4i32 _bias = __msa_ld_w(biasptr, 0); in im2col_sgemm_pack4to1_msa()
384 v4i32 _w0123 = __msa_ld_w(kptr0, 0); in im2col_sgemm_pack4to1_msa()
411 v4f32 _sum = (v4f32)__msa_ld_w(biasptr, 0); in im2col_sgemm_pack4to1_msa()
418 v4f32 _w0 = (v4f32)__msa_ld_w(kptr0, 0); in im2col_sgemm_pack4to1_msa()
[all …]
H A Dbinaryop_mips.cpp73 v4f32 _b0 = (v4f32)__msa_ld_w(b0, 0); in binary_op_pack4()
77 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in binary_op_pack4()
130 v4f32 _a0 = (v4f32)__msa_ld_w(a0, 0); in binary_op_pack4()
323 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in binary_op_pack4()
468 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in binary_op_pack4()
469 v4f32 _p1 = (v4f32)__msa_ld_w(ptr1, 0); in binary_op_pack4()
512 v4f32 _b0 = (v4f32)__msa_ld_w(ptr1, 0); in binary_op_pack4()
649 v4f32 _a0 = (v4f32)__msa_ld_w(ptr, 0); in binary_op_pack4()
699 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in binary_op_pack4()
700 v4f32 _p1 = (v4f32)__msa_ld_w(ptr1, 0); in binary_op_pack4()
[all …]
H A Dinterp_bilinear_pack4.h55 v4f32 _S10 = (v4f32)__msa_ld_w(S1p, 0); in resize_bilinear_image_pack4()
56 v4f32 _S11 = (v4f32)__msa_ld_w(S1p + 4, 0); in resize_bilinear_image_pack4()
83 v4f32 _S00 = (v4f32)__msa_ld_w(S0p, 0); in resize_bilinear_image_pack4()
84 v4f32 _S01 = (v4f32)__msa_ld_w(S0p + 4, 0); in resize_bilinear_image_pack4()
85 v4f32 _S10 = (v4f32)__msa_ld_w(S1p, 0); in resize_bilinear_image_pack4()
86 v4f32 _S11 = (v4f32)__msa_ld_w(S1p + 4, 0); in resize_bilinear_image_pack4()
110 v4f32 _rows0 = (v4f32)__msa_ld_w(rows0p, 0); in resize_bilinear_image_pack4()
111 v4f32 _rows1 = (v4f32)__msa_ld_w(rows1p, 0); in resize_bilinear_image_pack4()
H A Dunaryop_mips.cpp52 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in unary_op_inplace_pack4()
89 return (v4f32)__msa_ld_w(tmp, 0); in operator ()()
109 return (v4f32)__msa_ld_w(tmp, 0); in operator ()()
169 return (v4f32)__msa_ld_w(tmp, 0); in operator ()()
184 return (v4f32)__msa_ld_w(tmp, 0); in operator ()()
199 return (v4f32)__msa_ld_w(tmp, 0); in operator ()()
214 return (v4f32)__msa_ld_w(tmp, 0); in operator ()()
229 return (v4f32)__msa_ld_w(tmp, 0); in operator ()()
244 return (v4f32)__msa_ld_w(tmp, 0); in operator ()()
H A Dprelu_mips.cpp55 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
56 v4f32 _slope = (v4f32)__msa_ld_w(slope + i * 4, 0); in forward_inplace()
72 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
90 …v4f32 _slope = num_slope > 1 ? (v4f32)__msa_ld_w((const float*)slope_data + i * 4, 0) : (v4f32)__m… in forward_inplace()
95 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
117 …v4f32 _slope = num_slope > 1 ? (v4f32)__msa_ld_w((const float*)slope_data + q * 4, 0) : (v4f32)__m… in forward_inplace()
122 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
189 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
232 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
H A Dsoftmax_mips.cpp77 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
78 v4f32 _max = (v4f32)__msa_ld_w(maxptr, 0); in forward_inplace()
118 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
119 v4f32 _sum = (v4f32)__msa_ld_w(sumptr, 0); in forward_inplace()
153 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
154 v4f32 _sum = (v4f32)__msa_ld_w(sumptr, 0); in forward_inplace()
H A Dconvolution1d_mips.cpp136 _sum = (v4f32)__msa_ld_w((const float*)bias_data + p * 4, 0); in forward()
152 v4f32 _w0 = (v4f32)__msa_ld_w(kptr, 0); in forward()
153 v4f32 _w1 = (v4f32)__msa_ld_w(kptr + 4, 0); in forward()
154 v4f32 _w2 = (v4f32)__msa_ld_w(kptr + 8, 0); in forward()
155 v4f32 _w3 = (v4f32)__msa_ld_w(kptr + 12, 0); in forward()
190 _sum = (v4f32)__msa_ld_w((const float*)bias_data + p * 4, 0); in forward()
202 v4f32 _w = (v4f32)__msa_ld_w(kptr, 0); in forward()
246 v4f32 _val = (v4f32)__msa_ld_w(sptr, 0); in forward()
247 v4f32 _w = (v4f32)__msa_ld_w(kptr, 0); in forward()
H A Dpacking_mips.cpp125 v4f32 _r0 = (v4f32)__msa_ld_w(r0, 0); in forward()
126 v4f32 _r1 = (v4f32)__msa_ld_w(r1, 0); in forward()
127 v4f32 _r2 = (v4f32)__msa_ld_w(r2, 0); in forward()
128 v4f32 _r3 = (v4f32)__msa_ld_w(r3, 0); in forward()
179 v4f32 _r0 = (v4f32)__msa_ld_w(r0, 0); in forward()
180 v4f32 _r1 = (v4f32)__msa_ld_w(r0 + 4, 0); in forward()
250 v4f32 _r0 = (v4f32)__msa_ld_w(r0, 0); in forward()
251 v4f32 _r1 = (v4f32)__msa_ld_w(r1, 0); in forward()
252 v4f32 _r2 = (v4f32)__msa_ld_w(r2, 0); in forward()
253 v4f32 _r3 = (v4f32)__msa_ld_w(r3, 0); in forward()
[all …]
H A Dconvolution_pack4.h60 _sum = (v4f32)__msa_ld_w(bias_data_ptr + p * 4, 0); in convolution_pack4_msa()
80 v4f32 _w0 = (v4f32)__msa_ld_w(kptr, 0); in convolution_pack4_msa()
81 v4f32 _w1 = (v4f32)__msa_ld_w(kptr + 4, 0); in convolution_pack4_msa()
82 v4f32 _w2 = (v4f32)__msa_ld_w(kptr + 8, 0); in convolution_pack4_msa()
83 v4f32 _w3 = (v4f32)__msa_ld_w(kptr + 12, 0); in convolution_pack4_msa()
H A Ddeconvolution_pack4.h46 _sum = (v4f32)__msa_ld_w((const float*)bias_data_ptr + p * 4, 0); in deconvolution_pack4_msa()
84 v4f32 _w0 = (v4f32)__msa_ld_w(kptr + k, 0); in deconvolution_pack4_msa()
85 v4f32 _w1 = (v4f32)__msa_ld_w(kptr + k + 4, 0); in deconvolution_pack4_msa()
86 v4f32 _w2 = (v4f32)__msa_ld_w(kptr + k + 8, 0); in deconvolution_pack4_msa()
87 v4f32 _w3 = (v4f32)__msa_ld_w(kptr + k + 12, 0); in deconvolution_pack4_msa()
H A Dpooling_mips.cpp86 v4f32 _max = (v4f32)__msa_ld_w(ptr, 0); in forward()
89 v4f32 _val = (v4f32)__msa_ld_w(ptr, 0); in forward()
108 v4f32 _val = (v4f32)__msa_ld_w(ptr, 0); in forward()
173 v4f32 _max = (v4f32)__msa_ld_w(sptr, 0); in forward()
177 v4f32 _val = (v4f32)__msa_ld_w(sptr + space_ofs[k] * 4, 0); in forward()
238 v4f32 _val = (v4f32)__msa_ld_w(m.row(sy) + sx * 4, 0); in forward()
272 v4f32 _val = (v4f32)__msa_ld_w(sptr + space_ofs[k] * 4, 0); in forward()
H A Dflatten_mips.cpp104 v4f32 _r0 = (v4f32)__msa_ld_w(ptr, 0); in forward()
105 v4f32 _r1 = (v4f32)__msa_ld_w(ptr + 4, 0); in forward()
106 v4f32 _r2 = (v4f32)__msa_ld_w(ptr + 4 * 2, 0); in forward()
107 v4f32 _r3 = (v4f32)__msa_ld_w(ptr + 4 * 3, 0); in forward()
161 v4f32 _r0 = (v4f32)__msa_ld_w(ptr, 0); in forward()
162 v4f32 _r1 = (v4f32)__msa_ld_w(ptr + 4, 0); in forward()
163 v4f32 _r2 = (v4f32)__msa_ld_w(ptr + 4 * 2, 0); in forward()
164 v4f32 _r3 = (v4f32)__msa_ld_w(ptr + 4 * 3, 0); in forward()
211 __msa_st_w(__msa_ld_w(ptr, 0), outptr, 0); in forward()
/dports/graphics/waifu2x-ncnn-vulkan/waifu2x-ncnn-vulkan-20210521/src/ncnn/src/layer/mips/
H A Dsoftmax_mips.cpp78 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
79 v4f32 _max = (v4f32)__msa_ld_w(maxptr, 0); in forward_inplace()
119 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
120 v4f32 _sum = (v4f32)__msa_ld_w(sumptr, 0); in forward_inplace()
154 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
155 v4f32 _sum = (v4f32)__msa_ld_w(sumptr, 0); in forward_inplace()
/dports/graphics/vapoursynth-waifu2x-ncnn-vulkan/vapoursynth-waifu2x-ncnn-vulkan-r4/deps/ncnn/src/layer/mips/
H A Dsoftmax_mips.cpp78 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
79 v4f32 _max = (v4f32)__msa_ld_w(maxptr, 0); in forward_inplace()
119 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
120 v4f32 _sum = (v4f32)__msa_ld_w(sumptr, 0); in forward_inplace()
154 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
155 v4f32 _sum = (v4f32)__msa_ld_w(sumptr, 0); in forward_inplace()
/dports/benchmarks/vkpeak/vkpeak-20210430/ncnn/src/layer/mips/
H A Dsoftmax_mips.cpp78 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
79 v4f32 _max = (v4f32)__msa_ld_w(maxptr, 0); in forward_inplace()
119 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
120 v4f32 _sum = (v4f32)__msa_ld_w(sumptr, 0); in forward_inplace()
154 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
155 v4f32 _sum = (v4f32)__msa_ld_w(sumptr, 0); in forward_inplace()
/dports/graphics/realsr-ncnn-vulkan/realsr-ncnn-vulkan-20210210/src/ncnn/src/layer/mips/
H A Dsoftmax_mips.cpp78 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
79 v4f32 _max = (v4f32)__msa_ld_w(maxptr, 0); in forward_inplace()
119 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
120 v4f32 _sum = (v4f32)__msa_ld_w(sumptr, 0); in forward_inplace()
154 v4f32 _p = (v4f32)__msa_ld_w(ptr, 0); in forward_inplace()
155 v4f32 _sum = (v4f32)__msa_ld_w(sumptr, 0); in forward_inplace()

123456