Home
last modified time | relevance | path

Searched refs:c12v (Results 1 – 6 of 6) sorted by relevance

/dports/misc/mnn/MNN-1.2.0/source/backend/cpu/x86_x64/avx/
H A DMNNMatrixAdd.cpp35 auto c12v = _mm256_loadu_ps(c12Y + unit*x); in _AVX_MNNStrassenMergeCFunction() local
36 c12v = _mm256_add_ps(c12v, xv); in _AVX_MNNStrassenMergeCFunction()
37 c21v = _mm256_add_ps(c12v, c21v); in _AVX_MNNStrassenMergeCFunction()
38 c12v = _mm256_add_ps(c22v, c12v); in _AVX_MNNStrassenMergeCFunction()
40 c12v = _mm256_add_ps(c11v, c12v); in _AVX_MNNStrassenMergeCFunction()
41 _mm256_storeu_ps(c12Y + unit*x, c12v); in _AVX_MNNStrassenMergeCFunction()
/dports/misc/mnn/MNN-1.2.0/source/backend/cpu/compute/
H A DConvOpt.cpp298 auto c12v = Vec4::load(c12Y + 4*x); in MNNStrassenMergeCFunction() local
299 c12v = c12v + xv; in MNNStrassenMergeCFunction()
300 c21v = c12v + c21v; in MNNStrassenMergeCFunction()
301 c12v = c22v + c12v; in MNNStrassenMergeCFunction()
303 c12v = c11v + c12v; in MNNStrassenMergeCFunction()
304 Vec4::save(c12Y + 4*x, c12v); in MNNStrassenMergeCFunction()
/dports/misc/mnn/MNN-1.2.0/source/backend/cpu/x86_x64/avx512/
H A DCommonOptFunction.cpp54 auto c12v = _mm256_loadu_ps(c12Y + 8*x); in _AVX512_MNNStrassenMergeCFunction() local
55 c12v = _mm256_add_ps(c12v, xv); in _AVX512_MNNStrassenMergeCFunction()
56 c21v = _mm256_add_ps(c12v, c21v); in _AVX512_MNNStrassenMergeCFunction()
57 c12v = _mm256_add_ps(c22v, c12v); in _AVX512_MNNStrassenMergeCFunction()
59 c12v = _mm256_add_ps(c11v, c12v); in _AVX512_MNNStrassenMergeCFunction()
60 _mm256_storeu_ps(c12Y + 8*x, c12v); in _AVX512_MNNStrassenMergeCFunction()
61 _mm256_storeu_ps(c12Y + 8*x, c12v); in _AVX512_MNNStrassenMergeCFunction()
/dports/misc/mnn/MNN-1.2.0/source/backend/arm82/
H A DArm82Functions.cpp254 auto c12v = vld1q_f16(c12Y + x * pack); in ARM82StrassenMerge() local
255 c12v = c12v + xv; in ARM82StrassenMerge()
256 c21v = c12v + c21v; in ARM82StrassenMerge()
257 c12v = c22v + c12v; in ARM82StrassenMerge()
259 c12v = c11v + c12v; in ARM82StrassenMerge()
260 vst1q_f16(c12Y + x * pack, c12v); in ARM82StrassenMerge()
/dports/misc/mnn/MNN-1.2.0/source/backend/cpu/bf16/
H A DBF16Functions.cpp520 auto c12v = BFVec4::load(c12Y + 4*x); in _MNNStrassenMergeCFunction() local
521 c12v = c12v + xv; in _MNNStrassenMergeCFunction()
522 c21v = c12v + c21v; in _MNNStrassenMergeCFunction()
523 c12v = c22v + c12v; in _MNNStrassenMergeCFunction()
525 c12v = c11v + c12v; in _MNNStrassenMergeCFunction()
526 BFVec4::save(c12Y + 4*x, c12v); in _MNNStrassenMergeCFunction()
/dports/science/libint2/libint-2.7.1/include/libint2/
H A Dboys.h1165 libint2::simd::VectorAVXDouble c00v, c01v, c02v, c03v, c10v, c11v, c12v, c13v, in interpolate_Gm() local
1178 c12v.load_aligned((c_tuint+8) +ORDERp1); c13v.load_aligned((c_tuint+12) +ORDERp1); in interpolate_Gm()
1180 …libint2::simd::VectorAVXDouble t1 = t1vec * (c10v * u0vec + c11v * u1vec + c12v * u2vec + c13v * u… in interpolate_Gm()