/dports/audio/aften/aften-0.0.8/libaften/x86/ |
H A D | x86_sse_mdct_common.c | 107 XMM4 = _mm_add_ps(XMM4, XMM1); in mdct_butterfly_16() 189 XMM4 = _mm_shuffle_ps(XMM4, XMM4, _MM_SHUFFLE(2,2,0,0)); in mdct_butterfly_32() 235 XMM4 = _mm_add_ps(XMM4, XMM2); in mdct_butterfly_first() 363 XMM4 = _mm_add_ps(XMM4, XMM1); in mdct_butterfly_generic() 526 XMM4 = _mm_shuffle_ps(XMM4, XMM4, _MM_SHUFFLE(0,1,2,3)); in mdct() 528 XMM4 = _mm_add_ps(XMM4, XMM5); in mdct() 533 XMM4 = _mm_shuffle_ps(XMM4, XMM4, _MM_SHUFFLE(0,0,3,3)); in mdct() 537 XMM4 = _mm_mul_ps(XMM4, XMM6); in mdct() 540 XMM4 = _mm_sub_ps(XMM4, XMM5); in mdct() 571 XMM4 = _mm_shuffle_ps(XMM4, XMM4, _MM_SHUFFLE(0,0,3,3)); in mdct() [all …]
|
H A D | x86_sse_mdct_common_init.c | 231 XMM4 = _mm_shuffle_ps(XMM4, XMM5, _MM_SHUFFLE(1,0,1,0)); in sse_mdct_ctx_init() 233 XMM4 = _mm_xor_ps(XMM4, PCS_RNRN.v); in sse_mdct_ctx_init() 239 XMM4 = _mm_xor_ps(XMM4, PCS_RRRR.v); in sse_mdct_ctx_init() 268 XMM4 = _mm_shuffle_ps(XMM4, XMM5, _MM_SHUFFLE(1,0,1,0)); in sse_mdct_ctx_init() 270 XMM4 = _mm_xor_ps(XMM4, PCS_RNRN.v); in sse_mdct_ctx_init() 297 XMM4 = _mm_shuffle_ps(XMM4, XMM5, _MM_SHUFFLE(1,0,1,0)); in sse_mdct_ctx_init() 299 XMM4 = _mm_xor_ps(XMM4, PCS_RNRN.v); in sse_mdct_ctx_init() 330 XMM4 = _mm_shuffle_ps(XMM4, XMM5, _MM_SHUFFLE(1,0,1,0)); in sse_mdct_ctx_init() 332 XMM4 = _mm_xor_ps(XMM4, PCS_RNRN.v); in sse_mdct_ctx_init() 364 XMM4 = _mm_shuffle_ps(XMM4, XMM5, _MM_SHUFFLE(1,0,1,0)); in sse_mdct_ctx_init() [all …]
|
/dports/science/PETSc/petsc-3.14.1/src/mat/impls/baij/seq/ |
H A D | dgefa4.c | 187 SSE_COPY_PS(XMM4,XMM0) in PetscKernel_A_gets_inverse_A_4_SSE() 194 SSE_COPY_PS(XMM7,XMM4) in PetscKernel_A_gets_inverse_A_4_SSE() 220 SSE_MULT_PS(XMM0,XMM4) in PetscKernel_A_gets_inverse_A_4_SSE() 251 SSE_SHUFFLE(XMM4,XMM4,0x4E) in PetscKernel_A_gets_inverse_A_4_SSE() 326 SSE_SHUFFLE(XMM4,XMM4,0xB1) in PetscKernel_A_gets_inverse_A_4_SSE() 337 SSE_SHUFFLE(XMM4,XMM4,0x4E) in PetscKernel_A_gets_inverse_A_4_SSE() 352 SSE_ADD_PS(XMM4,XMM3) in PetscKernel_A_gets_inverse_A_4_SSE() 356 SSE_ADD_SS(XMM6,XMM4) in PetscKernel_A_gets_inverse_A_4_SSE() 361 SSE_ADD_SS(XMM4,XMM3) in PetscKernel_A_gets_inverse_A_4_SSE() 364 SSE_SUB_SS(XMM4,XMM6) in PetscKernel_A_gets_inverse_A_4_SSE() [all …]
|
H A D | baijfact11.c | 682 SSE_OR_PS(XMM5,XMM4) in MatLUFactorNumeric_SeqBAIJ_4_NaturalOrdering_SSE() 704 SSE_SHUFFLE(XMM4,XMM4,0x00) in MatLUFactorNumeric_SeqBAIJ_4_NaturalOrdering_SSE() 864 SSE_SHUFFLE(XMM4,XMM4,0x00) in MatLUFactorNumeric_SeqBAIJ_4_NaturalOrdering_SSE() 889 SSE_SHUFFLE(XMM4,XMM4,0x00) in MatLUFactorNumeric_SeqBAIJ_4_NaturalOrdering_SSE() 1126 SSE_OR_PS(XMM5,XMM4) in MatLUFactorNumeric_SeqBAIJ_4_NaturalOrdering_SSE_usj_Inplace() 1148 SSE_SHUFFLE(XMM4,XMM4,0x00) in MatLUFactorNumeric_SeqBAIJ_4_NaturalOrdering_SSE_usj_Inplace() 1308 SSE_SHUFFLE(XMM4,XMM4,0x00) in MatLUFactorNumeric_SeqBAIJ_4_NaturalOrdering_SSE_usj_Inplace() 1333 SSE_SHUFFLE(XMM4,XMM4,0x00) in MatLUFactorNumeric_SeqBAIJ_4_NaturalOrdering_SSE_usj_Inplace() 1593 SSE_SHUFFLE(XMM4,XMM4,0x00) in MatLUFactorNumeric_SeqBAIJ_4_NaturalOrdering_SSE_usj() 1753 SSE_SHUFFLE(XMM4,XMM4,0x00) in MatLUFactorNumeric_SeqBAIJ_4_NaturalOrdering_SSE_usj() [all …]
|
/dports/graphics/libosmesa-gallium/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_xform3.S | 87 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox | ox */ 97 ADDPS ( XMM5, XMM4 ) 98 ADDPS ( XMM6, XMM4 ) 99 ADDPS ( XMM3, XMM4 ) 101 MOVAPS ( XMM4, REGOFF(0, EDI) ) 353 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* oy | oy */ 356 ADDPS ( XMM4, XMM3 ) 478 MOVSS( S(0), XMM4 ) 479 SHUFPS( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox */ 495 UNPCKHPS( XMM4, XMM4 ) [all …]
|
H A D | sse_normal.S | 143 MOVSS ( ARG_SCALE, XMM4 ) /* scale */ 144 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* scale | scale */ 146 MULPS ( XMM4, XMM0 ) /* m4*scale | m0*scale */ 150 MULPS ( XMM4, XMM1 ) /* m5*scale | m1*scale */ 166 MOVSS ( S(1), XMM4 ) /* uy */ 167 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* uy | uy */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 173 ADDPS ( XMM4, XMM3 ) 180 MOVSS ( S(1), XMM4 ) /* uy */ 181 MULSS ( XMM7, XMM4 ) /* uy*m9*scale */ [all …]
|
/dports/lang/clover/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_xform3.S | 87 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox | ox */ 97 ADDPS ( XMM5, XMM4 ) 98 ADDPS ( XMM6, XMM4 ) 99 ADDPS ( XMM3, XMM4 ) 101 MOVAPS ( XMM4, REGOFF(0, EDI) ) 353 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* oy | oy */ 356 ADDPS ( XMM4, XMM3 ) 478 MOVSS( S(0), XMM4 ) 479 SHUFPS( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox */ 495 UNPCKHPS( XMM4, XMM4 ) [all …]
|
H A D | sse_normal.S | 143 MOVSS ( ARG_SCALE, XMM4 ) /* scale */ 144 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* scale | scale */ 146 MULPS ( XMM4, XMM0 ) /* m4*scale | m0*scale */ 150 MULPS ( XMM4, XMM1 ) /* m5*scale | m1*scale */ 166 MOVSS ( S(1), XMM4 ) /* uy */ 167 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* uy | uy */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 173 ADDPS ( XMM4, XMM3 ) 180 MOVSS ( S(1), XMM4 ) /* uy */ 181 MULSS ( XMM7, XMM4 ) /* uy*m9*scale */ [all …]
|
/dports/graphics/libosmesa/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_xform3.S | 87 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox | ox */ 97 ADDPS ( XMM5, XMM4 ) 98 ADDPS ( XMM6, XMM4 ) 99 ADDPS ( XMM3, XMM4 ) 101 MOVAPS ( XMM4, REGOFF(0, EDI) ) 353 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* oy | oy */ 356 ADDPS ( XMM4, XMM3 ) 478 MOVSS( S(0), XMM4 ) 479 SHUFPS( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox */ 495 UNPCKHPS( XMM4, XMM4 ) [all …]
|
H A D | sse_normal.S | 143 MOVSS ( ARG_SCALE, XMM4 ) /* scale */ 144 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* scale | scale */ 146 MULPS ( XMM4, XMM0 ) /* m4*scale | m0*scale */ 150 MULPS ( XMM4, XMM1 ) /* m5*scale | m1*scale */ 166 MOVSS ( S(1), XMM4 ) /* uy */ 167 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* uy | uy */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 173 ADDPS ( XMM4, XMM3 ) 180 MOVSS ( S(1), XMM4 ) /* uy */ 181 MULSS ( XMM7, XMM4 ) /* uy*m9*scale */ [all …]
|
/dports/graphics/mesa-libs/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_xform3.S | 87 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox | ox */ 97 ADDPS ( XMM5, XMM4 ) 98 ADDPS ( XMM6, XMM4 ) 99 ADDPS ( XMM3, XMM4 ) 101 MOVAPS ( XMM4, REGOFF(0, EDI) ) 353 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* oy | oy */ 356 ADDPS ( XMM4, XMM3 ) 478 MOVSS( S(0), XMM4 ) 479 SHUFPS( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox */ 495 UNPCKHPS( XMM4, XMM4 ) [all …]
|
H A D | sse_normal.S | 143 MOVSS ( ARG_SCALE, XMM4 ) /* scale */ 144 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* scale | scale */ 146 MULPS ( XMM4, XMM0 ) /* m4*scale | m0*scale */ 150 MULPS ( XMM4, XMM1 ) /* m5*scale | m1*scale */ 166 MOVSS ( S(1), XMM4 ) /* uy */ 167 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* uy | uy */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 173 ADDPS ( XMM4, XMM3 ) 180 MOVSS ( S(1), XMM4 ) /* uy */ 181 MULSS ( XMM7, XMM4 ) /* uy*m9*scale */ [all …]
|
/dports/graphics/mesa-dri-gallium/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_xform3.S | 87 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox | ox */ 97 ADDPS ( XMM5, XMM4 ) 98 ADDPS ( XMM6, XMM4 ) 99 ADDPS ( XMM3, XMM4 ) 101 MOVAPS ( XMM4, REGOFF(0, EDI) ) 353 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* oy | oy */ 356 ADDPS ( XMM4, XMM3 ) 478 MOVSS( S(0), XMM4 ) 479 SHUFPS( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox */ 495 UNPCKHPS( XMM4, XMM4 ) [all …]
|
H A D | sse_normal.S | 143 MOVSS ( ARG_SCALE, XMM4 ) /* scale */ 144 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* scale | scale */ 146 MULPS ( XMM4, XMM0 ) /* m4*scale | m0*scale */ 150 MULPS ( XMM4, XMM1 ) /* m5*scale | m1*scale */ 166 MOVSS ( S(1), XMM4 ) /* uy */ 167 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* uy | uy */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 173 ADDPS ( XMM4, XMM3 ) 180 MOVSS ( S(1), XMM4 ) /* uy */ 181 MULSS ( XMM7, XMM4 ) /* uy*m9*scale */ [all …]
|
/dports/graphics/mesa-gallium-va/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_xform3.S | 87 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox | ox */ 97 ADDPS ( XMM5, XMM4 ) 98 ADDPS ( XMM6, XMM4 ) 99 ADDPS ( XMM3, XMM4 ) 101 MOVAPS ( XMM4, REGOFF(0, EDI) ) 353 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* oy | oy */ 356 ADDPS ( XMM4, XMM3 ) 478 MOVSS( S(0), XMM4 ) 479 SHUFPS( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox */ 495 UNPCKHPS( XMM4, XMM4 ) [all …]
|
H A D | sse_normal.S | 143 MOVSS ( ARG_SCALE, XMM4 ) /* scale */ 144 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* scale | scale */ 146 MULPS ( XMM4, XMM0 ) /* m4*scale | m0*scale */ 150 MULPS ( XMM4, XMM1 ) /* m5*scale | m1*scale */ 166 MOVSS ( S(1), XMM4 ) /* uy */ 167 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* uy | uy */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 173 ADDPS ( XMM4, XMM3 ) 180 MOVSS ( S(1), XMM4 ) /* uy */ 181 MULSS ( XMM7, XMM4 ) /* uy*m9*scale */ [all …]
|
/dports/graphics/mesa-dri-classic/mesa-20.2.3/src/mesa/x86/ |
H A D | sse_xform3.S | 87 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox | ox */ 97 ADDPS ( XMM5, XMM4 ) 98 ADDPS ( XMM6, XMM4 ) 99 ADDPS ( XMM3, XMM4 ) 101 MOVAPS ( XMM4, REGOFF(0, EDI) ) 353 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* oy | oy */ 356 ADDPS ( XMM4, XMM3 ) 478 MOVSS( S(0), XMM4 ) 479 SHUFPS( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox */ 495 UNPCKHPS( XMM4, XMM4 ) [all …]
|
H A D | sse_normal.S | 143 MOVSS ( ARG_SCALE, XMM4 ) /* scale */ 144 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* scale | scale */ 146 MULPS ( XMM4, XMM0 ) /* m4*scale | m0*scale */ 150 MULPS ( XMM4, XMM1 ) /* m5*scale | m1*scale */ 166 MOVSS ( S(1), XMM4 ) /* uy */ 167 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* uy | uy */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 173 ADDPS ( XMM4, XMM3 ) 180 MOVSS ( S(1), XMM4 ) /* uy */ 181 MULSS ( XMM7, XMM4 ) /* uy*m9*scale */ [all …]
|
/dports/graphics/mesa-gallium-vdpau/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_xform3.S | 87 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox | ox */ 97 ADDPS ( XMM5, XMM4 ) 98 ADDPS ( XMM6, XMM4 ) 99 ADDPS ( XMM3, XMM4 ) 101 MOVAPS ( XMM4, REGOFF(0, EDI) ) 353 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* oy | oy */ 356 ADDPS ( XMM4, XMM3 ) 478 MOVSS( S(0), XMM4 ) 479 SHUFPS( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox */ 495 UNPCKHPS( XMM4, XMM4 ) [all …]
|
H A D | sse_normal.S | 143 MOVSS ( ARG_SCALE, XMM4 ) /* scale */ 144 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* scale | scale */ 146 MULPS ( XMM4, XMM0 ) /* m4*scale | m0*scale */ 150 MULPS ( XMM4, XMM1 ) /* m5*scale | m1*scale */ 166 MOVSS ( S(1), XMM4 ) /* uy */ 167 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* uy | uy */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 173 ADDPS ( XMM4, XMM3 ) 180 MOVSS ( S(1), XMM4 ) /* uy */ 181 MULSS ( XMM7, XMM4 ) /* uy*m9*scale */ [all …]
|
/dports/graphics/mesa-gallium-xa/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_xform3.S | 87 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox | ox */ 97 ADDPS ( XMM5, XMM4 ) 98 ADDPS ( XMM6, XMM4 ) 99 ADDPS ( XMM3, XMM4 ) 101 MOVAPS ( XMM4, REGOFF(0, EDI) ) 353 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* oy | oy */ 356 ADDPS ( XMM4, XMM3 ) 478 MOVSS( S(0), XMM4 ) 479 SHUFPS( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox */ 495 UNPCKHPS( XMM4, XMM4 ) [all …]
|
H A D | sse_normal.S | 143 MOVSS ( ARG_SCALE, XMM4 ) /* scale */ 144 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* scale | scale */ 146 MULPS ( XMM4, XMM0 ) /* m4*scale | m0*scale */ 150 MULPS ( XMM4, XMM1 ) /* m5*scale | m1*scale */ 166 MOVSS ( S(1), XMM4 ) /* uy */ 167 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* uy | uy */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 173 ADDPS ( XMM4, XMM3 ) 180 MOVSS ( S(1), XMM4 ) /* uy */ 181 MULSS ( XMM7, XMM4 ) /* uy*m9*scale */ [all …]
|
/dports/graphics/mesa-dri/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_xform3.S | 87 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox | ox */ 97 ADDPS ( XMM5, XMM4 ) 98 ADDPS ( XMM6, XMM4 ) 99 ADDPS ( XMM3, XMM4 ) 101 MOVAPS ( XMM4, REGOFF(0, EDI) ) 353 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* oy | oy */ 356 ADDPS ( XMM4, XMM3 ) 478 MOVSS( S(0), XMM4 ) 479 SHUFPS( CONST(0x0), XMM4, XMM4 ) /* ox | ox | ox */ 495 UNPCKHPS( XMM4, XMM4 ) [all …]
|
H A D | sse_normal.S | 143 MOVSS ( ARG_SCALE, XMM4 ) /* scale */ 144 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* scale | scale */ 146 MULPS ( XMM4, XMM0 ) /* m4*scale | m0*scale */ 150 MULPS ( XMM4, XMM1 ) /* m5*scale | m1*scale */ 166 MOVSS ( S(1), XMM4 ) /* uy */ 167 SHUFPS ( CONST(0x0), XMM4, XMM4 ) /* uy | uy */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 173 ADDPS ( XMM4, XMM3 ) 180 MOVSS ( S(1), XMM4 ) /* uy */ 181 MULSS ( XMM7, XMM4 ) /* uy*m9*scale */ [all …]
|
/dports/math/igraph/igraph-0.9.5/vendor/plfit/ |
H A D | arithmetic_sse_double.h | 111 XMM0 = _mm_sub_pd(XMM0, XMM4); \ 152 XMM0 = _mm_sub_pd(XMM0, XMM4); \ 189 XMM4 = _mm_mul_pd(XMM4, XMM0); \ 193 _mm_store_pd((y)+i , XMM4); \ 230 __m128d XMM2, XMM3, XMM4, XMM5; \ 234 XMM4 = _mm_load_pd((y)+i ); \ 236 XMM2 = _mm_mul_pd(XMM2, XMM4); \ 252 __m128d XMM2, XMM3, XMM4, XMM5; \ 256 XMM4 = XMM2; \ 276 __m128d XMM2, XMM3, XMM4, XMM5; \ [all …]
|