/dports/audio/aften/aften-0.0.8/libaften/x86/ |
H A D | x86_sse_mdct_common.c | 75 XMM1 = _mm_shuffle_ps(XMM1, XMM1, _MM_SHUFFLE(0,1,0,1)); in mdct_butterfly_8() 114 XMM1 = _mm_shuffle_ps(XMM1, XMM1, _MM_SHUFFLE(2,3,0,0)); in mdct_butterfly_16() 121 XMM1 = _mm_mul_ps(XMM1, XMM4); in mdct_butterfly_16() 191 XMM1 = _mm_shuffle_ps(XMM1, XMM1, _MM_SHUFFLE(2,3,1,1)); in mdct_butterfly_32() 206 XMM1 = _mm_add_ps(XMM1, XMM5); in mdct_butterfly_32() 250 XMM1 = _mm_shuffle_ps(XMM1 , XMM1 , _MM_SHUFFLE(3,3,1,1)); in mdct_butterfly_first() 307 XMM1 = _mm_shuffle_ps(XMM1, XMM1, _MM_SHUFFLE(2,2,0,0)); in mdct_butterfly_generic() 376 XMM1 = _mm_shuffle_ps(XMM1, XMM1, _MM_SHUFFLE(2,2,0,0)); in mdct_butterfly_generic() 532 XMM1 = _mm_shuffle_ps(XMM1, XMM1, _MM_SHUFFLE(2,2,1,1)); in mdct() 563 XMM1 = _mm_shuffle_ps(XMM1, XMM1, _MM_SHUFFLE(0,1,2,3)); in mdct() [all …]
|
H A D | x86_sse_mdct_common_init.c | 156 XMM1 = _mm_xor_ps(XMM1, PCS_RNNR.v); in sse_mdct_ctx_init() 183 XMM1 = _mm_xor_ps(XMM1, PCS_RNNR.v); in sse_mdct_ctx_init() 201 XMM1 = _mm_shuffle_ps(XMM1, XMM2,_MM_SHUFFLE(0,2,0,2)); in sse_mdct_ctx_init() 203 XMM1 = _mm_mul_ps(XMM1, pscalem); in sse_mdct_ctx_init() 206 XMM1 = _mm_shuffle_ps(XMM1, XMM1, _MM_SHUFFLE(0,1,2,3)); in sse_mdct_ctx_init() 232 XMM1 = _mm_xor_ps(XMM1, PCS_RNRN.v); in sse_mdct_ctx_init() 238 XMM1 = _mm_xor_ps(XMM1, PCS_RRRR.v); in sse_mdct_ctx_init() 269 XMM1 = _mm_xor_ps(XMM1, PCS_RNRN.v); in sse_mdct_ctx_init() 298 XMM1 = _mm_xor_ps(XMM1, PCS_RNRN.v); in sse_mdct_ctx_init() 331 XMM1 = _mm_xor_ps(XMM1, PCS_RNRN.v); in sse_mdct_ctx_init() [all …]
|
/dports/math/igraph/igraph-0.9.5/vendor/plfit/ |
H A D | arithmetic_sse_float.h | 102 XMM1 = _mm_xor_ps(XMM1, XMM4); \ 122 XMM1 = _mm_mul_ps(XMM1, XMM7); \ 143 XMM1 = _mm_sub_ps(XMM1, XMM5); \ 161 XMM1 = _mm_mul_ps(XMM1, XMM7); \ 229 XMM1 = _mm_add_ps(XMM1, XMM3); \ 255 XMM1 = _mm_mul_ss(XMM1, XMM1); \ 256 XMM1 = _mm_mul_ss(XMM1, XMM3); \ 257 XMM1 = _mm_mul_ss(XMM1, XMM0); \ 284 XMM1 = _mm_mul_ss(XMM1, XMM1); \ 285 XMM1 = _mm_mul_ss(XMM1, XMM3); \ [all …]
|
H A D | arithmetic_sse_double.h | 93 _mm_store_pd((y)+i+2, XMM1); \ 112 XMM1 = _mm_sub_pd(XMM1, XMM5); \ 132 XMM1 = _mm_mul_pd(XMM1, XMM7); \ 153 XMM1 = _mm_sub_pd(XMM1, XMM5); \ 171 XMM1 = _mm_mul_pd(XMM1, XMM7); \ 239 XMM1 = _mm_add_pd(XMM1, XMM3); \ 241 XMM0 = _mm_add_pd(XMM0, XMM1); \ 243 XMM0 = _mm_add_pd(XMM0, XMM1); \ 261 XMM1 = _mm_add_pd(XMM1, XMM3); \ 263 XMM0 = _mm_add_pd(XMM0, XMM1); \ [all …]
|
/dports/science/InsightToolkit/ITK-5.0.1/Modules/ThirdParty/libLBFGS/src/ |
H A D | arithmetic_sse_float.h | 109 XMM1 = _mm_xor_ps(XMM1, XMM4); \ 129 XMM1 = _mm_mul_ps(XMM1, XMM7); \ 150 XMM1 = _mm_sub_ps(XMM1, XMM5); \ 168 XMM1 = _mm_mul_ps(XMM1, XMM7); \ 236 XMM1 = _mm_add_ps(XMM1, XMM3); \ 262 XMM1 = _mm_mul_ss(XMM1, XMM1); \ 263 XMM1 = _mm_mul_ss(XMM1, XMM3); \ 264 XMM1 = _mm_mul_ss(XMM1, XMM0); \ 291 XMM1 = _mm_mul_ss(XMM1, XMM1); \ 292 XMM1 = _mm_mul_ss(XMM1, XMM3); \ [all …]
|
H A D | arithmetic_sse_double.h | 93 _mm_store_pd((y)+i+2, XMM1); \ 112 XMM1 = _mm_sub_pd(XMM1, XMM5); \ 132 XMM1 = _mm_mul_pd(XMM1, XMM7); \ 153 XMM1 = _mm_sub_pd(XMM1, XMM5); \ 171 XMM1 = _mm_mul_pd(XMM1, XMM7); \ 239 XMM1 = _mm_add_pd(XMM1, XMM3); \ 241 XMM0 = _mm_add_pd(XMM0, XMM1); \ 243 XMM0 = _mm_add_pd(XMM0, XMM1); \ 261 XMM1 = _mm_add_pd(XMM1, XMM3); \ 263 XMM0 = _mm_add_pd(XMM0, XMM1); \ [all …]
|
/dports/math/R-cran-igraph/igraph/src/plfit/ |
H A D | arithmetic_sse_float.h | 102 XMM1 = _mm_xor_ps(XMM1, XMM4); \ 122 XMM1 = _mm_mul_ps(XMM1, XMM7); \ 143 XMM1 = _mm_sub_ps(XMM1, XMM5); \ 161 XMM1 = _mm_mul_ps(XMM1, XMM7); \ 229 XMM1 = _mm_add_ps(XMM1, XMM3); \ 255 XMM1 = _mm_mul_ss(XMM1, XMM1); \ 256 XMM1 = _mm_mul_ss(XMM1, XMM3); \ 257 XMM1 = _mm_mul_ss(XMM1, XMM0); \ 284 XMM1 = _mm_mul_ss(XMM1, XMM1); \ 285 XMM1 = _mm_mul_ss(XMM1, XMM3); \ [all …]
|
H A D | arithmetic_sse_double.h | 93 _mm_store_pd((y)+i+2, XMM1); \ 112 XMM1 = _mm_sub_pd(XMM1, XMM5); \ 132 XMM1 = _mm_mul_pd(XMM1, XMM7); \ 153 XMM1 = _mm_sub_pd(XMM1, XMM5); \ 171 XMM1 = _mm_mul_pd(XMM1, XMM7); \ 239 XMM1 = _mm_add_pd(XMM1, XMM3); \ 241 XMM0 = _mm_add_pd(XMM0, XMM1); \ 243 XMM0 = _mm_add_pd(XMM0, XMM1); \ 261 XMM1 = _mm_add_pd(XMM1, XMM3); \ 263 XMM0 = _mm_add_pd(XMM0, XMM1); \ [all …]
|
/dports/science/PETSc/petsc-3.14.1/src/mat/impls/baij/seq/ |
H A D | dgefa4.c | 209 SSE_SUB_PS(XMM1,XMM0) in PetscKernel_A_gets_inverse_A_4_SSE() 226 SSE_ADD_PS(XMM2,XMM1) in PetscKernel_A_gets_inverse_A_4_SSE() 235 SSE_SUB_PS(XMM2,XMM1) in PetscKernel_A_gets_inverse_A_4_SSE() 264 SSE_SUB_PS(XMM0,XMM1) in PetscKernel_A_gets_inverse_A_4_SSE() 277 SSE_SHUFFLE(XMM1,XMM1,0xB1) in PetscKernel_A_gets_inverse_A_4_SSE() 287 SSE_SHUFFLE(XMM1,XMM1,0x4E) in PetscKernel_A_gets_inverse_A_4_SSE() 294 SSE_SUB_PS(XMM2,XMM1) in PetscKernel_A_gets_inverse_A_4_SSE() 302 SSE_SHUFFLE(XMM1,XMM1,0xB1) in PetscKernel_A_gets_inverse_A_4_SSE() 313 SSE_SHUFFLE(XMM1,XMM1,0x4E) in PetscKernel_A_gets_inverse_A_4_SSE() 320 SSE_SUB_PS(XMM2,XMM1) in PetscKernel_A_gets_inverse_A_4_SSE() [all …]
|
/dports/math/openblas/OpenBLAS-0.3.18/kernel/x86_64/ |
H A D | dgemm_kernel_6x4_piledriver.S | 241 VXOR1282(XMM1,XMM1,XMM1); 266 VMA1282(XMM13,XMM15,XMM1,XMM1); 472 VXOR1282(XMM1,XMM1,XMM1); 648 VXOR1282(XMM1,XMM1,XMM1); 773 VXOR1281(XMM1,XMM1,XMM1); 919 VXOR1282(XMM1,XMM1,XMM1); 1070 VXOR1282(XMM1,XMM1,XMM1); 1188 VXOR1282(XMM1,XMM1,XMM1); 1277 VXOR1281(XMM1,XMM1,XMM1); 1382 VXOR1282(XMM1,XMM1,XMM1); [all …]
|
/dports/emulators/ppsspp-qt5/ppsspp-1.12.3/Core/MIPS/x86/ |
H A D | CompVFPU.cpp | 191 XORPS(XMM1, R(XMM1)); in ApplyPrefixD() 1323 XORPS(XMM1, R(XMM1)); in Comp_Vcmp() 1458 PCMPEQW(XMM1, R(XMM1)); in Comp_Vcmp() 1646 XORPS(XMM1, R(XMM1)); in Comp_Vh2f() 1757 PXOR(XMM1, R(XMM1)); in Comp_Vx2i() 2337 XORPS(XMM1, R(XMM1)); in Comp_VV2Op() 3265 PXOR(XMM1, R(XMM1)); in Comp_Vi2x() 3274 PXOR(XMM1, R(XMM1)); in Comp_Vi2x() 3348 XORPS(XMM1, R(XMM1)); in Comp_Vhoriz() 3362 XORPS(XMM1, R(XMM1)); in Comp_Vhoriz() [all …]
|
/dports/emulators/ppsspp/ppsspp-1.12.3/Core/MIPS/x86/ |
H A D | CompVFPU.cpp | 191 XORPS(XMM1, R(XMM1)); in ApplyPrefixD() 1323 XORPS(XMM1, R(XMM1)); in Comp_Vcmp() 1458 PCMPEQW(XMM1, R(XMM1)); in Comp_Vcmp() 1646 XORPS(XMM1, R(XMM1)); in Comp_Vh2f() 1757 PXOR(XMM1, R(XMM1)); in Comp_Vx2i() 2337 XORPS(XMM1, R(XMM1)); in Comp_VV2Op() 3265 PXOR(XMM1, R(XMM1)); in Comp_Vi2x() 3274 PXOR(XMM1, R(XMM1)); in Comp_Vi2x() 3348 XORPS(XMM1, R(XMM1)); in Comp_Vhoriz() 3362 XORPS(XMM1, R(XMM1)); in Comp_Vhoriz() [all …]
|
/dports/emulators/libretro-ppsspp/ppsspp-1.12.3/Core/MIPS/x86/ |
H A D | CompVFPU.cpp | 191 XORPS(XMM1, R(XMM1)); in ApplyPrefixD() 1323 XORPS(XMM1, R(XMM1)); in Comp_Vcmp() 1458 PCMPEQW(XMM1, R(XMM1)); in Comp_Vcmp() 1646 XORPS(XMM1, R(XMM1)); in Comp_Vh2f() 1757 PXOR(XMM1, R(XMM1)); in Comp_Vx2i() 2337 XORPS(XMM1, R(XMM1)); in Comp_VV2Op() 3265 PXOR(XMM1, R(XMM1)); in Comp_Vi2x() 3274 PXOR(XMM1, R(XMM1)); in Comp_Vi2x() 3348 XORPS(XMM1, R(XMM1)); in Comp_Vhoriz() 3362 XORPS(XMM1, R(XMM1)); in Comp_Vhoriz() [all …]
|
/dports/emulators/dolphin-emu/dolphin-3152428/Source/Core/Core/PowerPC/Jit64/ |
H A D | Jit_FloatingPoint.cpp | 271 MOVDDUP(XMM1, Rc); in fmaddXX() 273 Force25BitPrecision(XMM1, R(XMM1), XMM0); in fmaddXX() 278 Force25BitPrecision(XMM1, R(XMM1), XMM0); in fmaddXX() 331 MOVAPD(XMM1, Rb); in fmaddXX() 347 MULPD(XMM1, Ra); in fmaddXX() 355 MULSD(XMM1, Ra); in fmaddXX() 372 HandleNaNs(inst, XMM1, XMM1); in fmaddXX() 373 MOVSD(Rd, R(XMM1)); in fmaddXX() 468 MOVAPD(XMM1, Rc); in fselx() 475 ANDNPD(XMM1, Rc); in fselx() [all …]
|
/dports/lang/fpc-source/fpc-3.2.2/tests/test/ |
H A D | taes1.pp | 38 PSHUFD XMM1, XMM1, 011100101b; MOVD EBX, XMM1; XOR EAX, EBX; MOV [RCX], EAX; ADD RCX, 4 39 PSHUFD XMM1, XMM1, 011100110b; MOVD EBX, XMM1; XOR EAX, EBX; MOV [RCX], EAX; ADD RCX, 4 40 PSHUFD XMM1, XMM1, 011100111b; MOVD EBX, XMM1; XOR EAX, EBX; MOV [RCX], EAX; ADD RCX, 4 46 MOVDQU XMM1, [RDX]; ADD RDX, $10; MOVDQU XMM3, [RDX] 56 MOVDQU XMM1, [RCX]; MOVDQU XMM3, [RCX+16] 57 MOVDQU [RDX], XMM1; MOVDQU [RDX + $10], XMM3 70 AESIMC XMM1, XMM1; AESIMC XMM2, XMM2; AESIMC XMM3, XMM3; AESIMC XMM4, XMM4 92 MOVDQU XMM1, [R9+16*1] 111 AESENC XMM15, XMM1 140 MOVDQU XMM1, [R9+16*1] [all …]
|
/dports/graphics/libosmesa-gallium/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_normal.S | 77 MOVSS ( M(0), XMM1 ) /* m0 */ 79 UNPCKLPS( XMM2, XMM1 ) /* m5 | m0 */ 140 MOVSS ( M(4), XMM1 ) /* m4 */ 141 UNPCKLPS( XMM1, XMM0 ) /* m4 | m0 */ 147 MOVSS ( M(1), XMM1 ) /* m1 */ 149 UNPCKLPS( XMM2, XMM1 ) /* m5 | m1 */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 233 MOVSS( M(5), XMM1 ) /* m5 */ 234 UNPCKLPS( XMM1, XMM0 ) /* m5 | m0 */ 235 MOVSS( M(10), XMM1 ) /* m10 */ [all …]
|
/dports/lang/clover/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_normal.S | 77 MOVSS ( M(0), XMM1 ) /* m0 */ 79 UNPCKLPS( XMM2, XMM1 ) /* m5 | m0 */ 140 MOVSS ( M(4), XMM1 ) /* m4 */ 141 UNPCKLPS( XMM1, XMM0 ) /* m4 | m0 */ 147 MOVSS ( M(1), XMM1 ) /* m1 */ 149 UNPCKLPS( XMM2, XMM1 ) /* m5 | m1 */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 233 MOVSS( M(5), XMM1 ) /* m5 */ 234 UNPCKLPS( XMM1, XMM0 ) /* m5 | m0 */ 235 MOVSS( M(10), XMM1 ) /* m10 */ [all …]
|
/dports/graphics/libosmesa/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_normal.S | 77 MOVSS ( M(0), XMM1 ) /* m0 */ 79 UNPCKLPS( XMM2, XMM1 ) /* m5 | m0 */ 140 MOVSS ( M(4), XMM1 ) /* m4 */ 141 UNPCKLPS( XMM1, XMM0 ) /* m4 | m0 */ 147 MOVSS ( M(1), XMM1 ) /* m1 */ 149 UNPCKLPS( XMM2, XMM1 ) /* m5 | m1 */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 233 MOVSS( M(5), XMM1 ) /* m5 */ 234 UNPCKLPS( XMM1, XMM0 ) /* m5 | m0 */ 235 MOVSS( M(10), XMM1 ) /* m10 */ [all …]
|
/dports/graphics/mesa-libs/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_normal.S | 77 MOVSS ( M(0), XMM1 ) /* m0 */ 79 UNPCKLPS( XMM2, XMM1 ) /* m5 | m0 */ 140 MOVSS ( M(4), XMM1 ) /* m4 */ 141 UNPCKLPS( XMM1, XMM0 ) /* m4 | m0 */ 147 MOVSS ( M(1), XMM1 ) /* m1 */ 149 UNPCKLPS( XMM2, XMM1 ) /* m5 | m1 */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 233 MOVSS( M(5), XMM1 ) /* m5 */ 234 UNPCKLPS( XMM1, XMM0 ) /* m5 | m0 */ 235 MOVSS( M(10), XMM1 ) /* m10 */ [all …]
|
/dports/graphics/mesa-dri-gallium/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_normal.S | 77 MOVSS ( M(0), XMM1 ) /* m0 */ 79 UNPCKLPS( XMM2, XMM1 ) /* m5 | m0 */ 140 MOVSS ( M(4), XMM1 ) /* m4 */ 141 UNPCKLPS( XMM1, XMM0 ) /* m4 | m0 */ 147 MOVSS ( M(1), XMM1 ) /* m1 */ 149 UNPCKLPS( XMM2, XMM1 ) /* m5 | m1 */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 233 MOVSS( M(5), XMM1 ) /* m5 */ 234 UNPCKLPS( XMM1, XMM0 ) /* m5 | m0 */ 235 MOVSS( M(10), XMM1 ) /* m10 */ [all …]
|
/dports/graphics/mesa-gallium-va/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_normal.S | 77 MOVSS ( M(0), XMM1 ) /* m0 */ 79 UNPCKLPS( XMM2, XMM1 ) /* m5 | m0 */ 140 MOVSS ( M(4), XMM1 ) /* m4 */ 141 UNPCKLPS( XMM1, XMM0 ) /* m4 | m0 */ 147 MOVSS ( M(1), XMM1 ) /* m1 */ 149 UNPCKLPS( XMM2, XMM1 ) /* m5 | m1 */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 233 MOVSS( M(5), XMM1 ) /* m5 */ 234 UNPCKLPS( XMM1, XMM0 ) /* m5 | m0 */ 235 MOVSS( M(10), XMM1 ) /* m10 */ [all …]
|
/dports/graphics/mesa-dri-classic/mesa-20.2.3/src/mesa/x86/ |
H A D | sse_normal.S | 77 MOVSS ( M(0), XMM1 ) /* m0 */ 79 UNPCKLPS( XMM2, XMM1 ) /* m5 | m0 */ 140 MOVSS ( M(4), XMM1 ) /* m4 */ 141 UNPCKLPS( XMM1, XMM0 ) /* m4 | m0 */ 147 MOVSS ( M(1), XMM1 ) /* m1 */ 149 UNPCKLPS( XMM2, XMM1 ) /* m5 | m1 */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 233 MOVSS( M(5), XMM1 ) /* m5 */ 234 UNPCKLPS( XMM1, XMM0 ) /* m5 | m0 */ 235 MOVSS( M(10), XMM1 ) /* m10 */ [all …]
|
/dports/graphics/mesa-gallium-vdpau/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_normal.S | 77 MOVSS ( M(0), XMM1 ) /* m0 */ 79 UNPCKLPS( XMM2, XMM1 ) /* m5 | m0 */ 140 MOVSS ( M(4), XMM1 ) /* m4 */ 141 UNPCKLPS( XMM1, XMM0 ) /* m4 | m0 */ 147 MOVSS ( M(1), XMM1 ) /* m1 */ 149 UNPCKLPS( XMM2, XMM1 ) /* m5 | m1 */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 233 MOVSS( M(5), XMM1 ) /* m5 */ 234 UNPCKLPS( XMM1, XMM0 ) /* m5 | m0 */ 235 MOVSS( M(10), XMM1 ) /* m10 */ [all …]
|
/dports/graphics/mesa-gallium-xa/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_normal.S | 77 MOVSS ( M(0), XMM1 ) /* m0 */ 79 UNPCKLPS( XMM2, XMM1 ) /* m5 | m0 */ 140 MOVSS ( M(4), XMM1 ) /* m4 */ 141 UNPCKLPS( XMM1, XMM0 ) /* m4 | m0 */ 147 MOVSS ( M(1), XMM1 ) /* m1 */ 149 UNPCKLPS( XMM2, XMM1 ) /* m5 | m1 */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 233 MOVSS( M(5), XMM1 ) /* m5 */ 234 UNPCKLPS( XMM1, XMM0 ) /* m5 | m0 */ 235 MOVSS( M(10), XMM1 ) /* m10 */ [all …]
|
/dports/graphics/mesa-dri/mesa-21.3.6/src/mesa/x86/ |
H A D | sse_normal.S | 77 MOVSS ( M(0), XMM1 ) /* m0 */ 79 UNPCKLPS( XMM2, XMM1 ) /* m5 | m0 */ 140 MOVSS ( M(4), XMM1 ) /* m4 */ 141 UNPCKLPS( XMM1, XMM0 ) /* m4 | m0 */ 147 MOVSS ( M(1), XMM1 ) /* m1 */ 149 UNPCKLPS( XMM2, XMM1 ) /* m5 | m1 */ 168 MULPS ( XMM1, XMM4 ) /* uy*m5 | uy*m1 */ 233 MOVSS( M(5), XMM1 ) /* m5 */ 234 UNPCKLPS( XMM1, XMM0 ) /* m5 | m0 */ 235 MOVSS( M(10), XMM1 ) /* m10 */ [all …]
|