Home
last modified time | relevance | path

Searched refs:_mm256_castpd256_pd128 (Results 1 – 25 of 199) sorted by relevance

12345678

/dports/math/blasfeo/blasfeo-0.1.2/kernel/avx/
H A Dkernel_dgecp_lib4.c385 c_0 = _mm_mul_pd( _mm256_castpd256_pd128( alpha_0 ), c_0 ); in kernel_dgecpsc_8_0_lib4()
388 c_0 = _mm_mul_pd( _mm256_castpd256_pd128( alpha_0 ), c_0 ); in kernel_dgecpsc_8_0_lib4()
395 c_0 = _mm_mul_pd( _mm256_castpd256_pd128( alpha_0 ), c_0 ); in kernel_dgecpsc_8_0_lib4()
402 c_0 = _mm_mul_pd( _mm256_castpd256_pd128( alpha_0 ), c_0 ); in kernel_dgecpsc_8_0_lib4()
413 c_0 = _mm_mul_pd( _mm256_castpd256_pd128( alpha_0 ), c_0 ); in kernel_dgecpsc_8_0_lib4()
416 c_0 = _mm_mul_pd( _mm256_castpd256_pd128( alpha_0 ), c_0 ); in kernel_dgecpsc_8_0_lib4()
420 c_0 = _mm_mul_pd( _mm256_castpd256_pd128( alpha_0 ), c_0 ); in kernel_dgecpsc_8_0_lib4()
3266 _mm_store_sd( &A[5], _mm256_castpd256_pd128( a0 ) ); in kernel_dtrset_4_lib4()
3267 _mm_store_pd( &A[6], _mm256_castpd256_pd128( a0 ) ); in kernel_dtrset_4_lib4()
3269 _mm_store_pd( &A[10], _mm256_castpd256_pd128( a0 ) ); in kernel_dtrset_4_lib4()
[all …]
H A Dkernel_dgetrf_pivot_lib.c188 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_8_lib()
392 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_8_lib()
581 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_8_lib()
754 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_8_lib()
912 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_8_lib()
1053 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_8_lib()
1178 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_8_lib()
1287 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_8_lib()
1543 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_4_lib()
1683 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_4_lib()
[all …]
/dports/math/blis/blis-0.8.1/kernels/zen/3/sup/broken/
H A Dbli_gemmsup_rv_zen_asm_z3x4n.c261 _mm_storeu_pd((double *)(tC ), _mm256_castpd256_pd128(ymm4)); in bli_zgemmsup_rv_zen_asm_3x4n()
262 _mm_storeu_pd((double *)(tC+1), _mm256_castpd256_pd128(ymm8)); in bli_zgemmsup_rv_zen_asm_3x4n()
272 _mm_storeu_pd((double *)(tC ), _mm256_castpd256_pd128(ymm5)); in bli_zgemmsup_rv_zen_asm_3x4n()
273 _mm_storeu_pd((double *)(tC+1), _mm256_castpd256_pd128(ymm9)); in bli_zgemmsup_rv_zen_asm_3x4n()
643 _mm_storeu_pd((double *)(tC), _mm256_castpd256_pd128(ymm4)); in bli_zgemmsup_rv_zen_asm_2x4n()
672 _mm_storeu_pd((double *)(tC), _mm256_castpd256_pd128(ymm5)); in bli_zgemmsup_rv_zen_asm_2x4n()
878 _mm_storeu_pd((double *)(tC), _mm256_castpd256_pd128(ymm4)); in bli_zgemmsup_rv_zen_asm_1x4n()
885 _mm_storeu_pd((double *)(tC), _mm256_castpd256_pd128(ymm5)); in bli_zgemmsup_rv_zen_asm_1x4n()
903 _mm_storeu_pd((double *)(tC), _mm256_castpd256_pd128(ymm4)); in bli_zgemmsup_rv_zen_asm_1x4n()
1110 _mm_storeu_pd((double *)(tC), _mm256_castpd256_pd128(ymm4)); in bli_zgemmsup_rv_zen_asm_3x2()
[all …]
/dports/science/gromacs/gromacs-2021.4/src/gromacs/simd/impl_x86_avx_256/
H A Dimpl_x86_avx_256_util_double.h167 _mm_storeu_pd(base + align * offset[0], _mm256_castpd256_pd128(t0)); in transposeScatterStoreU()
168 _mm_storeu_pd(base + align * offset[1], _mm256_castpd256_pd128(t1)); in transposeScatterStoreU()
212 tA = _mm_add_pd(tA, _mm256_castpd256_pd128(t0)); in transposeScatterIncrU()
213 tB = _mm_add_pd(tB, _mm256_castpd256_pd128(v2.simdInternal_)); in transposeScatterIncrU()
219 tA = _mm_add_pd(tA, _mm256_castpd256_pd128(t1)); in transposeScatterIncrU()
220 tB = _mm_add_pd(tB, _mm256_castpd256_pd128(v2.simdInternal_)); in transposeScatterIncrU()
274 tA = _mm_sub_pd(tA, _mm256_castpd256_pd128(t0)); in transposeScatterDecrU()
275 tB = _mm_sub_pd(tB, _mm256_castpd256_pd128(v2.simdInternal_)); in transposeScatterDecrU()
281 tA = _mm_sub_pd(tA, _mm256_castpd256_pd128(t1)); in transposeScatterDecrU()
282 tB = _mm_sub_pd(tB, _mm256_castpd256_pd128(v2.simdInternal_)); in transposeScatterDecrU()
[all …]
H A Dimpl_x86_avx_256_simd4_double.h207 tmp1 = _mm256_castpd256_pd128(a.simdInternal_); in dotProduct()
283 a0 = _mm256_castpd256_pd128(a.simdInternal_); in reduce()
/dports/multimedia/gstreamer1-plugins-rust/gst-plugins-rs-d0466b3eee114207f851b37cae0015c0e718f021/cargo-crates/rustfft-5.1.1/src/avx/
H A Davx64_utils.rs31 _mm256_castpd256_pd128(rows1[0]),
135 _mm256_castpd256_pd128(rows1[0]),
137 _mm256_castpd256_pd128(rows2[0]),
139 _mm256_castpd256_pd128(rows3[0]),
141 _mm256_castpd256_pd128(rows4[0]),
/dports/devel/libsimdpp/libsimdpp-2.1-400-g9dac213d/simdpp/detail/shuffle/
H A Dsse_float64_4x2.h151 __m128d a1 = _mm256_castpd256_pd128(a.native());
152 __m128d b1 = _mm256_castpd256_pd128(b.native());
171 __m128d a1 = _mm256_castpd256_pd128(a.native());
172 __m128d b1 = _mm256_castpd256_pd128(b.native());
/dports/devel/inastemp/inastemp-0.2.4/Src/AVX/
H A DInaVecAVXDouble.hpp251 const __m128d rest = _mm256_castpd256_pd128(vec); in horizontalSum()
259 const __m128d rest = _mm256_castpd256_pd128(vec); in horizontalMul()
305 __m128d vallower = _mm256_castpd256_pd128(x); in exp()
341 __m128d vallower = _mm256_castpd256_pd128(x); in expLowAcc()
601 __m128d vallower = _mm256_castpd256_pd128(val_a01_b01_a23_b23); in MultiHorizontalSum()
/dports/audio/libsoxr/soxr-0.1.3-Source/src/
H A Ddev64s.h36 _mm_store_sd(a, _mm256_castpd256_pd128(_mm256_hadd_pd(b,b)));} in vStorSum()
/dports/audio/audacity/audacity-Audacity-3.1.3/lib-src/libsoxr/src/
H A Ddev64s.h36 _mm_store_sd(a, _mm256_castpd256_pd128(_mm256_hadd_pd(b,b)));} in vStorSum()
/dports/graphics/povray38/povunix-v3.8.0-beta.2-src/platform/x86/avx2fma3/
H A Davx2fma3noise.cpp273 sumr_up = _mm_add_pd(_mm256_castpd256_pd128(sumr),sumr_up); in AVX2FMA3Noise()
472 xy_up = _mm_add_pd(_mm256_castpd256_pd128(xy),xy_up); in AVX2FMA3DNoise()
476 z_up = _mm_add_pd(_mm256_castpd256_pd128(z),z_up); in AVX2FMA3DNoise()
/dports/audio/gogglesmm/gogglesmm-1.2.2/cfox/lib/
H A DFXMat3d.cpp55 #define _mm256_storeu_sd(p,x) _mm_storel_pd(p,_mm256_castpd256_pd128(x))
58 #define _mm256_store_sd(p,x) _mm_storel_pd(p,_mm256_castpd256_pd128(x))
61 …56_div_sd(a,b) _mm256_castpd128_pd256(_mm_div_sd(_mm256_castpd256_pd128(a),_mm256_castpd256_pd1…
62 …56_mul_sd(a,b) _mm256_castpd128_pd256(_mm_mul_sd(_mm256_castpd256_pd128(a),_mm256_castpd256_pd1…
63 …56_add_sd(a,b) _mm256_castpd128_pd256(_mm_add_sd(_mm256_castpd256_pd128(a),_mm256_castpd256_pd1…
64 …56_sub_sd(a,b) _mm256_castpd128_pd256(_mm_sub_sd(_mm256_castpd256_pd128(a),_mm256_castpd256_pd1…
/dports/x11-toolkits/fox17/fox-1.7.77/lib/
H A DFXMat3d.cpp55 #define _mm256_storeu_sd(p,x) _mm_storel_pd(p,_mm256_castpd256_pd128(x))
58 #define _mm256_store_sd(p,x) _mm_storel_pd(p,_mm256_castpd256_pd128(x))
61 …56_div_sd(a,b) _mm256_castpd128_pd256(_mm_div_sd(_mm256_castpd256_pd128(a),_mm256_castpd256_pd1…
62 …56_mul_sd(a,b) _mm256_castpd128_pd256(_mm_mul_sd(_mm256_castpd256_pd128(a),_mm256_castpd256_pd1…
63 …56_add_sd(a,b) _mm256_castpd128_pd256(_mm_add_sd(_mm256_castpd256_pd128(a),_mm256_castpd256_pd1…
64 …56_sub_sd(a,b) _mm256_castpd128_pd256(_mm_sub_sd(_mm256_castpd256_pd128(a),_mm256_castpd256_pd1…
/dports/graphics/povray38/povunix-v3.8.0-beta.2-src/platform/x86/avx/
H A Davxnoise.cpp286 sumr_up = _mm_add_pd(_mm256_castpd256_pd128(sumr),sumr_up); in AVXNoise()
485 xy_up = _mm_add_pd(_mm256_castpd256_pd128(xy),xy_up); in AVXDNoise()
489 z_up = _mm_add_pd(_mm256_castpd256_pd128(z),z_up); in AVXDNoise()
/dports/science/gromacs/gromacs-2021.4/src/gromacs/simd/impl_x86_avx_128_fma/
H A Dimpl_x86_avx_128_fma_simd4_double.h200 tmp1 = _mm256_castpd256_pd128(a.simdInternal_); in dotProduct()
276 a0 = _mm256_castpd256_pd128(a.simdInternal_); in reduce()
/dports/science/gromacs/gromacs-2021.4/src/gromacs/simd/impl_x86_avx_512/
H A Dimpl_x86_avx_512_simd4_double.h200 tmp1 = _mm256_castpd256_pd128(a.simdInternal_); in dotProduct()
284 a0 = _mm256_castpd256_pd128(a.simdInternal_); in reduce()
/dports/math/openblas/OpenBLAS-0.3.18/kernel/simd/
H A Dintrin_avx.h54 __m128d lo = _mm256_castpd256_pd128(sum_halves); in v_sum_f64()
/dports/math/py-numpy/numpy-1.20.3/numpy/core/src/common/simd/avx2/
H A Dmemory.h67 #define npyv_storel_f64(PTR, VEC) _mm_storeu_pd(PTR, _mm256_castpd256_pd128(VEC)) in NPYV_IMPL_AVX2_MEM_INT()
134 __m128d a0 = _mm256_castpd256_pd128(a); in npyv_storen_f64()
278 __m128d a0 = _mm256_castpd256_pd128(_mm256_castsi256_pd(a)); in npyv_storen_till_s64()
/dports/math/blasfeo/blasfeo-0.1.2/kernel/avx2/
H A Dkernel_dgetrf_pivot_lib.c188 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_12_lib()
423 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_12_lib()
646 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_12_lib()
856 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_12_lib()
1054 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_12_lib()
1238 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_12_lib()
1409 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_12_lib()
1567 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_12_lib()
1714 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_12_lib()
1846 inv = _mm_div_pd( _mm256_castpd256_pd128( ones ), inv ); in kernel_dgetrf_pivot_12_lib()
[all …]
/dports/lang/gcc10/gcc-10.3.0/gcc/testsuite/gcc.target/i386/
H A Davx-typecast-1.c60 fd.x = _mm256_castpd256_pd128 (c.x); in avx_test()
/dports/lang/gcc11-devel/gcc-11-20211009/gcc/testsuite/gcc.target/i386/
H A Davx-typecast-1.c60 fd.x = _mm256_castpd256_pd128 (c.x); in avx_test()
/dports/lang/gcc11/gcc-11.2.0/gcc/testsuite/gcc.target/i386/
H A Davx-typecast-1.c60 fd.x = _mm256_castpd256_pd128 (c.x); in avx_test()
/dports/devel/avr-gcc/gcc-10.2.0/gcc/testsuite/gcc.target/i386/
H A Davx-typecast-1.c60 fd.x = _mm256_castpd256_pd128 (c.x); in avx_test()
/dports/misc/cxx_atomics_pic/gcc-11.2.0/gcc/testsuite/gcc.target/i386/
H A Davx-typecast-1.c60 fd.x = _mm256_castpd256_pd128 (c.x); in avx_test()
/dports/lang/gcc10-devel/gcc-10-20211008/gcc/testsuite/gcc.target/i386/
H A Davx-typecast-1.c60 fd.x = _mm256_castpd256_pd128 (c.x); in avx_test()

12345678