/dports/math/openblas/OpenBLAS-0.3.18/kernel/x86_64/ |
H A D | sgemv_n_microk_skylakex-8.c | 55 for (BLASLONG idx_n = 0; idx_n < n; idx_n++) { in sgemv_kernel_n_128() local 56 xArray_0 = _mm512_set1_ps(x[idx_n]); in sgemv_kernel_n_128() 93 for (BLASLONG idx_n = 0; idx_n < n; idx_n++) { in sgemv_kernel_n_128() local 118 for (BLASLONG idx_n = 0; idx_n < n; idx_n++) { in sgemv_kernel_n_128() local 137 for (BLASLONG idx_n = 0; idx_n < n; idx_n++) { in sgemv_kernel_n_128() local 154 for(BLASLONG idx_n = 0; idx_n < n; idx_n++) { in sgemv_kernel_n_128() local 187 for (BLASLONG idx_n = 0; idx_n < n; idx_n++) { in sgemv_kernel_n_64() local 188 xv = _mm256_set1_ps(x[idx_n]); in sgemv_kernel_n_64() 211 for (BLASLONG idx_n = 0; idx_n < n; idx_n++) { in sgemv_kernel_n_64() local 227 for (BLASLONG idx_n = 0; idx_n < n; idx_n++) { in sgemv_kernel_n_64() local [all …]
|
H A D | bf16_common_macros.h | 81 regArray = _mm512_loadu_si512(&a[idx_m*lda + idx_n]); 151 #define BF16_VECTOR_LOAD_1x32(reg, x, idx_n) \ argument 152 reg = _mm512_loadu_si512(x + idx_n); 155 #define BF16_VECTOR_LOAD_1x16(reg, x, idx_n) \ argument 156 reg = _mm256_loadu_si256((__m256i *)(x + idx_n)); 159 #define BF16_VECTOR_LOAD_1x8(reg, x, idx_n) \ argument 160 reg = _mm_loadu_si128((__m128i *)(x + idx_n)); 163 #define BF16_VECTOR_MASKZ_LOAD_1x32(reg, x, idx_n, mask) \ argument 164 reg = _mm512_maskz_loadu_epi16(mask, x + idx_n); 168 reg = _mm256_maskz_loadu_epi16(mask, x + idx_n); [all …]
|
H A D | sbgemm_microk_cooperlake_template.c | 581 for (BLASLONG idx_n = n_from; idx_n < tag_n_Nx; idx_n += BF16_BLOCK_STEP_N) { in sbgemm_blocking_kernel_nn_alpha() local 595 for (BLASLONG idx_n = n_from; idx_n < tag_n_Nx; idx_n += BF16_BLOCK_STEP_N) { in sbgemm_blocking_kernel_nn_alpha() local 649 for (BLASLONG idx_n = n_from; idx_n < tag_n_Nx; idx_n += BF16_BLOCK_STEP_N) { in sbgemm_blocking_kernel_nn_alpha() local 676 for (BLASLONG idx_n = n_from; idx_n < tag_n_Nx; idx_n += BF16_BLOCK_STEP_N) { in sbgemm_blocking_kernel_nn_alpha() local 864 for (BLASLONG idx_n = n_from; idx_n < tag_n_Nx; idx_n += BF16_BLOCK_STEP_N) { in sbgemm_blocking_kernel_nt_alpha() local 878 for (BLASLONG idx_n = n_from; idx_n < tag_n_Nx; idx_n += BF16_BLOCK_STEP_N) { in sbgemm_blocking_kernel_nt_alpha() local 932 for (BLASLONG idx_n = n_from; idx_n < tag_n_Nx; idx_n += BF16_BLOCK_STEP_N) { in sbgemm_blocking_kernel_nt_alpha() local 960 for (BLASLONG idx_n = n_from; idx_n < tag_n_Nx; idx_n += BF16_BLOCK_STEP_N) { in sbgemm_blocking_kernel_nt_alpha() local 1401 for (BLASLONG idx_n = n_from; idx_n < tag_n_Nx; idx_n += BF16_BLOCK_STEP_N) { in sbgemm_blocking_kernel_tn_alpha() local 1415 for (BLASLONG idx_n = n_from; idx_n < tag_n_Nx; idx_n += BF16_BLOCK_STEP_N) { in sbgemm_blocking_kernel_tn_alpha() local [all …]
|
H A D | sbgemv_n_microk_cooperlake_template.c | 143 for (BLASLONG idx_n = 0; idx_n < n; idx_n++) { in sbgemv_kernel_32xN_lda_direct_alpha_beta() local 144 xArray_0 = _mm512_set1_epi16(x[idx_n]); in sbgemv_kernel_32xN_lda_direct_alpha_beta() 146 BF16_MATRIX_LOAD_1x32(matrixArray_seed_0, a, lda, idx_n, idx_m + 0) in sbgemv_kernel_32xN_lda_direct_alpha_beta() 147 BF16_MATRIX_LOAD_1x32(matrixArray_seed_1, a, lda, idx_n, idx_m + 32) in sbgemv_kernel_32xN_lda_direct_alpha_beta() 148 BF16_MATRIX_LOAD_1x32(matrixArray_seed_2, a, lda, idx_n, idx_m + 64) in sbgemv_kernel_32xN_lda_direct_alpha_beta() 149 BF16_MATRIX_LOAD_1x32(matrixArray_seed_3, a, lda, idx_n, idx_m + 96) in sbgemv_kernel_32xN_lda_direct_alpha_beta() 192 for (BLASLONG idx_n = 0; idx_n < n; idx_n++) { in sbgemv_kernel_32xN_lda_direct_alpha_beta() local 193 xArray_0 = _mm512_set1_epi16(x[idx_n]); in sbgemv_kernel_32xN_lda_direct_alpha_beta() 195 BF16_MATRIX_LOAD_1x32(matrixArray_seed_0, a, lda, idx_n, idx_m) in sbgemv_kernel_32xN_lda_direct_alpha_beta() 220 for (BLASLONG idx_n = 0; idx_n < n; idx_n++) { in sbgemv_kernel_32xN_lda_direct_alpha_beta() local [all …]
|
H A D | sbgemv_t_microk_cooperlake_template.c | 2715 for (long idx_n = 0; idx_n < tag_n_128x; idx_n += 128) { in sbgemv_kernel_1x128_lda_direct_alpha_beta() local 2733 for (long idx_n = tag_n_128x; idx_n < tag_n_32x; idx_n += 32) { in sbgemv_kernel_1x128_lda_direct_alpha_beta() local 2735 BF16_VECTOR_LOAD_1x32(xArray_0, x, idx_n) in sbgemv_kernel_1x128_lda_direct_alpha_beta() 2773 for (long idx_n = 0; idx_n < tag_n_128x; idx_n += 128) { in sbgemv_kernel_1x128_lda_direct_alpha_beta() local 2779 BF16_VECTOR_LOAD_1x32(xArray_0, x, idx_n + 0) in sbgemv_kernel_1x128_lda_direct_alpha_beta() 2791 for (long idx_n = tag_n_128x; idx_n < tag_n_32x; idx_n += 32) { in sbgemv_kernel_1x128_lda_direct_alpha_beta() local 2793 BF16_VECTOR_LOAD_1x32(xArray_0, x, idx_n) in sbgemv_kernel_1x128_lda_direct_alpha_beta() 2887 for (BLASLONG idx_n = 0; idx_n < tag_n_32x; idx_n+=32) { in sbgemv_kernel_8x32_lda_direct_alpha_beta() local 2892 BF16_VECTOR_LOAD_1x32(xArray_0, x, idx_n) in sbgemv_kernel_8x32_lda_direct_alpha_beta() 2927 for (BLASLONG idx_n = 0; idx_n < tag_n_32x; idx_n+=32) { in sbgemv_kernel_8x32_lda_direct_alpha_beta() local [all …]
|
/dports/cad/horizon-eda/horizon-2.1.0/3rd_party/router/router/ |
H A D | pns_index.cpp | 40 int idx_n = -1; in getSubindex() local 47 idx_n = SI_Multilayer; in getSubindex() 53 idx_n = SI_Multilayer; in getSubindex() 55 idx_n = SI_PadsTop; in getSubindex() 57 idx_n = SI_PadsBottom; in getSubindex() 72 if( idx_n < 0 || idx_n >= MaxSubIndices ) in getSubindex() 74 assert( idx_n >= 0 ); in getSubindex() 75 assert( idx_n < MaxSubIndices ); in getSubindex() 79 if( !m_subIndices[idx_n] ) in getSubindex() 80 m_subIndices[idx_n] = new ITEM_SHAPE_INDEX; in getSubindex() [all …]
|
/dports/math/tblis/tblis-1.2.0/src/external/tci/tci/ |
H A D | communicator.c | 201 unsigned idx_n = idx / m; in tci_distribute_2d() local 209 uint64_t nfirst = (idx_n*ngrain)/n; in tci_distribute_2d() 211 uint64_t nlast = ((idx_n+1)*ngrain)/n; in tci_distribute_2d() 270 for (unsigned idx_n = 0;idx_n < n;idx_n++) in tci_distribute_2d() local 273 [&,idx_m,idx_n] in tci_distribute_2d() 344 for (uint64_t idx_n = 0;idx_n < n;idx_n++) in tci_distribute_2d() local 398 unsigned idx_n = idx / data->m; in tci_distribute_2d_func() local 403 uint64_t nfirst = (idx_n*ngrain)/data->n; in tci_distribute_2d_func() 509 unsigned idx_n = idx / m; in tci_distribute_2d() 512 uint64_t nfirst = (idx_n*ngrain)/n; in tci_distribute_2d() [all …]
|
/dports/net-im/libsignal-client/libsignal-client-0.9.6/cargo-crates/blake2-0.9.2/src/simd/ |
H A D | simd_opt.rs | 11 ($tmp:ident, $shuffle:ident, $vec:expr, $idx_n:expr, $idx:expr) => { 17 const IDX: [u32; $idx_n] = $idx;
|
/dports/net-p2p/bitcoin-utils/bitcoin-22.0/src/secp256k1/src/ |
H A D | ecmult_const_impl.h | 21 int idx_n = abs_n >> 1; \ 35 secp256k1_fe_cmov(&(r)->x, &(pre)[m].x, m == idx_n); \ 36 secp256k1_fe_cmov(&(r)->y, &(pre)[m].y, m == idx_n); \
|
/dports/net-p2p/bitcoin/bitcoin-22.0/src/secp256k1/src/ |
H A D | ecmult_const_impl.h | 21 int idx_n = abs_n >> 1; \ 35 secp256k1_fe_cmov(&(r)->x, &(pre)[m].x, m == idx_n); \ 36 secp256k1_fe_cmov(&(r)->y, &(pre)[m].y, m == idx_n); \
|
/dports/net-p2p/bitcoin-daemon/bitcoin-22.0/src/secp256k1/src/ |
H A D | ecmult_const_impl.h | 21 int idx_n = abs_n >> 1; \ 35 secp256k1_fe_cmov(&(r)->x, &(pre)[m].x, m == idx_n); \ 36 secp256k1_fe_cmov(&(r)->y, &(pre)[m].y, m == idx_n); \
|
/dports/net-p2p/litecoin-daemon/litecoin-0.18.1/src/secp256k1/src/ |
H A D | ecmult_const_impl.h | 26 int idx_n = abs_n / 2; \ 36 secp256k1_fe_cmov(&(r)->x, &(pre)[m].x, m == idx_n); \ 37 secp256k1_fe_cmov(&(r)->y, &(pre)[m].y, m == idx_n); \
|
/dports/net-p2p/litecoin-utils/litecoin-0.18.1/src/secp256k1/src/ |
H A D | ecmult_const_impl.h | 26 int idx_n = abs_n / 2; \ 36 secp256k1_fe_cmov(&(r)->x, &(pre)[m].x, m == idx_n); \ 37 secp256k1_fe_cmov(&(r)->y, &(pre)[m].y, m == idx_n); \
|
/dports/net-p2p/zetacoin-utils/zetacoin-0.13.2.1/src/secp256k1/src/ |
H A D | ecmult_const_impl.h | 26 int idx_n = abs_n / 2; \ 36 secp256k1_fe_cmov(&(r)->x, &(pre)[m].x, m == idx_n); \ 37 secp256k1_fe_cmov(&(r)->y, &(pre)[m].y, m == idx_n); \
|
/dports/net-p2p/qtum/qtum-mainnet-fastlane-v0.20.3/src/secp256k1/src/ |
H A D | ecmult_const_impl.h | 19 int idx_n = abs_n / 2; \ 29 secp256k1_fe_cmov(&(r)->x, &(pre)[m].x, m == idx_n); \ 30 secp256k1_fe_cmov(&(r)->y, &(pre)[m].y, m == idx_n); \
|
/dports/net-p2p/namecoin/namecoin-core-nc0.21.0.1/src/secp256k1/src/ |
H A D | ecmult_const_impl.h | 21 int idx_n = abs_n >> 1; \ 35 secp256k1_fe_cmov(&(r)->x, &(pre)[m].x, m == idx_n); \ 36 secp256k1_fe_cmov(&(r)->y, &(pre)[m].y, m == idx_n); \
|
/dports/net-p2p/namecoin-daemon/namecoin-core-nc0.21.0.1/src/secp256k1/src/ |
H A D | ecmult_const_impl.h | 21 int idx_n = abs_n >> 1; \ 35 secp256k1_fe_cmov(&(r)->x, &(pre)[m].x, m == idx_n); \ 36 secp256k1_fe_cmov(&(r)->y, &(pre)[m].y, m == idx_n); \
|
/dports/math/secp256k1/secp256k1-aa15154/src/ |
H A D | ecmult_const_impl.h | 19 int idx_n = abs_n / 2; \ 29 secp256k1_fe_cmov(&(r)->x, &(pre)[m].x, m == idx_n); \ 30 secp256k1_fe_cmov(&(r)->y, &(pre)[m].y, m == idx_n); \
|
/dports/security/john/john-1.9.0-jumbo-1/src/secp256k1/ |
H A D | ecmult_const_impl.h | 26 int idx_n = abs_n / 2; \ 36 secp256k1_fe_cmov(&(r)->x, &(pre)[m].x, m == idx_n); \ 37 secp256k1_fe_cmov(&(r)->y, &(pre)[m].y, m == idx_n); \
|
/dports/net-p2p/go-ethereum/go-ethereum-1.10.14/vendor/github.com/status-im/keycard-go/vendor/github.com/ethereum/go-ethereum/crypto/secp256k1/libsecp256k1/src/ |
H A D | ecmult_const_impl.h | 26 int idx_n = abs_n / 2; \ 36 secp256k1_fe_cmov(&(r)->x, &(pre)[m].x, m == idx_n); \ 37 secp256k1_fe_cmov(&(r)->y, &(pre)[m].y, m == idx_n); \
|
/dports/net-p2p/zetacoin/zetacoin-0.13.2.1/src/secp256k1/src/ |
H A D | ecmult_const_impl.h | 26 int idx_n = abs_n / 2; \ 36 secp256k1_fe_cmov(&(r)->x, &(pre)[m].x, m == idx_n); \ 37 secp256k1_fe_cmov(&(r)->y, &(pre)[m].y, m == idx_n); \
|
/dports/net-p2p/zetacoin-daemon/zetacoin-0.13.2.1/src/secp256k1/src/ |
H A D | ecmult_const_impl.h | 26 int idx_n = abs_n / 2; \ 36 secp256k1_fe_cmov(&(r)->x, &(pre)[m].x, m == idx_n); \ 37 secp256k1_fe_cmov(&(r)->y, &(pre)[m].y, m == idx_n); \
|
/dports/net-p2p/namecoin-utils/namecoin-core-nc0.21.0.1/src/secp256k1/src/ |
H A D | ecmult_const_impl.h | 21 int idx_n = abs_n >> 1; \ 35 secp256k1_fe_cmov(&(r)->x, &(pre)[m].x, m == idx_n); \ 36 secp256k1_fe_cmov(&(r)->y, &(pre)[m].y, m == idx_n); \
|
/dports/net-p2p/litecoin/litecoin-0.18.1/src/secp256k1/src/ |
H A D | ecmult_const_impl.h | 26 int idx_n = abs_n / 2; \ 36 secp256k1_fe_cmov(&(r)->x, &(pre)[m].x, m == idx_n); \ 37 secp256k1_fe_cmov(&(r)->y, &(pre)[m].y, m == idx_n); \
|
/dports/net-p2p/c-lightning/lightning-0.10.2/external/libwally-core/src/secp256k1/src/ |
H A D | ecmult_const_impl.h | 21 int idx_n = abs_n >> 1; \ 35 secp256k1_fe_cmov(&(r)->x, &(pre)[m].x, m == idx_n); \ 36 secp256k1_fe_cmov(&(r)->y, &(pre)[m].y, m == idx_n); \
|