/dports/misc/mxnet/incubator-mxnet-1.9.0/3rdparty/mkldnn/src/cpu/x64/injectors/ |
H A D | jit_uni_eltwise_injector.hpp | 40 Xbyak::Opmask k_mask = Xbyak::Opmask(1), bool is_fwd = true, in static_params_t() 44 , k_mask(k_mask) in static_params_t() 50 Xbyak::Opmask k_mask; member 91 Xbyak::Opmask k_mask = Xbyak::Opmask(1), bool is_fwd = true, in jit_uni_eltwise_injector_f32() 100 , k_mask(k_mask) in jit_uni_eltwise_injector_f32() 111 Xbyak::Opmask k_mask = Xbyak::Opmask(1), bool is_fwd = true, in jit_uni_eltwise_injector_f32() 114 eltwise.beta, eltwise.scale, save_state, p_table, k_mask, in jit_uni_eltwise_injector_f32() 133 const Xbyak::Opmask k_mask; member
|
/dports/math/onednn/oneDNN-2.5.1/src/cpu/x64/injectors/ |
H A D | jit_uni_eltwise_injector.hpp | 41 Xbyak::Opmask k_mask = Xbyak::Opmask(1), bool is_fwd = true, in static_params_t() 45 , k_mask(k_mask) in static_params_t() 51 Xbyak::Opmask k_mask; member 94 Xbyak::Opmask k_mask = Xbyak::Opmask(1), bool is_fwd = true, in jit_uni_eltwise_injector_f32() 103 , k_mask(k_mask) in jit_uni_eltwise_injector_f32() 114 Xbyak::Opmask k_mask = Xbyak::Opmask(1), bool is_fwd = true, in jit_uni_eltwise_injector_f32() 117 eltwise.beta, eltwise.scale, save_state, p_table, k_mask, in jit_uni_eltwise_injector_f32() 136 const Xbyak::Opmask k_mask; member
|
/dports/math/onednn/oneDNN-2.5.1/src/cpu/x64/brgemm/ |
H A D | jit_brdgmm_kernel.cpp | 56 static_cast<size_t>(n_vlen_tail()), k_mask, in jit_brdgmm_kernel_base_t() 75 return mask_flag ? (store ? vmm_in | k_mask : vmm_in | k_mask | T_z) in vmm_mask() 81 return mask_flag ? (store ? wmm_in | k_mask : wmm_in | k_mask | T_z) in wmm_mask() 649 kmovd(k_mask, k_tail_mask); in compute_loop() 689 if (reset_mask) kxnorq(k_mask, k_mask, k_mask); in compute_loop() 712 if (reset_mask) { kxnorq(k_mask, k_mask, k_mask); } in compute_loop() 741 kmovq(k_mask, reg_tmp); in generate() 750 kxnorq(k_mask, k_mask, k_mask); in generate()
|
H A D | jit_brgemm_amx_uker.cpp | 488 auto k_mask = (!is_ld_tail) ? ld_full_mask : ld_tail_mask; in apply_alpha_beta_to_vector() local 515 auto zmm_masked = zmm | k_mask | T_z; in apply_alpha_beta_to_vector() 521 cvt2ps(brg.dt_c, zmm_prev_dst, addr, true, false, k_mask); in apply_alpha_beta_to_vector() 565 const auto k_mask = (!is_ld_tail) ? ld_full_mask : ld_tail_mask; in apply_post_ops_to_vector() local 568 cvt2ps(brg.sum_dt, zmm_prev_dst, addr, true, false, k_mask); in apply_post_ops_to_vector() 590 auto k_mask = (!is_ld_tail) ? ld_full_mask : ld_tail_mask; in store_vector_with_post_ops() local 607 cvt2ps(brg.dt_bias, zmm_bias, ptr_bias, true, false, k_mask); in store_vector_with_post_ops() 619 k_mask); in store_vector_with_post_ops() 637 const Xbyak::Zmm scaled_zmm = zmm_mask(zmm, true, false, k_mask); in store_vector_with_post_ops() 675 const Xbyak::Zmm r_zmm = zmm_mask(zmm, true, true, k_mask); in store_vector_with_post_ops() [all …]
|
/dports/math/ntl/ntl-11.5.1/src/ |
H A D | mat_GF2.cpp | 179 _ntl_ulong k_mask = 1UL << bk; in determinant() local 183 if (M[i].rep.elts()[wk] & k_mask) { in determinant() 200 if (M[i].rep.elts()[wk] & k_mask) { in determinant() 357 _ntl_ulong k_mask = 1UL << bk; in solve_impl() local 361 if (M[i].rep.elts()[wk] & k_mask) { in solve_impl() 377 if (M[i].rep.elts()[wk] & k_mask) { in solve_impl() 451 _ntl_ulong k_mask = 1UL << bk; in inv() local 455 if (M[i].rep.elts()[wk] & k_mask) { in inv() 471 if (M[i].rep.elts()[wk] & k_mask) { in inv() 532 _ntl_ulong k_mask = 1UL << bk; in gauss() local [all …]
|
/dports/multimedia/v4l_compat/linux-5.13-rc2/fs/orangefs/ |
H A D | orangefs-debugfs.c | 739 static void do_k_string(void *k_mask, int index) in do_k_string() argument 741 __u64 *mask = (__u64 *) k_mask; in do_k_string() 808 __u64 *k_mask; in check_amalgam_keyword() local 831 k_mask = (__u64 *) mask; in check_amalgam_keyword() 833 if (*k_mask >= s_kmod_keyword_mask_map[k_all_index].mask_val) { in check_amalgam_keyword() 857 __u64 *k_mask = NULL; in debug_string_to_mask() local 865 k_mask = (__u64 *)mask; in debug_string_to_mask() 866 *k_mask = 0; in debug_string_to_mask() 881 &k_mask); in debug_string_to_mask()
|
/dports/multimedia/libv4l/linux-5.13-rc2/fs/orangefs/ |
H A D | orangefs-debugfs.c | 739 static void do_k_string(void *k_mask, int index) in do_k_string() argument 741 __u64 *mask = (__u64 *) k_mask; in do_k_string() 808 __u64 *k_mask; in check_amalgam_keyword() local 831 k_mask = (__u64 *) mask; in check_amalgam_keyword() 833 if (*k_mask >= s_kmod_keyword_mask_map[k_all_index].mask_val) { in check_amalgam_keyword() 857 __u64 *k_mask = NULL; in debug_string_to_mask() local 865 k_mask = (__u64 *)mask; in debug_string_to_mask() 866 *k_mask = 0; in debug_string_to_mask() 881 &k_mask); in debug_string_to_mask()
|
/dports/multimedia/v4l-utils/linux-5.13-rc2/fs/orangefs/ |
H A D | orangefs-debugfs.c | 739 static void do_k_string(void *k_mask, int index) in do_k_string() argument 741 __u64 *mask = (__u64 *) k_mask; in do_k_string() 808 __u64 *k_mask; in check_amalgam_keyword() local 831 k_mask = (__u64 *) mask; in check_amalgam_keyword() 833 if (*k_mask >= s_kmod_keyword_mask_map[k_all_index].mask_val) { in check_amalgam_keyword() 857 __u64 *k_mask = NULL; in debug_string_to_mask() local 865 k_mask = (__u64 *)mask; in debug_string_to_mask() 866 *k_mask = 0; in debug_string_to_mask() 881 &k_mask); in debug_string_to_mask()
|
/dports/misc/mxnet/incubator-mxnet-1.9.0/3rdparty/mkldnn/src/cpu/x64/ |
H A D | jit_avx512_core_bf16_sum.cpp | 148 kmovd(k_mask, reg32_mask); in generate() 162 vmovdqu16(vysrc0 | k_mask | T_z, yword[reg_src[isrc0]]); in generate() 165 vmovdqu16(vysrc1 | k_mask | T_z, yword[reg_src[isrc1]]); in generate() 176 vmovups(zword[reg_dst] | k_mask, vacc); in generate() 181 vmovdqu16(yword[reg_dst] | k_mask, ymm_str); in generate() 185 vmovdqu16(yword[reg_dst] | k_mask, ymm_str); in generate()
|
H A D | jit_brgemm_post_ops.hpp | 408 const auto k_mask = tail == 0 ? k_full_mask : k_tail_mask; in inject_attr_postops() local 422 cvt2ps(out_dt_, zmm_prev_dst, addr, true, false, k_mask); in inject_attr_postops() 457 auto k_mask = (tail == 0) ? k_full_mask : k_tail_mask; in apply_post_ops() local 474 cvt2ps(inp_dt_, vector(m, n), inp_addr, true, false, k_mask); in apply_post_ops() 485 cvt2ps(bia_dt_, zmm_bias, bias_addr, true, false, k_mask); in apply_post_ops() 494 = zmm_mask(vector(m, n), true, false, k_mask); in apply_post_ops() 525 const Xbyak::Ymm r_ymm = ymm_mask(ymm, true, true, k_mask); in apply_post_ops() 533 const Xbyak::Zmm r_zmm = zmm_mask(zmm, true, true, k_mask); in apply_post_ops()
|
/dports/math/onednn/oneDNN-2.5.1/src/cpu/x64/ |
H A D | jit_avx512_core_bf16_sum.cpp | 148 kmovd(k_mask, reg32_mask); in generate() 162 vmovdqu16(vysrc0 | k_mask | T_z, yword[reg_src[isrc0]]); in generate() 165 vmovdqu16(vysrc1 | k_mask | T_z, yword[reg_src[isrc1]]); in generate() 176 vmovups(zword[reg_dst] | k_mask, vacc); in generate() 181 vmovdqu16(yword[reg_dst] | k_mask, ymm_str); in generate() 185 vmovdqu16(yword[reg_dst] | k_mask, ymm_str); in generate()
|
H A D | jit_brgemm_post_ops.hpp | 410 const auto k_mask = tail == 0 ? k_full_mask : k_tail_mask; in inject_attr_postops() local 431 cvt2ps(sum_dt, zmm_prev_dst, addr, true, false, k_mask); in inject_attr_postops() 468 auto k_mask = (tail == 0) ? k_full_mask : k_tail_mask; in apply_post_ops() local 485 cvt2ps(inp_dt_, vector(m, n), inp_addr, true, false, k_mask); in apply_post_ops() 496 cvt2ps(bia_dt_, zmm_bias, bias_addr, true, false, k_mask); in apply_post_ops() 505 = zmm_mask(vector(m, n), true, false, k_mask); in apply_post_ops() 536 const Xbyak::Ymm r_ymm = ymm_mask(ymm, true, true, k_mask); in apply_post_ops() 544 const Xbyak::Zmm r_zmm = zmm_mask(zmm, true, true, k_mask); in apply_post_ops()
|
/dports/science/lammps/lammps-stable_29Sep2021/src/KOKKOS/ |
H A D | compute_temp_deform_kokkos.cpp | 73 mask = atomKK->k_mask.view<DeviceType>(); in compute_scalar() 142 mask = atomKK->k_mask.view<DeviceType>(); in compute_vector() 207 mask = atomKK->k_mask.view<DeviceType>(); in remove_bias_all() 247 mask = atomKK->k_mask.view<DeviceType>(); in restore_bias_all()
|
H A D | atom_vec_atomic_kokkos.cpp | 70 memoryKK->grow_kokkos(atomKK->k_mask,atomKK->mask,nmax,"atom:mask"); in grow() 99 d_mask = atomKK->k_mask.d_view; in grow_pointers() 100 h_mask = atomKK->k_mask.h_view; in grow_pointers() 501 _mask(atom->k_mask.view<DeviceType>()), in AtomVecAtomicKokkos_PackExchangeFunctor() 507 _maskw(atom->k_mask.view<DeviceType>()), in AtomVecAtomicKokkos_PackExchangeFunctor() 620 _mask(atom->k_mask.view<DeviceType>()), in AtomVecAtomicKokkos_UnpackExchangeFunctor() 911 if (mask & MASK_MASK) atomKK->k_mask.sync<LMPDeviceType>(); in sync() 919 if (mask & MASK_MASK) atomKK->k_mask.sync<LMPHostType>(); in sync() 940 perform_async_copy<DAT::tdual_int_1d>(atomKK->k_mask,space); in sync_overlapping_device() 971 if (mask & MASK_MASK) atomKK->k_mask.modify<LMPDeviceType>(); in modified() [all …]
|
H A D | atom_vec_sphere_kokkos.cpp | 139 d_mask = atomKK->k_mask.d_view; in grow_pointers() 140 h_mask = atomKK->k_mask.h_view; in grow_pointers() 472 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() 557 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() 566 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() 577 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() 586 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() 688 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() 697 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() 708 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() [all …]
|
H A D | atom_vec_charge_kokkos.cpp | 73 memoryKK->grow_kokkos(atomKK->k_mask,atomKK->mask,nmax,"atom:mask"); in grow() 104 d_mask = atomKK->k_mask.d_view; in grow_pointers() 105 h_mask = atomKK->k_mask.h_view; in grow_pointers() 610 _mask(atom->k_mask.view<DeviceType>()), in AtomVecChargeKokkos_PackExchangeFunctor() 617 _maskw(atom->k_mask.view<DeviceType>()), in AtomVecChargeKokkos_PackExchangeFunctor() 741 _mask(atom->k_mask.view<DeviceType>()), in AtomVecChargeKokkos_UnpackExchangeFunctor() 1079 if (mask & MASK_MASK) atomKK->k_mask.sync<LMPDeviceType>(); in sync() 1088 if (mask & MASK_MASK) atomKK->k_mask.sync<LMPHostType>(); in sync() 1104 if (mask & MASK_MASK) atomKK->k_mask.modify<LMPDeviceType>(); in modified() 1113 if (mask & MASK_MASK) atomKK->k_mask.modify<LMPHostType>(); in modified() [all …]
|
H A D | atom_vec_kokkos.cpp | 540 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() 548 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() 558 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() 566 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() 577 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() 585 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() 599 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() 607 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() 617 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() 636 atomKK->k_x,atomKK->k_mask, in pack_comm_vel_kokkos() [all …]
|
H A D | atom_vec_spin_kokkos.cpp | 86 memoryKK->grow_kokkos(atomKK->k_mask,atomKK->mask,nmax,"atom:mask"); in grow() 123 d_mask = atomKK->k_mask.d_view; in grow_pointers() 124 h_mask = atomKK->k_mask.h_view; in grow_pointers() 687 _mask(atom->k_mask.view<DeviceType>()), in AtomVecSpinKokkos_PackExchangeFunctor() 694 _maskw(atom->k_mask.view<DeviceType>()), in AtomVecSpinKokkos_PackExchangeFunctor() 827 _mask(atom->k_mask.view<DeviceType>()), in AtomVecSpinKokkos_UnpackExchangeFunctor() 1208 if (mask & MASK_MASK) atomKK->k_mask.sync<LMPDeviceType>(); in sync() 1219 if (mask & MASK_MASK) atomKK->k_mask.sync<LMPHostType>(); in sync() 1237 if (mask & MASK_MASK) atomKK->k_mask.modify<LMPDeviceType>(); in modified() 1248 if (mask & MASK_MASK) atomKK->k_mask.modify<LMPHostType>(); in modified() [all …]
|
H A D | fix_nve_sphere_kokkos.cpp | 71 mask = atomKK->k_mask.view<DeviceType>(); in initial_integrate() 119 mask = atomKK->k_mask.view<DeviceType>(); in final_integrate()
|
H A D | compute_temp_kokkos.cpp | 58 mask = atomKK->k_mask.view<DeviceType>(); in compute_scalar() 113 mask = atomKK->k_mask.view<DeviceType>(); in compute_vector()
|
H A D | atom_vec_bond_kokkos.cpp | 73 memoryKK->grow_kokkos(atomKK->k_mask,atomKK->mask,nmax,"atom:mask"); in grow() 109 d_mask = atomKK->k_mask.d_view; in grow_pointers() 110 h_mask = atomKK->k_mask.h_view; in grow_pointers() 606 _mask(atom->k_mask.view<DeviceType>()), in AtomVecBondKokkos_PackExchangeFunctor() 618 _maskw(atom->k_mask.view<DeviceType>()), in AtomVecBondKokkos_PackExchangeFunctor() 793 _mask(atom->k_mask.view<DeviceType>()), in AtomVecBondKokkos_UnpackExchangeFunctor() 1191 if (mask & MASK_MASK) atomKK->k_mask.sync<LMPDeviceType>(); in sync() 1209 if (mask & MASK_MASK) atomKK->k_mask.sync<LMPHostType>(); in sync() 1240 perform_async_copy<DAT::tdual_int_1d>(atomKK->k_mask,space); in sync_overlapping_device() 1303 if (mask & MASK_MASK) atomKK->k_mask.modify<LMPDeviceType>(); in modified() [all …]
|
H A D | fix_nve_kokkos.cpp | 66 mask = atomKK->k_mask.view<DeviceType>(); in initial_integrate() 122 mask = atomKK->k_mask.view<DeviceType>(); in final_integrate()
|
/dports/multimedia/libv4l/linux-5.13-rc2/drivers/clk/sunxi-ng/ |
H A D | ccu_nkmp.c | 167 u32 n_mask = 0, k_mask = 0, m_mask = 0, p_mask = 0; in ccu_nkmp_set_rate() local 196 k_mask = GENMASK(nkmp->k.width + nkmp->k.shift - 1, in ccu_nkmp_set_rate() 208 reg &= ~(n_mask | k_mask | m_mask | p_mask); in ccu_nkmp_set_rate() 211 reg |= ((_nkmp.k - nkmp->k.offset) << nkmp->k.shift) & k_mask; in ccu_nkmp_set_rate()
|
/dports/multimedia/v4l-utils/linux-5.13-rc2/drivers/clk/sunxi-ng/ |
H A D | ccu_nkmp.c | 167 u32 n_mask = 0, k_mask = 0, m_mask = 0, p_mask = 0; in ccu_nkmp_set_rate() local 196 k_mask = GENMASK(nkmp->k.width + nkmp->k.shift - 1, in ccu_nkmp_set_rate() 208 reg &= ~(n_mask | k_mask | m_mask | p_mask); in ccu_nkmp_set_rate() 211 reg |= ((_nkmp.k - nkmp->k.offset) << nkmp->k.shift) & k_mask; in ccu_nkmp_set_rate()
|
/dports/multimedia/v4l_compat/linux-5.13-rc2/drivers/clk/sunxi-ng/ |
H A D | ccu_nkmp.c | 167 u32 n_mask = 0, k_mask = 0, m_mask = 0, p_mask = 0; in ccu_nkmp_set_rate() local 196 k_mask = GENMASK(nkmp->k.width + nkmp->k.shift - 1, in ccu_nkmp_set_rate() 208 reg &= ~(n_mask | k_mask | m_mask | p_mask); in ccu_nkmp_set_rate() 211 reg |= ((_nkmp.k - nkmp->k.offset) << nkmp->k.shift) & k_mask; in ccu_nkmp_set_rate()
|