Searched refs:xmm_scale (Results 1 – 3 of 3) sorted by relevance
/dports/misc/mxnet/incubator-mxnet-1.9.0/3rdparty/mkldnn/src/cpu/x64/ |
H A D | jit_uni_reorder.cpp | 655 uni_vmulps(Xmm(ur), Xmm(ur), xmm_scale); in process_unroll_generic_step() 705 uni_vmulps(Xmm(ur), Xmm(ur), xmm_scale); in process_unroll_generic_step() 719 uni_vbroadcastss(xmm_scale, s_addr(s_off[ur])); in process_unroll_generic_step() 720 uni_vmulps(Xmm(ur), Xmm(ur), xmm_scale); in process_unroll_generic_step() 731 uni_vmovups(xmm_scale, s_addr(s_off[ur])); in process_unroll_generic_step() 732 uni_vmulps(Xmm(ur), Xmm(ur), xmm_scale); in process_unroll_generic_step() 740 uni_vpinsrd(xmm_scale, xmm_scale, s_addr(s_off[r]), in process_unroll_generic_step() 743 uni_vmulps(Xmm(ur), Xmm(ur), xmm_scale); in process_unroll_generic_step() 771 uni_vmulss(Xmm(ur), Xmm(ur), xmm_scale); in process_unroll_generic_step() 976 uni_vbroadcastss(xmm_scale, ptr[reg_ptr_scale_tmp]); in generate() [all …]
|
/dports/misc/mxnet/incubator-mxnet-1.9.0/3rdparty/mkldnn/src/cpu/aarch64/ |
H A D | jit_uni_reorder.cpp | 645 fmul(VReg4S(ur), VReg4S(ur), xmm_scale); in process_unroll_generic_step() 699 fmul(VReg4S(ur), VReg4S(ur), xmm_scale); in process_unroll_generic_step() 712 VReg4S v(xmm_scale.getIdx()); in process_unroll_generic_step() 728 uint32_t idx = xmm_scale.getIdx(); in process_unroll_generic_step() 748 VReg4S v(xmm_scale.getIdx()); in process_unroll_generic_step() 751 fmul(VReg4S(ur), VReg4S(ur), xmm_scale); in process_unroll_generic_step() 810 fmul(tmp, tmp, VReg4S(xmm_scale.getIdx())); in process_unroll_generic_step() 1232 dup(xmm_scale, W_TMP_1); in generate() 1287 VReg4S xmm_scale = v15.s; member
|
/dports/math/onednn/oneDNN-2.5.1/src/cpu/aarch64/ |
H A D | jit_uni_reorder.cpp | 645 fmul(VReg4S(ur), VReg4S(ur), xmm_scale); in process_unroll_generic_step() 699 fmul(VReg4S(ur), VReg4S(ur), xmm_scale); in process_unroll_generic_step() 712 VReg4S v(xmm_scale.getIdx()); in process_unroll_generic_step() 728 uint32_t idx = xmm_scale.getIdx(); in process_unroll_generic_step() 748 VReg4S v(xmm_scale.getIdx()); in process_unroll_generic_step() 751 fmul(VReg4S(ur), VReg4S(ur), xmm_scale); in process_unroll_generic_step() 810 fmul(tmp, tmp, VReg4S(xmm_scale.getIdx())); in process_unroll_generic_step() 1232 dup(xmm_scale, W_TMP_1); in generate() 1287 VReg4S xmm_scale = v15.s; member
|