/dports/misc/mxnet/incubator-mxnet-1.9.0/3rdparty/mkldnn/src/cpu/x64/ |
H A D | jit_sse41_conv_kernel_f32.hpp | 61 reg64_t reg_oc_blocks = r14; member 62 reg64_t imm_addr64 = reg_oc_blocks;
|
H A D | jit_avx512_core_amx_1x1_conv_kernel.hpp | 87 const Xbyak::Reg64 &reg_oc_blocks = rdx; member 94 const Xbyak::Reg64 &reg_src_zero_point = reg_oc_blocks;
|
H A D | jit_sse41_conv_kernel_f32.cpp | 362 mov(reg_oc_blocks, ptr[this->param1 + GET_OFF(oc_blocks)]); in generate() 367 cmp(reg_oc_blocks, jcp.nb_oc_blocking); in generate() 375 cmp(reg_oc_blocks, nb_oc_tail); in generate()
|
H A D | jit_uni_x8s8s32x_conv_kernel.hpp | 79 const Xbyak::Reg64 reg_oc_blocks = rsi; member
|
H A D | jit_avx512_core_x8s8s32x_conv_kernel.hpp | 88 const Xbyak::Reg64 reg_oc_blocks = rsi; member
|
H A D | jit_avx512_core_x8s8s32x_deconvolution.hpp | 100 const Xbyak::Reg64 reg_oc_blocks = rsi; member
|
H A D | jit_avx512_core_amx_conv_kernel.hpp | 64 const reg64_t reg_oc_blocks = r12; member 323 const Xbyak::Reg64 &reg_oc_blocks = rax; member
|
H A D | jit_uni_x8s8s32x_conv_kernel.cpp | 805 cmp(reg_oc_blocks, jcp.nb_ch - jcp.nb_ch_blocking); in icb_loop() 844 cmp(reg_oc_blocks, jcp.nb_ch - jcp.nb_ch_blocking); in icb_loop() 846 cmp(reg_oc_blocks, jcp.nb_oc - jcp.nb_oc_blocking); in icb_loop() 921 mov(reg_oc_blocks, ptr[param1 + GET_OFF(oc_blocks)]); in generate()
|
H A D | jit_avx2_conv_kernel_f32.cpp | 271 push(reg_oc_blocks); in width_blk_step() 491 if (oc_tail) pop(reg_oc_blocks); in width_blk_step() 552 mov(reg_oc_blocks, ptr[this->param1 + GET_OFF(oc_blocks)]); in generate() 562 cmp(reg_oc_blocks, jcp.nb_oc_blocking); in generate() 570 cmp(reg_oc_blocks, nb_oc_tail); in generate()
|
H A D | jit_avx512_core_x8s8s32x_conv_kernel.cpp | 835 cmp(reg_oc_blocks, jcp.nb_ch - jcp.nb_ch_blocking); in icb_loop() 874 cmp(reg_oc_blocks, jcp.nb_ch - jcp.nb_ch_blocking); in icb_loop() 876 cmp(reg_oc_blocks, jcp.nb_oc - jcp.nb_oc_blocking); in icb_loop() 955 mov(reg_oc_blocks, ptr[param1 + GET_OFF(oc_blocks)]); in generate()
|
/dports/math/onednn/oneDNN-2.5.1/src/cpu/x64/ |
H A D | jit_sse41_conv_kernel_f32.hpp | 61 reg64_t reg_oc_blocks = r14; member 62 reg64_t imm_addr64 = reg_oc_blocks;
|
H A D | jit_avx512_core_amx_1x1_conv_kernel.hpp | 88 const Xbyak::Reg64 &reg_oc_blocks = rdx; member 95 const Xbyak::Reg64 &reg_src_zero_point = reg_oc_blocks;
|
H A D | jit_sse41_conv_kernel_f32.cpp | 355 mov(reg_oc_blocks, ptr[this->param1 + GET_OFF(oc_blocks)]); in generate() 360 cmp(reg_oc_blocks, jcp.nb_oc_blocking); in generate() 368 cmp(reg_oc_blocks, nb_oc_tail); in generate()
|
H A D | jit_uni_x8s8s32x_conv_kernel.hpp | 80 const Xbyak::Reg64 reg_oc_blocks = rsi; member
|
H A D | jit_avx512_core_x8s8s32x_conv_kernel.hpp | 89 const Xbyak::Reg64 reg_oc_blocks = rsi; member
|
H A D | jit_avx512_core_x8s8s32x_deconvolution.cpp | 431 cmp(reg_oc_blocks, jcp.nb_ch - 1); in apply_zp_src_pad_str_comp() 433 cmp(reg_oc_blocks, jcp.nb_oc - jcp.nb_oc_blocking); in apply_zp_src_pad_str_comp() 1129 mov(reg_oc_blocks, ptr[param1 + GET_OFF(oc_blocks)]); in icb_loop() 1171 mov(reg_oc_blocks, ptr[param1 + GET_OFF(oc_blocks)]); in icb_loop() 1173 cmp(reg_oc_blocks, jcp.nb_ch - 1); in icb_loop() 1175 cmp(reg_oc_blocks, jcp.nb_oc - jcp.nb_oc_blocking); in icb_loop()
|
H A D | jit_avx512_core_amx_conv_kernel.hpp | 64 const reg64_t reg_oc_blocks = r12; member 324 const Xbyak::Reg64 &reg_oc_blocks = rax; member
|
H A D | jit_avx512_core_x8s8s32x_deconvolution.hpp | 103 const Xbyak::Reg64 reg_oc_blocks = rsi; member
|
H A D | jit_avx2_conv_kernel_f32.cpp | 260 push(reg_oc_blocks); in width_blk_step() 480 if (oc_tail) pop(reg_oc_blocks); in width_blk_step() 541 mov(reg_oc_blocks, ptr[this->param1 + GET_OFF(oc_blocks)]); in generate() 551 cmp(reg_oc_blocks, jcp.nb_oc_blocking); in generate() 559 cmp(reg_oc_blocks, nb_oc_tail); in generate()
|
H A D | jit_uni_x8s8s32x_conv_kernel.cpp | 822 cmp(reg_oc_blocks, jcp.nb_ch - jcp.nb_ch_blocking); in icb_loop() 861 cmp(reg_oc_blocks, jcp.nb_ch - jcp.nb_ch_blocking); in icb_loop() 863 cmp(reg_oc_blocks, jcp.nb_oc - jcp.nb_oc_blocking); in icb_loop() 938 mov(reg_oc_blocks, ptr[param1 + GET_OFF(oc_blocks)]); in generate()
|
H A D | jit_avx512_core_x8s8s32x_conv_kernel.cpp | 837 cmp(reg_oc_blocks, jcp.nb_ch - jcp.nb_ch_blocking); in icb_loop() 876 cmp(reg_oc_blocks, jcp.nb_ch - jcp.nb_ch_blocking); in icb_loop() 878 cmp(reg_oc_blocks, jcp.nb_oc - jcp.nb_oc_blocking); in icb_loop() 957 mov(reg_oc_blocks, ptr[param1 + GET_OFF(oc_blocks)]); in generate()
|
/dports/misc/mxnet/incubator-mxnet-1.9.0/3rdparty/mkldnn/src/cpu/aarch64/ |
H A D | jit_sve_512_x8s8s32x_conv_kernel.hpp | 101 const XReg reg_oc_blocks = x6; member
|
H A D | jit_sve_512_x8s8s32x_conv_kernel.cpp | 814 cmp(reg_oc_blocks, jcp.nb_ch - jcp.nb_ch_blocking); in icb_loop() 849 cmp(reg_oc_blocks, jcp.nb_ch - jcp.nb_ch_blocking); in icb_loop() 851 cmp(reg_oc_blocks, jcp.nb_oc - jcp.nb_oc_blocking); in icb_loop() 946 ldr(reg_oc_blocks, ptr(reg_param1, GET_OFF(oc_blocks))); in generate()
|
/dports/math/onednn/oneDNN-2.5.1/src/cpu/aarch64/ |
H A D | jit_sve_512_x8s8s32x_conv_kernel.hpp | 101 const XReg reg_oc_blocks = x6; member
|
H A D | jit_sve_512_x8s8s32x_conv_kernel.cpp | 814 cmp(reg_oc_blocks, jcp.nb_ch - jcp.nb_ch_blocking); in icb_loop() 849 cmp(reg_oc_blocks, jcp.nb_ch - jcp.nb_ch_blocking); in icb_loop() 851 cmp(reg_oc_blocks, jcp.nb_oc - jcp.nb_oc_blocking); in icb_loop() 946 ldr(reg_oc_blocks, ptr(reg_param1, GET_OFF(oc_blocks))); in generate()
|