/dports/misc/mxnet/incubator-mxnet-1.9.0/3rdparty/mkldnn/src/cpu/x64/ |
H A D | jit_avx512_core_bf16_dw_conv_kernel.hpp | 122 std::unique_ptr<bf16_emulation_t> bf16_emu_; member 131 : jcp(ajcp), bf16_emu_(nullptr) { in jit_avx512_dw_conv_bwd_data_kernel_bf16() 134 bf16_emu_ = new bf16_emulation_t(this, bf16_emu_reserv_1, in jit_avx512_dw_conv_bwd_data_kernel_bf16() 139 ~jit_avx512_dw_conv_bwd_data_kernel_bf16() { delete bf16_emu_; } in ~jit_avx512_dw_conv_bwd_data_kernel_bf16() 184 bf16_emulation_t *bf16_emu_; member 208 : jcp(ajcp), bf16_emu_(nullptr) { in jit_avx512_dw_conv_bwd_weights_kernel_bf16() 211 bf16_emu_ = new bf16_emulation_t(this, bf16_emu_reserv_1, in jit_avx512_dw_conv_bwd_weights_kernel_bf16() 216 ~jit_avx512_dw_conv_bwd_weights_kernel_bf16() { delete bf16_emu_; } in ~jit_avx512_dw_conv_bwd_weights_kernel_bf16() 276 bf16_emulation_t *bf16_emu_; member
|
H A D | jit_avx512_core_bf16cvt.hpp | 184 bf16_emu_ = new bf16_emulation_t( in jit_avx512_core_cvt_ps_to_bf16_t() 190 ~jit_avx512_core_cvt_ps_to_bf16_t() { delete bf16_emu_; } in ~jit_avx512_core_cvt_ps_to_bf16_t() 200 bf16_emu_->vcvtneps2bf16(bf16_out, fp32_inp); in generate() 212 if (use_bf16_emu) bf16_emu_->init_vcvtneps2bf16(); in generate() 293 bf16_emulation_t *bf16_emu_; member 345 bf16_emu_ = new bf16_emulation_t( in jit_avx512_core_add_cvt_ps_to_bf16_t() 351 ~jit_avx512_core_add_cvt_ps_to_bf16_t() { delete bf16_emu_; } in ~jit_avx512_core_add_cvt_ps_to_bf16_t() 364 bf16_emu_->vcvtneps2bf16(bf16_out, fp32_inp); in generate() 377 if (use_bf16_emu) bf16_emu_->init_vcvtneps2bf16(); in generate() 424 bf16_emulation_t *bf16_emu_; member
|
H A D | jit_avx512_core_bf16_sum.cpp | 70 bf16_emu_->vdpbf16ps(vacc0, vsrc0, vscale); in loop_iteration() 71 bf16_emu_->vdpbf16ps(vacc1, vsrc1, vscale); in loop_iteration() 88 bf16_emu_->vcvtneps2bf16(ymm_str, vacc0); in loop_iteration() 90 bf16_emu_->vcvtneps2bf16(ymm_str, vacc1); in loop_iteration() 127 if (!isa_has_bf16(jsp.isa)) bf16_emu_->init_vcvtneps2bf16(); in generate() 170 bf16_emu_->vdpbf16ps(vacc, vsrc, vscale); in generate() 184 bf16_emu_->vcvtneps2bf16(ymm_str, vacc); in generate()
|
H A D | jit_avx512_core_bf16_sum.hpp | 52 : jsp(ajsp), bf16_emu_(nullptr) { in jit_avx512_core_bf16_sum_kernel() 54 bf16_emu_ = new bf16_emulation_t(this, bf16_emu_reserved_1, in jit_avx512_core_bf16_sum_kernel() 59 ~jit_avx512_core_bf16_sum_kernel() { delete bf16_emu_; } in ~jit_avx512_core_bf16_sum_kernel() 159 bf16_emulation_t *bf16_emu_; member
|
H A D | jit_avx512_core_bf16_conv_kernel.hpp | 129 std::unique_ptr<bf16_emulation_t> bf16_emu_; member 255 , bf16_emu_(nullptr) { in _jit_avx512_core_bf16_bwd_data_kernel() 257 bf16_emu_ = utils::make_unique<bf16_emulation_t>(this, in _jit_avx512_core_bf16_bwd_data_kernel() 341 std::unique_ptr<bf16_emulation_t> bf16_emu_; member 463 , bf16_emu_(nullptr) { in jit_avx512_core_bf16_conv_bwd_weights_kernel_f32() 465 bf16_emu_ = utils::make_unique<bf16_emulation_t>( in jit_avx512_core_bf16_conv_bwd_weights_kernel_f32() 695 std::unique_ptr<bf16_emulation_t> bf16_emu_; member
|
H A D | jit_uni_eltwise.cpp | 129 bf16_emu_.reset(new bf16_emulation_t(this, bf16_emu_reserv_1, in jit_uni_kernel_t() 133 this, k_tail_mask, bf16_emu_.get())); in jit_uni_kernel_t() 151 if (!mayiuse(avx512_core_bf16)) bf16_emu_->init_vcvtneps2bf16(); in generate() 281 std::unique_ptr<bf16_emulation_t> bf16_emu_; member
|
H A D | jit_uni_softmax.cpp | 272 std::unique_ptr<bf16_emulation_t> bf16_emu_ = nullptr; member 300 if (bf16_emu_) in store() 301 bf16_emu_->vcvtneps2bf16(bf16_cvt_ymm, src_vmm); in store() 440 if (bf16_emu_) bf16_emu_->init_vcvtneps2bf16(); in initialization_hook() 445 bf16_emu_.reset(new bf16_emulation_t(this, bf16_emu_zmm_1, in jit_softmax_t()
|
/dports/math/onednn/oneDNN-2.5.1/src/cpu/x64/ |
H A D | jit_avx512_core_bf16_dw_conv_kernel.hpp | 125 std::unique_ptr<bf16_emulation_t> bf16_emu_; member 134 : jcp(ajcp), bf16_emu_(nullptr) { in jit_avx512_dw_conv_bwd_data_kernel_bf16() 137 bf16_emu_ = new bf16_emulation_t(this, bf16_emu_reserv_1, in jit_avx512_dw_conv_bwd_data_kernel_bf16() 142 ~jit_avx512_dw_conv_bwd_data_kernel_bf16() { delete bf16_emu_; } in ~jit_avx512_dw_conv_bwd_data_kernel_bf16() 187 bf16_emulation_t *bf16_emu_; member 211 : jcp(ajcp), bf16_emu_(nullptr) { in jit_avx512_dw_conv_bwd_weights_kernel_bf16() 214 bf16_emu_ = new bf16_emulation_t(this, bf16_emu_reserv_1, in jit_avx512_dw_conv_bwd_weights_kernel_bf16() 219 ~jit_avx512_dw_conv_bwd_weights_kernel_bf16() { delete bf16_emu_; } in ~jit_avx512_dw_conv_bwd_weights_kernel_bf16() 279 bf16_emulation_t *bf16_emu_; member
|
H A D | jit_avx512_core_bf16cvt.hpp | 184 bf16_emu_ = new bf16_emulation_t( in jit_avx512_core_cvt_ps_to_bf16_t() 190 ~jit_avx512_core_cvt_ps_to_bf16_t() { delete bf16_emu_; } in ~jit_avx512_core_cvt_ps_to_bf16_t() 200 bf16_emu_->vcvtneps2bf16(bf16_out, fp32_inp); in generate() 212 if (use_bf16_emu) bf16_emu_->init_vcvtneps2bf16(); in generate() 293 bf16_emulation_t *bf16_emu_; member 345 bf16_emu_ = new bf16_emulation_t( in jit_avx512_core_add_cvt_ps_to_bf16_t() 351 ~jit_avx512_core_add_cvt_ps_to_bf16_t() { delete bf16_emu_; } in ~jit_avx512_core_add_cvt_ps_to_bf16_t() 364 bf16_emu_->vcvtneps2bf16(bf16_out, fp32_inp); in generate() 377 if (use_bf16_emu) bf16_emu_->init_vcvtneps2bf16(); in generate() 424 bf16_emulation_t *bf16_emu_; member
|
H A D | jit_avx512_core_bf16_sum.cpp | 70 bf16_emu_->vdpbf16ps(vacc0, vsrc0, vscale); in loop_iteration() 71 bf16_emu_->vdpbf16ps(vacc1, vsrc1, vscale); in loop_iteration() 88 bf16_emu_->vcvtneps2bf16(ymm_str, vacc0); in loop_iteration() 90 bf16_emu_->vcvtneps2bf16(ymm_str, vacc1); in loop_iteration() 127 if (!isa_has_bf16(jsp.isa)) bf16_emu_->init_vcvtneps2bf16(); in generate() 170 bf16_emu_->vdpbf16ps(vacc, vsrc, vscale); in generate() 184 bf16_emu_->vcvtneps2bf16(ymm_str, vacc); in generate()
|
H A D | jit_avx512_core_bf16_sum.hpp | 52 : jsp(ajsp), bf16_emu_(nullptr) { in jit_avx512_core_bf16_sum_kernel() 54 bf16_emu_ = new bf16_emulation_t(this, bf16_emu_reserved_1, in jit_avx512_core_bf16_sum_kernel() 59 ~jit_avx512_core_bf16_sum_kernel() { delete bf16_emu_; } in ~jit_avx512_core_bf16_sum_kernel() 159 bf16_emulation_t *bf16_emu_; member
|
H A D | jit_avx512_core_bf16_conv_kernel.hpp | 132 std::unique_ptr<bf16_emulation_t> bf16_emu_; member 258 , bf16_emu_(nullptr) { in _jit_avx512_core_bf16_bwd_data_kernel() 260 bf16_emu_ = utils::make_unique<bf16_emulation_t>(this, in _jit_avx512_core_bf16_bwd_data_kernel() 344 std::unique_ptr<bf16_emulation_t> bf16_emu_; member 466 , bf16_emu_(nullptr) { in jit_avx512_core_bf16_conv_bwd_weights_kernel_f32() 468 bf16_emu_ = utils::make_unique<bf16_emulation_t>( in jit_avx512_core_bf16_conv_bwd_weights_kernel_f32() 698 std::unique_ptr<bf16_emulation_t> bf16_emu_; member
|
H A D | jit_uni_eltwise.cpp | 129 bf16_emu_.reset(new bf16_emulation_t(this, bf16_emu_reserv_1, in jit_uni_kernel_t() 133 this, k_tail_mask, bf16_emu_.get())); in jit_uni_kernel_t() 151 if (!mayiuse(avx512_core_bf16)) bf16_emu_->init_vcvtneps2bf16(); in generate() 281 std::unique_ptr<bf16_emulation_t> bf16_emu_; member
|
H A D | jit_uni_softmax.cpp | 270 std::unique_ptr<bf16_emulation_t> bf16_emu_ = nullptr; member 298 if (bf16_emu_) in store() 299 bf16_emu_->vcvtneps2bf16(bf16_cvt_ymm, src_vmm); in store() 438 if (bf16_emu_) bf16_emu_->init_vcvtneps2bf16(); in initialization_hook() 443 bf16_emu_.reset(new bf16_emulation_t(this, bf16_emu_zmm_1, in jit_softmax_t()
|
/dports/misc/mxnet/incubator-mxnet-1.9.0/3rdparty/mkldnn/src/cpu/x64/rnn/ |
H A D | jit_uni_rnn_common_postgemm.hpp | 61 if (bf16_emu_) delete bf16_emu_; in ~jit_uni_rnn_postgemm() 70 bf16_emu_ = new bf16_emulation_t(this, bf16_reg1, bf16_reg2, in init() 74 bf16_emu_ = nullptr; in init() 314 if (bf16_emu_) bf16_emu_->init_vcvtneps2bf16(); in init_regs() 552 if (bf16_emu_) in bf16_dc() 553 bf16_emu_->vcvtneps2bf16(bf16_reg_dc, srcz); in bf16_dc() 613 bf16_emulation_t *bf16_emu_; member
|
/dports/math/onednn/oneDNN-2.5.1/src/cpu/x64/rnn/ |
H A D | jit_uni_rnn_common_postgemm.hpp | 63 if (bf16_emu_) delete bf16_emu_; in ~jit_uni_rnn_postgemm() 72 bf16_emu_ = new bf16_emulation_t(this, bf16_reg1, bf16_reg2, in init() 76 bf16_emu_ = nullptr; in init() 322 if (bf16_emu_) bf16_emu_->init_vcvtneps2bf16(); in init_regs() 560 if (bf16_emu_) in bf16_dc() 561 bf16_emu_->vcvtneps2bf16(bf16_reg_dc, srcz); in bf16_dc() 624 bf16_emulation_t *bf16_emu_ = nullptr; member
|
/dports/misc/mxnet/incubator-mxnet-1.9.0/3rdparty/mkldnn/src/cpu/x64/lrn/ |
H A D | jit_avx512_common_lrn_fwd_base.cpp | 103 this->bf16_emu_->vcvtneps2bf16(yr, zr); in store_data() 196 bf16_emu_ = utils::make_unique<bf16_emulation_t>(this, 199 bf16_emu_->init_vcvtneps2bf16();
|
H A D | jit_avx512_common_lrn_bwd_base.cpp | 68 bf16_emu_->vcvtneps2bf16(yr, zr); in store_data() 197 bf16_emu_ = utils::make_unique<bf16_emulation_t>(this, 200 bf16_emu_->init_vcvtneps2bf16();
|
/dports/math/onednn/oneDNN-2.5.1/src/cpu/x64/lrn/ |
H A D | jit_avx512_common_lrn_bwd_base.cpp | 68 bf16_emu_->vcvtneps2bf16(yr, zr); in store_data() 197 bf16_emu_ = utils::make_unique<bf16_emulation_t>(this, 200 bf16_emu_->init_vcvtneps2bf16();
|
H A D | jit_avx512_common_lrn_fwd_base.cpp | 103 this->bf16_emu_->vcvtneps2bf16(yr, zr); in store_data() 196 bf16_emu_ = utils::make_unique<bf16_emulation_t>(this, 199 bf16_emu_->init_vcvtneps2bf16();
|
/dports/misc/mxnet/incubator-mxnet-1.9.0/3rdparty/mkldnn/src/cpu/x64/utils/ |
H A D | jit_io_helper.cpp | 78 , bf16_emu_(nullptr) in jit_io_helper_t() 88 bf16_emu_ = utils::make_unique<bf16_emulation_t>(host_, in jit_io_helper_t() 123 if (bf16_emu_) { in init_bf16() 126 bf16_emu_->init_vcvtneps2bf16(); in init_bf16() 630 if (bf16_emu_) { in store_bf16() 632 bf16_emu_->vcvtneps2bf16(src_ymm, src_raw_vmm); in store_bf16() 634 bf16_emu_->vcvtneps2bf16(src_xmm, src_raw_vmm); in store_bf16()
|
/dports/math/onednn/oneDNN-2.5.1/src/cpu/x64/utils/ |
H A D | jit_io_helper.cpp | 78 , bf16_emu_(nullptr) in jit_io_helper_t() 88 bf16_emu_ = utils::make_unique<bf16_emulation_t>(host_, in jit_io_helper_t() 123 if (bf16_emu_) { in init_bf16() 126 bf16_emu_->init_vcvtneps2bf16(); in init_bf16() 630 if (bf16_emu_) { in store_bf16() 632 bf16_emu_->vcvtneps2bf16(src_ymm, src_raw_vmm); in store_bf16() 634 bf16_emu_->vcvtneps2bf16(src_xmm, src_raw_vmm); in store_bf16()
|
/dports/misc/mxnet/incubator-mxnet-1.9.0/3rdparty/mkldnn/src/cpu/x64/gemm/bf16/ |
H A D | jit_avx512_core_gemm_bf16bf16f32_kern.cpp | 84 bf16_emu_->vdpbf16ps(make_zmm(dst), make_zmm(src1), make_zmm(src2)); in dot_product() 494 bf16_emu_ = nullptr; in jit_avx512_core_gemm_bf16bf16f32_kern() 506 bf16_emu_ = new bf16_emulation_t( in jit_avx512_core_gemm_bf16bf16f32_kern() 513 delete bf16_emu_; in ~jit_avx512_core_gemm_bf16bf16f32_kern()
|
H A D | jit_avx512_core_gemv_bf16bf16f32_kern.cpp | 57 bf16_emu_->vdpbf16ps(make_zmm(dst), make_zmm(src1), make_zmm(src2)); in dot_product() 593 bf16_emu_ = nullptr; in jit_avx512_core_gemv_bf16bf16f32_kern() 604 bf16_emu_ = new bf16_emulation_t( in jit_avx512_core_gemv_bf16bf16f32_kern() 611 delete bf16_emu_; in ~jit_avx512_core_gemv_bf16bf16f32_kern()
|
/dports/math/onednn/oneDNN-2.5.1/src/cpu/x64/gemm/bf16/ |
H A D | jit_avx512_core_gemm_bf16bf16f32_kern.cpp | 84 bf16_emu_->vdpbf16ps(make_zmm(dst), make_zmm(src1), make_zmm(src2)); in dot_product() 505 bf16_emu_ = nullptr; in jit_avx512_core_gemm_bf16bf16f32_kern() 507 bf16_emu_ = new bf16_emulation_t( in jit_avx512_core_gemm_bf16bf16f32_kern() 513 delete bf16_emu_; in ~jit_avx512_core_gemm_bf16bf16f32_kern()
|