/dports/graphics/libosmesa-gallium/mesa-21.3.6/src/freedreno/ir3/ |
H A D | ir3_nir_lower_tg4_to_tex.c | 41 int num_srcs = tg4->num_srcs + 1 /* lod */; in ir3_nir_lower_tg4_to_tex_instr() local 43 num_srcs++; in ir3_nir_lower_tg4_to_tex_instr() 45 nir_tex_instr *tex = nir_tex_instr_create(b->shader, num_srcs); in ir3_nir_lower_tg4_to_tex_instr() 56 for (int j = 0; j < tg4->num_srcs; j++) { in ir3_nir_lower_tg4_to_tex_instr() 64 tex->src[tg4->num_srcs].src = nir_src_for_ssa(offset); in ir3_nir_lower_tg4_to_tex_instr() 65 tex->src[tg4->num_srcs].src_type = nir_tex_src_offset; in ir3_nir_lower_tg4_to_tex_instr() 74 tex->src[num_srcs - 1].src = nir_src_for_ssa(nir_imm_float(b, 0)); in ir3_nir_lower_tg4_to_tex_instr() 75 tex->src[num_srcs - 1].src_type = nir_tex_src_lod; in ir3_nir_lower_tg4_to_tex_instr()
|
/dports/graphics/mesa-libs/mesa-21.3.6/src/freedreno/ir3/ |
H A D | ir3_nir_lower_tg4_to_tex.c | 41 int num_srcs = tg4->num_srcs + 1 /* lod */; in ir3_nir_lower_tg4_to_tex_instr() local 43 num_srcs++; in ir3_nir_lower_tg4_to_tex_instr() 45 nir_tex_instr *tex = nir_tex_instr_create(b->shader, num_srcs); in ir3_nir_lower_tg4_to_tex_instr() 56 for (int j = 0; j < tg4->num_srcs; j++) { in ir3_nir_lower_tg4_to_tex_instr() 64 tex->src[tg4->num_srcs].src = nir_src_for_ssa(offset); in ir3_nir_lower_tg4_to_tex_instr() 65 tex->src[tg4->num_srcs].src_type = nir_tex_src_offset; in ir3_nir_lower_tg4_to_tex_instr() 74 tex->src[num_srcs - 1].src = nir_src_for_ssa(nir_imm_float(b, 0)); in ir3_nir_lower_tg4_to_tex_instr() 75 tex->src[num_srcs - 1].src_type = nir_tex_src_lod; in ir3_nir_lower_tg4_to_tex_instr()
|
/dports/graphics/mesa-gallium-va/mesa-21.3.6/src/freedreno/ir3/ |
H A D | ir3_nir_lower_tg4_to_tex.c | 41 int num_srcs = tg4->num_srcs + 1 /* lod */; in ir3_nir_lower_tg4_to_tex_instr() local 43 num_srcs++; in ir3_nir_lower_tg4_to_tex_instr() 45 nir_tex_instr *tex = nir_tex_instr_create(b->shader, num_srcs); in ir3_nir_lower_tg4_to_tex_instr() 56 for (int j = 0; j < tg4->num_srcs; j++) { in ir3_nir_lower_tg4_to_tex_instr() 64 tex->src[tg4->num_srcs].src = nir_src_for_ssa(offset); in ir3_nir_lower_tg4_to_tex_instr() 65 tex->src[tg4->num_srcs].src_type = nir_tex_src_offset; in ir3_nir_lower_tg4_to_tex_instr() 74 tex->src[num_srcs - 1].src = nir_src_for_ssa(nir_imm_float(b, 0)); in ir3_nir_lower_tg4_to_tex_instr() 75 tex->src[num_srcs - 1].src_type = nir_tex_src_lod; in ir3_nir_lower_tg4_to_tex_instr()
|
/dports/graphics/mesa-dri-gallium/mesa-21.3.6/src/freedreno/ir3/ |
H A D | ir3_nir_lower_tg4_to_tex.c | 41 int num_srcs = tg4->num_srcs + 1 /* lod */; in ir3_nir_lower_tg4_to_tex_instr() local 43 num_srcs++; in ir3_nir_lower_tg4_to_tex_instr() 45 nir_tex_instr *tex = nir_tex_instr_create(b->shader, num_srcs); in ir3_nir_lower_tg4_to_tex_instr() 56 for (int j = 0; j < tg4->num_srcs; j++) { in ir3_nir_lower_tg4_to_tex_instr() 64 tex->src[tg4->num_srcs].src = nir_src_for_ssa(offset); in ir3_nir_lower_tg4_to_tex_instr() 65 tex->src[tg4->num_srcs].src_type = nir_tex_src_offset; in ir3_nir_lower_tg4_to_tex_instr() 74 tex->src[num_srcs - 1].src = nir_src_for_ssa(nir_imm_float(b, 0)); in ir3_nir_lower_tg4_to_tex_instr() 75 tex->src[num_srcs - 1].src_type = nir_tex_src_lod; in ir3_nir_lower_tg4_to_tex_instr()
|
/dports/graphics/mesa-gallium-vdpau/mesa-21.3.6/src/freedreno/ir3/ |
H A D | ir3_nir_lower_tg4_to_tex.c | 41 int num_srcs = tg4->num_srcs + 1 /* lod */; in ir3_nir_lower_tg4_to_tex_instr() local 43 num_srcs++; in ir3_nir_lower_tg4_to_tex_instr() 45 nir_tex_instr *tex = nir_tex_instr_create(b->shader, num_srcs); in ir3_nir_lower_tg4_to_tex_instr() 56 for (int j = 0; j < tg4->num_srcs; j++) { in ir3_nir_lower_tg4_to_tex_instr() 64 tex->src[tg4->num_srcs].src = nir_src_for_ssa(offset); in ir3_nir_lower_tg4_to_tex_instr() 65 tex->src[tg4->num_srcs].src_type = nir_tex_src_offset; in ir3_nir_lower_tg4_to_tex_instr() 74 tex->src[num_srcs - 1].src = nir_src_for_ssa(nir_imm_float(b, 0)); in ir3_nir_lower_tg4_to_tex_instr() 75 tex->src[num_srcs - 1].src_type = nir_tex_src_lod; in ir3_nir_lower_tg4_to_tex_instr()
|
/dports/graphics/mesa-gallium-xa/mesa-21.3.6/src/freedreno/ir3/ |
H A D | ir3_nir_lower_tg4_to_tex.c | 41 int num_srcs = tg4->num_srcs + 1 /* lod */; in ir3_nir_lower_tg4_to_tex_instr() local 43 num_srcs++; in ir3_nir_lower_tg4_to_tex_instr() 45 nir_tex_instr *tex = nir_tex_instr_create(b->shader, num_srcs); in ir3_nir_lower_tg4_to_tex_instr() 56 for (int j = 0; j < tg4->num_srcs; j++) { in ir3_nir_lower_tg4_to_tex_instr() 64 tex->src[tg4->num_srcs].src = nir_src_for_ssa(offset); in ir3_nir_lower_tg4_to_tex_instr() 65 tex->src[tg4->num_srcs].src_type = nir_tex_src_offset; in ir3_nir_lower_tg4_to_tex_instr() 74 tex->src[num_srcs - 1].src = nir_src_for_ssa(nir_imm_float(b, 0)); in ir3_nir_lower_tg4_to_tex_instr() 75 tex->src[num_srcs - 1].src_type = nir_tex_src_lod; in ir3_nir_lower_tg4_to_tex_instr()
|
/dports/graphics/libosmesa/mesa-21.3.6/src/freedreno/ir3/ |
H A D | ir3_nir_lower_tg4_to_tex.c | 41 int num_srcs = tg4->num_srcs + 1 /* lod */; in ir3_nir_lower_tg4_to_tex_instr() local 43 num_srcs++; in ir3_nir_lower_tg4_to_tex_instr() 45 nir_tex_instr *tex = nir_tex_instr_create(b->shader, num_srcs); in ir3_nir_lower_tg4_to_tex_instr() 56 for (int j = 0; j < tg4->num_srcs; j++) { in ir3_nir_lower_tg4_to_tex_instr() 64 tex->src[tg4->num_srcs].src = nir_src_for_ssa(offset); in ir3_nir_lower_tg4_to_tex_instr() 65 tex->src[tg4->num_srcs].src_type = nir_tex_src_offset; in ir3_nir_lower_tg4_to_tex_instr() 74 tex->src[num_srcs - 1].src = nir_src_for_ssa(nir_imm_float(b, 0)); in ir3_nir_lower_tg4_to_tex_instr() 75 tex->src[num_srcs - 1].src_type = nir_tex_src_lod; in ir3_nir_lower_tg4_to_tex_instr()
|
/dports/graphics/mesa-dri/mesa-21.3.6/src/freedreno/ir3/ |
H A D | ir3_nir_lower_tg4_to_tex.c | 41 int num_srcs = tg4->num_srcs + 1 /* lod */; in ir3_nir_lower_tg4_to_tex_instr() local 43 num_srcs++; in ir3_nir_lower_tg4_to_tex_instr() 45 nir_tex_instr *tex = nir_tex_instr_create(b->shader, num_srcs); in ir3_nir_lower_tg4_to_tex_instr() 56 for (int j = 0; j < tg4->num_srcs; j++) { in ir3_nir_lower_tg4_to_tex_instr() 64 tex->src[tg4->num_srcs].src = nir_src_for_ssa(offset); in ir3_nir_lower_tg4_to_tex_instr() 65 tex->src[tg4->num_srcs].src_type = nir_tex_src_offset; in ir3_nir_lower_tg4_to_tex_instr() 74 tex->src[num_srcs - 1].src = nir_src_for_ssa(nir_imm_float(b, 0)); in ir3_nir_lower_tg4_to_tex_instr() 75 tex->src[num_srcs - 1].src_type = nir_tex_src_lod; in ir3_nir_lower_tg4_to_tex_instr()
|
/dports/graphics/mesa-dri-classic/mesa-20.2.3/src/freedreno/ir3/ |
H A D | ir3_nir_lower_tg4_to_tex.c | 41 int num_srcs = tg4->num_srcs + 1 /* lod */; in ir3_nir_lower_tg4_to_tex_instr() local 43 num_srcs++; in ir3_nir_lower_tg4_to_tex_instr() 45 nir_tex_instr *tex = nir_tex_instr_create(b->shader, num_srcs); in ir3_nir_lower_tg4_to_tex_instr() 56 for (int j = 0; j < tg4->num_srcs; j++) { in ir3_nir_lower_tg4_to_tex_instr() 65 tex->src[tg4->num_srcs].src = nir_src_for_ssa(offset); in ir3_nir_lower_tg4_to_tex_instr() 66 tex->src[tg4->num_srcs].src_type = nir_tex_src_offset; in ir3_nir_lower_tg4_to_tex_instr() 75 tex->src[num_srcs - 1].src = nir_src_for_ssa(nir_imm_float(b, 0)); in ir3_nir_lower_tg4_to_tex_instr() 76 tex->src[num_srcs - 1].src_type = nir_tex_src_lod; in ir3_nir_lower_tg4_to_tex_instr()
|
/dports/lang/clover/mesa-21.3.6/src/freedreno/ir3/ |
H A D | ir3_nir_lower_tg4_to_tex.c | 41 int num_srcs = tg4->num_srcs + 1 /* lod */; in ir3_nir_lower_tg4_to_tex_instr() local 43 num_srcs++; in ir3_nir_lower_tg4_to_tex_instr() 45 nir_tex_instr *tex = nir_tex_instr_create(b->shader, num_srcs); in ir3_nir_lower_tg4_to_tex_instr() 56 for (int j = 0; j < tg4->num_srcs; j++) { in ir3_nir_lower_tg4_to_tex_instr() 64 tex->src[tg4->num_srcs].src = nir_src_for_ssa(offset); in ir3_nir_lower_tg4_to_tex_instr() 65 tex->src[tg4->num_srcs].src_type = nir_tex_src_offset; in ir3_nir_lower_tg4_to_tex_instr() 74 tex->src[num_srcs - 1].src = nir_src_for_ssa(nir_imm_float(b, 0)); in ir3_nir_lower_tg4_to_tex_instr() 75 tex->src[num_srcs - 1].src_type = nir_tex_src_lod; in ir3_nir_lower_tg4_to_tex_instr()
|
/dports/graphics/libosmesa-gallium/mesa-21.3.6/src/gallium/auxiliary/gallivm/ |
H A D | lp_bld_conv.c | 477 int num_dsts = num_srcs; in lp_build_conv_auto() 506 dst_type->length = num_srcs * 4 >= 16 ? 16 : num_srcs * 4; in lp_build_conv_auto() 517 dst_type->length = num_srcs * 8 >= 16 ? 16 : num_srcs * 8; in lp_build_conv_auto() 582 for(i = 0; i < num_srcs; ++i) { in lp_build_conv() 586 num_tmps = num_srcs; in lp_build_conv() 609 (num_dsts == 1 && dst_type.length * num_srcs == 16 && num_srcs != 3)) && in lp_build_conv() 684 if (num_srcs == 1) { in lp_build_conv() 691 if (num_srcs < 4) { in lp_build_conv() 699 if (num_srcs < 4) { in lp_build_conv() 779 if (num_srcs == 1) { in lp_build_conv() [all …]
|
H A D | lp_bld_pack.c | 259 unsigned num_srcs, in lp_build_concat_n() argument 263 int size = num_srcs / num_dsts; in lp_build_concat_n() 266 assert(num_srcs >= num_dsts); in lp_build_concat_n() 267 assert((num_srcs % size) == 0); in lp_build_concat_n() 269 if (num_srcs == num_dsts) { in lp_build_concat_n() 848 for(i = 0; i < num_srcs; ++i) in lp_build_pack() 861 num_srcs /= 2; in lp_build_pack() 863 for(i = 0; i < num_srcs; ++i) in lp_build_pack() 870 assert(num_srcs == 1); in lp_build_pack() 944 num_srcs *= size_ratio; in lp_build_resize() [all …]
|
/dports/graphics/libosmesa/mesa-21.3.6/src/gallium/auxiliary/gallivm/ |
H A D | lp_bld_conv.c | 477 int num_dsts = num_srcs; in lp_build_conv_auto() 506 dst_type->length = num_srcs * 4 >= 16 ? 16 : num_srcs * 4; in lp_build_conv_auto() 517 dst_type->length = num_srcs * 8 >= 16 ? 16 : num_srcs * 8; in lp_build_conv_auto() 582 for(i = 0; i < num_srcs; ++i) { in lp_build_conv() 586 num_tmps = num_srcs; in lp_build_conv() 609 (num_dsts == 1 && dst_type.length * num_srcs == 16 && num_srcs != 3)) && in lp_build_conv() 684 if (num_srcs == 1) { in lp_build_conv() 691 if (num_srcs < 4) { in lp_build_conv() 699 if (num_srcs < 4) { in lp_build_conv() 779 if (num_srcs == 1) { in lp_build_conv() [all …]
|
H A D | lp_bld_pack.c | 259 unsigned num_srcs, in lp_build_concat_n() argument 263 int size = num_srcs / num_dsts; in lp_build_concat_n() 266 assert(num_srcs >= num_dsts); in lp_build_concat_n() 267 assert((num_srcs % size) == 0); in lp_build_concat_n() 269 if (num_srcs == num_dsts) { in lp_build_concat_n() 848 for(i = 0; i < num_srcs; ++i) in lp_build_pack() 861 num_srcs /= 2; in lp_build_pack() 863 for(i = 0; i < num_srcs; ++i) in lp_build_pack() 870 assert(num_srcs == 1); in lp_build_pack() 944 num_srcs *= size_ratio; in lp_build_resize() [all …]
|
/dports/graphics/mesa-libs/mesa-21.3.6/src/gallium/auxiliary/gallivm/ |
H A D | lp_bld_conv.c | 477 int num_dsts = num_srcs; in lp_build_conv_auto() 506 dst_type->length = num_srcs * 4 >= 16 ? 16 : num_srcs * 4; in lp_build_conv_auto() 517 dst_type->length = num_srcs * 8 >= 16 ? 16 : num_srcs * 8; in lp_build_conv_auto() 582 for(i = 0; i < num_srcs; ++i) { in lp_build_conv() 586 num_tmps = num_srcs; in lp_build_conv() 609 (num_dsts == 1 && dst_type.length * num_srcs == 16 && num_srcs != 3)) && in lp_build_conv() 684 if (num_srcs == 1) { in lp_build_conv() 691 if (num_srcs < 4) { in lp_build_conv() 699 if (num_srcs < 4) { in lp_build_conv() 779 if (num_srcs == 1) { in lp_build_conv() [all …]
|
/dports/graphics/mesa-gallium-va/mesa-21.3.6/src/gallium/auxiliary/gallivm/ |
H A D | lp_bld_conv.c | 477 int num_dsts = num_srcs; in lp_build_conv_auto() 506 dst_type->length = num_srcs * 4 >= 16 ? 16 : num_srcs * 4; in lp_build_conv_auto() 517 dst_type->length = num_srcs * 8 >= 16 ? 16 : num_srcs * 8; in lp_build_conv_auto() 582 for(i = 0; i < num_srcs; ++i) { in lp_build_conv() 586 num_tmps = num_srcs; in lp_build_conv() 609 (num_dsts == 1 && dst_type.length * num_srcs == 16 && num_srcs != 3)) && in lp_build_conv() 684 if (num_srcs == 1) { in lp_build_conv() 691 if (num_srcs < 4) { in lp_build_conv() 699 if (num_srcs < 4) { in lp_build_conv() 779 if (num_srcs == 1) { in lp_build_conv() [all …]
|
/dports/graphics/mesa-dri-gallium/mesa-21.3.6/src/gallium/auxiliary/gallivm/ |
H A D | lp_bld_conv.c | 477 int num_dsts = num_srcs; in lp_build_conv_auto() 506 dst_type->length = num_srcs * 4 >= 16 ? 16 : num_srcs * 4; in lp_build_conv_auto() 517 dst_type->length = num_srcs * 8 >= 16 ? 16 : num_srcs * 8; in lp_build_conv_auto() 582 for(i = 0; i < num_srcs; ++i) { in lp_build_conv() 586 num_tmps = num_srcs; in lp_build_conv() 609 (num_dsts == 1 && dst_type.length * num_srcs == 16 && num_srcs != 3)) && in lp_build_conv() 684 if (num_srcs == 1) { in lp_build_conv() 691 if (num_srcs < 4) { in lp_build_conv() 699 if (num_srcs < 4) { in lp_build_conv() 779 if (num_srcs == 1) { in lp_build_conv() [all …]
|
/dports/graphics/mesa-gallium-vdpau/mesa-21.3.6/src/gallium/auxiliary/gallivm/ |
H A D | lp_bld_conv.c | 477 int num_dsts = num_srcs; in lp_build_conv_auto() 506 dst_type->length = num_srcs * 4 >= 16 ? 16 : num_srcs * 4; in lp_build_conv_auto() 517 dst_type->length = num_srcs * 8 >= 16 ? 16 : num_srcs * 8; in lp_build_conv_auto() 582 for(i = 0; i < num_srcs; ++i) { in lp_build_conv() 586 num_tmps = num_srcs; in lp_build_conv() 609 (num_dsts == 1 && dst_type.length * num_srcs == 16 && num_srcs != 3)) && in lp_build_conv() 684 if (num_srcs == 1) { in lp_build_conv() 691 if (num_srcs < 4) { in lp_build_conv() 699 if (num_srcs < 4) { in lp_build_conv() 779 if (num_srcs == 1) { in lp_build_conv() [all …]
|
/dports/graphics/mesa-gallium-xa/mesa-21.3.6/src/gallium/auxiliary/gallivm/ |
H A D | lp_bld_conv.c | 477 int num_dsts = num_srcs; in lp_build_conv_auto() 506 dst_type->length = num_srcs * 4 >= 16 ? 16 : num_srcs * 4; in lp_build_conv_auto() 517 dst_type->length = num_srcs * 8 >= 16 ? 16 : num_srcs * 8; in lp_build_conv_auto() 582 for(i = 0; i < num_srcs; ++i) { in lp_build_conv() 586 num_tmps = num_srcs; in lp_build_conv() 609 (num_dsts == 1 && dst_type.length * num_srcs == 16 && num_srcs != 3)) && in lp_build_conv() 684 if (num_srcs == 1) { in lp_build_conv() 691 if (num_srcs < 4) { in lp_build_conv() 699 if (num_srcs < 4) { in lp_build_conv() 779 if (num_srcs == 1) { in lp_build_conv() [all …]
|
/dports/graphics/mesa-devel/mesa-22.0-branchpoint-2059-ge8a63cf61ec/src/gallium/auxiliary/gallivm/ |
H A D | lp_bld_conv.c | 477 int num_dsts = num_srcs; in lp_build_conv_auto() 506 dst_type->length = num_srcs * 4 >= 16 ? 16 : num_srcs * 4; in lp_build_conv_auto() 517 dst_type->length = num_srcs * 8 >= 16 ? 16 : num_srcs * 8; in lp_build_conv_auto() 582 for(i = 0; i < num_srcs; ++i) { in lp_build_conv() 586 num_tmps = num_srcs; in lp_build_conv() 609 (num_dsts == 1 && dst_type.length * num_srcs == 16 && num_srcs != 3)) && in lp_build_conv() 684 if (num_srcs == 1) { in lp_build_conv() 691 if (num_srcs < 4) { in lp_build_conv() 699 if (num_srcs < 4) { in lp_build_conv() 779 if (num_srcs == 1) { in lp_build_conv() [all …]
|
/dports/graphics/mesa-dri/mesa-21.3.6/src/gallium/auxiliary/gallivm/ |
H A D | lp_bld_conv.c | 477 int num_dsts = num_srcs; in lp_build_conv_auto() 506 dst_type->length = num_srcs * 4 >= 16 ? 16 : num_srcs * 4; in lp_build_conv_auto() 517 dst_type->length = num_srcs * 8 >= 16 ? 16 : num_srcs * 8; in lp_build_conv_auto() 582 for(i = 0; i < num_srcs; ++i) { in lp_build_conv() 586 num_tmps = num_srcs; in lp_build_conv() 609 (num_dsts == 1 && dst_type.length * num_srcs == 16 && num_srcs != 3)) && in lp_build_conv() 684 if (num_srcs == 1) { in lp_build_conv() 691 if (num_srcs < 4) { in lp_build_conv() 699 if (num_srcs < 4) { in lp_build_conv() 779 if (num_srcs == 1) { in lp_build_conv() [all …]
|
/dports/graphics/mesa-dri-classic/mesa-20.2.3/src/gallium/auxiliary/gallivm/ |
H A D | lp_bld_conv.c | 466 int num_dsts = num_srcs; in lp_build_conv_auto() 495 dst_type->length = num_srcs * 4 >= 16 ? 16 : num_srcs * 4; in lp_build_conv_auto() 506 dst_type->length = num_srcs * 8 >= 16 ? 16 : num_srcs * 8; in lp_build_conv_auto() 571 for(i = 0; i < num_srcs; ++i) { in lp_build_conv() 575 num_tmps = num_srcs; in lp_build_conv() 598 (num_dsts == 1 && dst_type.length * num_srcs == 16 && num_srcs != 3)) && in lp_build_conv() 673 if (num_srcs == 1) { in lp_build_conv() 680 if (num_srcs < 4) { in lp_build_conv() 688 if (num_srcs < 4) { in lp_build_conv() 768 if (num_srcs == 1) { in lp_build_conv() [all …]
|
/dports/lang/clover/mesa-21.3.6/src/gallium/auxiliary/gallivm/ |
H A D | lp_bld_conv.c | 477 int num_dsts = num_srcs; in lp_build_conv_auto() 506 dst_type->length = num_srcs * 4 >= 16 ? 16 : num_srcs * 4; in lp_build_conv_auto() 517 dst_type->length = num_srcs * 8 >= 16 ? 16 : num_srcs * 8; in lp_build_conv_auto() 582 for(i = 0; i < num_srcs; ++i) { in lp_build_conv() 586 num_tmps = num_srcs; in lp_build_conv() 609 (num_dsts == 1 && dst_type.length * num_srcs == 16 && num_srcs != 3)) && in lp_build_conv() 684 if (num_srcs == 1) { in lp_build_conv() 691 if (num_srcs < 4) { in lp_build_conv() 699 if (num_srcs < 4) { in lp_build_conv() 779 if (num_srcs == 1) { in lp_build_conv() [all …]
|
/dports/misc/mxnet/incubator-mxnet-1.9.0/3rdparty/mkldnn/src/cpu/x64/ |
H A D | jit_avx512_core_bf16_sum.hpp | 32 int num_srcs; member 63 static status_t init_conf(jit_sum_conf_t &jsp, const int num_srcs, 118 = 2 * jsp.loop_unroll + utils::div_up(jsp.num_srcs, 2); in src_vreg_idx() 119 int idx = inp_idx_start + utils::rnd_up(jsp.num_srcs, 2) * i_unroll in src_vreg_idx() 126 int num_acc_iters = utils::div_up(jsp.num_srcs, 2); in tmp_vreg_idx() 128 int tmp_idx_start = utils::div_up(jsp.num_srcs, 2) in tmp_vreg_idx() 129 + (2 + utils::rnd_up(jsp.num_srcs, 2)) * jsp.loop_unroll; in tmp_vreg_idx() 135 static int num_vregs_required(int unroll, int num_srcs) { in num_vregs_required() 136 int num_acc_iters = utils::div_up(num_srcs, 2); in num_vregs_required() 138 int num_regs = utils::div_up(num_srcs, 2) in num_vregs_required() [all …]
|
/dports/math/onednn/oneDNN-2.5.1/src/cpu/x64/ |
H A D | jit_avx512_core_bf16_sum.hpp | 32 int num_srcs; member 63 static status_t init_conf(jit_sum_conf_t &jsp, const int num_srcs, 118 = 2 * jsp.loop_unroll + utils::div_up(jsp.num_srcs, 2); in src_vreg_idx() 119 int idx = inp_idx_start + utils::rnd_up(jsp.num_srcs, 2) * i_unroll in src_vreg_idx() 126 int num_acc_iters = utils::div_up(jsp.num_srcs, 2); in tmp_vreg_idx() 128 int tmp_idx_start = utils::div_up(jsp.num_srcs, 2) in tmp_vreg_idx() 129 + (2 + utils::rnd_up(jsp.num_srcs, 2)) * jsp.loop_unroll; in tmp_vreg_idx() 135 static int num_vregs_required(int unroll, int num_srcs) { in num_vregs_required() 136 int num_acc_iters = utils::div_up(num_srcs, 2); in num_vregs_required() 138 int num_regs = utils::div_up(num_srcs, 2) in num_vregs_required() [all …]
|