/dports/math/libxsmm/libxsmm-1.16.3/src/template/ |
H A D | libxsmm_dnn_convolve_st_bwd_custom_custom_generic.tpl.c | 18 int my_ifm_start = 0; variable 104 my_ifm_start = LIBXSMM_MIN(myIfmId * nIfmBlocks, handle->blocksifm); 128 my_ifm_start = LIBXSMM_MIN(ifm_id * ifmpt, handle->blocksifm); 136 for (ifmb = my_ifm_start; ifmb < my_ifm_end; ifmb += handle->block_bwd_ifm) { 210 for (ifmb = my_ifm_start; ifmb < my_ifm_end; ifmb += handle->block_bwd_ifm) { 262 for (ifmb = my_ifm_start; ifmb < my_ifm_end; ifmb += handle->block_bwd_ifm) { 312 for (ifm1 = my_ifm_start; ifm1 < my_ifm_end; ifm1++) { 333 for (ifm1 = my_ifm_start; ifm1 < my_ifm_end; ifm1++) {
|
H A D | libxsmm_dnn_convolve_st_bwd_nhwc_custom-rsck_generic.tpl.c | 18 int my_ifm_start = 0; variable 119 my_ifm_start = LIBXSMM_MIN(myIfmId * nIfmBlocks, handle->blocksifm); 143 my_ifm_start = LIBXSMM_MIN(ifm_id * ifmpt, handle->blocksifm); 151 for (ifmb = my_ifm_start; ifmb < my_ifm_end; ifmb += handle->block_bwd_ifm) { 225 for (ifmb = my_ifm_start; ifmb < my_ifm_end; ifmb += handle->block_bwd_ifm) { 277 for (ifmb = my_ifm_start; ifmb < my_ifm_end; ifmb += handle->block_bwd_ifm) { 327 for (ifm1 = my_ifm_start; ifm1 < my_ifm_end; ifm1++) { 348 for (ifm1 = my_ifm_start; ifm1 < my_ifm_end; ifm1++) {
|
H A D | libxsmm_dnn_convolve_st_bwd_custom_custom_generic_bf16.tpl.c | 19 int my_ifm_start = 0; variable 86 my_ifm_start = LIBXSMM_MIN(myIfmId * nIfmBlocks, handle->blocksifm); 110 my_ifm_start = LIBXSMM_MIN(ifm_id * ifmpt, handle->blocksifm); 118 for (ifmb = my_ifm_start; ifmb < my_ifm_end; ifmb += handle->block_bwd_ifm) { 240 for (ifmb = my_ifm_start; ifmb < my_ifm_end; ifmb += handle->block_bwd_ifm) { 306 for (ifmb = my_ifm_start; ifmb < my_ifm_end; ifmb += handle->block_bwd_ifm) { 370 for (ifm1 = my_ifm_start; ifm1 < my_ifm_end; ifm1++) { 391 for (ifm1 = my_ifm_start; ifm1 < my_ifm_end; ifm1++) {
|
H A D | libxsmm_dnn_convolve_st_upd_custom_custom_generic.tpl.c | 12 … ki, ind, j_br, img_br, img_block_size = 1, my_ofm_start, my_ofm_end, my_ifm_start, my_ifm_end, bl… variable 44 my_ifm_start = 0; 48 for (ifm1 = my_ifm_start; ifm1 < my_ifm_end; ifm1++) { 317 my_ifm_start = LIBXSMM_MIN(my_in_tile_id * ifms_per_thread, handle->blocksifm ); 325 my_ifm_start = 0; 330 my_ifm_start = 0; 340 my_ifm_start = 0; 344 block_ifm = my_ifm_end-my_ifm_start+1; 435 for (ifm1 = my_ifm_start; ifm1 < my_ifm_end; ifm1++) { 452 for (ifmb = my_ifm_start; ifmb < my_ifm_end; ifmb += block_ifm) { [all …]
|
H A D | libxsmm_dnn_convolve_st_upd_nhwc_custom-rsck_generic.tpl.c | 12 … ki, ind, j_br, img_br, img_block_size = 1, my_ofm_start, my_ofm_end, my_ifm_start, my_ifm_end, bl… variable 58 my_ifm_start = 0; 62 for (ifm1 = my_ifm_start; ifm1 < my_ifm_end; ifm1++) { 386 my_ifm_start = LIBXSMM_MIN(my_in_tile_id * ifms_per_thread, handle->blocksifm ); 394 my_ifm_start = 0; 399 my_ifm_start = 0; 407 block_ifm = my_ifm_end-my_ifm_start+1; 518 for (ifm1 = my_ifm_start; ifm1 < my_ifm_end; ifm1++) { 540 for (ifmb = my_ifm_start; ifmb < my_ifm_end; ifmb += block_ifm) { 577 for (ifmb = my_ifm_start; ifmb < my_ifm_end; ifmb += block_ifm) {
|
H A D | libxsmm_dnn_convolve_st_upd_custom_custom_generic_bf16.tpl.c | 67 …ki, j_br, img_br, i, j, img_block_size = 1, my_ofm_start, my_ofm_end, my_ifm_start, my_ifm_end, bl… variable 468 my_ifm_start = LIBXSMM_MIN(my_in_tile_id * ifms_per_thread, handle->blocksifm ); 476 my_ifm_start = 0; 481 my_ifm_start = 0; 489 block_ifm = my_ifm_end-my_ifm_start+1; 498 for (ifm1 = my_ifm_start; ifm1 < my_ifm_end; ifm1++) { 511 for (ifmb = my_ifm_start; ifmb < my_ifm_end; ifmb += block_ifm) {
|
H A D | libxsmm_dnn_convolve_st_fwd_custom_custom_generic_i8i32.tpl.c | 48 int my_ifm_start = LIBXSMM_MIN(ifm_id * ifmpt, handle->blocksifm); variable 52 for (ifm1 = my_ifm_start; ifm1 < my_ifm_end; ifm1++) {
|
H A D | libxsmm_dnn_convolve_st_fwd_custom_custom_generic.tpl.c | 76 int my_ifm_start = LIBXSMM_MIN(ifm_id * ifmpt, handle->blocksifm); variable 80 for (ifm1 = my_ifm_start; ifm1 < my_ifm_end; ifm1++) { 102 int my_ifm_start = LIBXSMM_MIN(ifm_id * ifmpt, handle->blocksifm); variable 106 for (ifm1 = my_ifm_start; ifm1 < my_ifm_end; ifm1++) {
|
H A D | libxsmm_dnn_convolve_st_fwd_nhwc_custom-rsck_generic.tpl.c | 81 int my_ifm_start = LIBXSMM_MIN(ifm_id * ifmpt, handle->blocksifm); variable 86 for (ifm1 = my_ifm_start; ifm1 < my_ifm_end; ifm1++) { 108 int my_ifm_start = LIBXSMM_MIN(ifm_id * ifmpt, handle->blocksifm); variable 112 for (ifm1 = my_ifm_start; ifm1 < my_ifm_end; ifm1++) {
|
H A D | libxsmm_dnn_convolve_st_fwd_custom_custom_generic_bf16.tpl.c | 83 int my_ifm_start = LIBXSMM_MIN(ifm_id * ifmpt, handle->blocksifm); variable 87 for (ifm1 = my_ifm_start; ifm1 < my_ifm_end; ifm1++) {
|