/dports/math/libxsmm/libxsmm-1.16.3/src/template/ |
H A D | libxsmm_dnn_fullyconnected_st_bwdupd_custom_generic.tpl.c | 21 const int ltid = tid - start_thread; variable 27 const int thr_begin = (ltid * chunksize < work) ? (ltid * chunksize) : work; 28 const int thr_end = ((ltid + 1) * chunksize < work) ? ((ltid + 1) * chunksize) : work; 58 …const int thr_begin_input = (ltid * chunksize_input < work_input) ? (ltid * chunksize_input) : wor… 59 …const int thr_end_input = ((ltid + 1) * chunksize_input < work_input) ? ((ltid + 1) * chunksize_in… 66 libxsmm_barrier_init(handle->barrier, ltid); 89 libxsmm_barrier_wait(handle->barrier, ltid); 140 const int ltid = tid - start_thread; variable 146 const int thr_begin = (ltid * chunksize < work) ? (ltid * chunksize) : work; 147 const int thr_end = ((ltid + 1) * chunksize < work) ? ((ltid + 1) * chunksize) : work; [all …]
|
H A D | libxsmm_dnn_fullyconnected_st_fwd_custom_generic.tpl.c | 20 const int ltid = tid - start_thread; variable 26 const int thr_begin = (ltid * chunksize < work) ? (ltid * chunksize) : work; 27 const int thr_end = ((ltid + 1) * chunksize < work) ? ((ltid + 1) * chunksize) : work; 44 const int thr_begin_input = (ltid * chunksize_input < work_input) ? (ltid * chunksize_input) : work… 45 const int thr_end_input = ((ltid + 1) * chunksize_input < work_input) ? ((ltid + 1) * chunksize_inp… 52 const int thr_begin_filter = (ltid * chunksize_filter < work_filter) ? (ltid * chunksize_filter) : … 53 const int thr_end_filter = ((ltid + 1) * chunksize_filter < work_filter) ? ((ltid + 1) * chunksize_… 60 libxsmm_barrier_init(handle->barrier, ltid); 66 libxsmm_barrier_wait(handle->barrier, ltid); 101 libxsmm_barrier_wait(handle->barrier, ltid);
|
H A D | libxsmm_dnn_softmaxloss_st_bwd_ncnc_generic.tpl.c | 62 const int ltid = tid - start_thread; variable 69 const int n_thr_begin = (ltid * n_chunksize < n_work) ? (ltid * n_chunksize) : n_work; 70 const int n_thr_end = ((ltid + 1) * n_chunksize < n_work) ? ((ltid + 1) * n_chunksize) : n_work; 78 const int nc_thr_begin = (ltid * nc_chunksize < nc_work) ? (ltid * nc_chunksize) : nc_work; 79 const int nc_thr_end = ((ltid + 1) * nc_chunksize < nc_work) ? ((ltid + 1) * nc_chunksize) : nc_wor… 94 libxsmm_barrier_init( handle->barrier, ltid ); 104 libxsmm_barrier_wait( handle->barrier, ltid ); 109 libxsmm_barrier_wait( handle->barrier, ltid ); 130 libxsmm_barrier_wait( handle->barrier, ltid ); 140 libxsmm_barrier_wait( handle->barrier, ltid ); [all …]
|
H A D | libxsmm_dnn_fullyconnected_st_bwdupd_ncnc_kcck_generic.tpl.c | 21 const int ltid = tid - start_thread; variable 32 const int eltwise_thr_begin = (ltid * eltwise_chunksize < eltwise_work) ? (ltid * eltwise_chunksize… 43 const int dbias_thr_begin = (ltid * dbias_chunksize < dbias_work) ? (ltid * dbias_chunksize) : dbia… 118 const int thr_begin = (ltid * chunksize < work) ? (ltid * chunksize) : work; 119 const int thr_end = ((ltid + 1) * chunksize < work) ? ((ltid + 1) * chunksize) : work; 146 my_col_id = ltid % column_teams; 147 my_row_id = ltid / column_teams; 256 const int thr_begin = (ltid * chunksize < work) ? (ltid * chunksize) : work; 257 const int thr_end = ((ltid + 1) * chunksize < work) ? ((ltid + 1) * chunksize) : work; 272 my_col_id = ltid % column_teams; [all …]
|
H A D | libxsmm_dnn_softmaxloss_st_fwd_ncnc_generic.tpl.c | 60 const int ltid = tid - start_thread; variable 67 const int n_thr_begin = (ltid * n_chunksize < n_work) ? (ltid * n_chunksize) : n_work; 68 const int n_thr_end = ((ltid + 1) * n_chunksize < n_work) ? ((ltid + 1) * n_chunksize) : n_work; 76 const int nc_thr_begin = (ltid * nc_chunksize < nc_work) ? (ltid * nc_chunksize) : nc_work; 77 const int nc_thr_end = ((ltid + 1) * nc_chunksize < nc_work) ? ((ltid + 1) * nc_chunksize) : nc_wor… 92 libxsmm_barrier_init( handle->barrier, ltid ); 102 libxsmm_barrier_wait( handle->barrier, ltid ); 107 libxsmm_barrier_wait( handle->barrier, ltid ); 144 libxsmm_barrier_wait( handle->barrier, ltid ); 147 if ( ltid == 0 ) { [all …]
|
H A D | libxsmm_dnn_rnncell_st_lstm_fwd_nc_kcck_fused_bf16.tpl.c | 47 if (ltid == 0) { 60 if (ltid == 0) { 75 if (ltid == 0) { 88 if (ltid == 0) { 103 if (ltid == 0) { 116 if (ltid == 0) { 131 if (ltid == 0) { 144 if (ltid == 0) { 152 if (ltid == 0) { 190 if (ltid == 0) { [all …]
|
H A D | libxsmm_dnn_rnncell_st_lstm_bwdupd_nc_kcck.tpl.c | 170 const libxsmm_blasint thr_begin_nk = (ltid * chunksize_nk < work_nk) ? (ltid * chunksize_nk) : work… 171 const libxsmm_blasint thr_end_nk = ((ltid + 1) * chunksize_nk < work_nk) ? ((ltid + 1) * chunksize_… 178 const libxsmm_blasint thr_begin_nc = (ltid * chunksize_nc < work_nc) ? (ltid * chunksize_nc) : work… 186 const libxsmm_blasint thr_begin_ck = (ltid * chunksize_ck < work_ck) ? (ltid * chunksize_ck) : work… 194 const libxsmm_blasint thr_begin_kk = (ltid * chunksize_kk < work_kk) ? (ltid * chunksize_kk) : work… 202 const libxsmm_blasint k_thr_begin = (ltid * k_chunksize * 16 < K) ? (ltid * k_chunksize * 16) : K; 209 const libxsmm_blasint thr_begin_k = (ltid * chunksize_k < K) ? (ltid * chunksize_k) : K; 210 const libxsmm_blasint thr_end_k = ((ltid + 1) * chunksize_k < K) ? ((ltid + 1) * chunksize_k) : K; 253 if (ltid == 0) _start = _rdtsc(); 283 if (ltid == 0) { [all …]
|
H A D | libxsmm_dnn_rnncell_st_lstm_fwd_nc_kcck_bf16.tpl.c | 148 const libxsmm_blasint thr_begin = (ltid * chunksize < work) ? (ltid * chunksize) : work; 149 const libxsmm_blasint thr_end = ((ltid + 1) * chunksize < work) ? ((ltid + 1) * chunksize) : work; 157 const libxsmm_blasint thr_begin_ck = (ltid * chunksize_ck < work_ck) ? (ltid * chunksize_ck) : work… 158 const libxsmm_blasint thr_end_ck = ((ltid + 1) * chunksize_ck < work_ck) ? ((ltid + 1) * chunksize_… 164 const libxsmm_blasint thr_begin_kk = (ltid * chunksize_kk < work_kk) ? (ltid * chunksize_kk) : work… 165 const libxsmm_blasint thr_end_kk = ((ltid + 1) * chunksize_kk < work_kk) ? ((ltid + 1) * chunksize_… 175 libxsmm_barrier_init(handle->barrier, (int)ltid); 200 if (ltid == 0) reformat_start = _rdtsc(); 211 libxsmm_barrier_wait(handle->barrier, (int)ltid); 213 if (ltid == 0) { [all …]
|
H A D | libxsmm_dnn_fullyconnected_st_bwdupd_ncnc_kcck_generic_bf16.tpl.c | 31 const int ltid = tid - start_thread; variable 39 const int eltwise_thr_begin = (ltid * eltwise_chunksize < eltwise_work) ? (ltid * eltwise_chunksize… 49 const int dbias_thr_begin = (ltid * dbias_chunksize < dbias_work) ? (ltid * dbias_chunksize) : dbia… 212 const int thr_begin = (ltid * chunksize < work) ? (ltid * chunksize) : work; 213 const int thr_end = ((ltid + 1) * chunksize < work) ? ((ltid + 1) * chunksize) : work; 242 my_col_id = ltid % column_teams; 243 my_row_id = ltid / column_teams; 396 const int thr_begin = (ltid * chunksize < work) ? (ltid * chunksize) : work; 397 const int thr_end = ((ltid + 1) * chunksize < work) ? ((ltid + 1) * chunksize) : work; 437 my_col_id = ltid % column_teams; [all …]
|
H A D | libxsmm_dnn_rnncell_st_rnn_bwdupd_nc_ck_generic.tpl.c | 71 const libxsmm_blasint thr_begin_nk = (ltid * chunksize_nk < work_nk) ? (ltid * chunksize_nk) : work… 72 const libxsmm_blasint thr_end_nk = ((ltid + 1) * chunksize_nk < work_nk) ? ((ltid + 1) * chunksize_… 79 const libxsmm_blasint thr_begin_nc = (ltid * chunksize_nc < work_nc) ? (ltid * chunksize_nc) : work… 80 const libxsmm_blasint thr_end_nc = ((ltid + 1) * chunksize_nc < work_nc) ? ((ltid + 1) * chunksize_… 87 const libxsmm_blasint thr_begin_ck = (ltid * chunksize_ck < work_ck) ? (ltid * chunksize_ck) : work… 88 const libxsmm_blasint thr_end_ck = ((ltid + 1) * chunksize_ck < work_ck) ? ((ltid + 1) * chunksize_… 95 const libxsmm_blasint thr_begin_kk = (ltid * chunksize_kk < work_kk) ? (ltid * chunksize_kk) : work… 96 const libxsmm_blasint thr_end_kk = ((ltid + 1) * chunksize_kk < work_kk) ? ((ltid + 1) * chunksize_… 102 const libxsmm_blasint thr_begin_k = (ltid * chunksize_k < K) ? (ltid * chunksize_k) : K; 103 const libxsmm_blasint thr_end_k = ((ltid + 1) * chunksize_k < K) ? ((ltid + 1) * chunksize_k) : K; [all …]
|
H A D | libxsmm_dnn_rnncell_st_rnn_bwdupd_nc_kcck.tpl.c | 84 const libxsmm_blasint thr_begin_nk = (ltid * chunksize_nk < work_nk) ? (ltid * chunksize_nk) : work… 85 const libxsmm_blasint thr_end_nk = ((ltid + 1) * chunksize_nk < work_nk) ? ((ltid + 1) * chunksize_… 92 const libxsmm_blasint thr_begin_nc = (ltid * chunksize_nc < work_nc) ? (ltid * chunksize_nc) : work… 93 const libxsmm_blasint thr_end_nc = ((ltid + 1) * chunksize_nc < work_nc) ? ((ltid + 1) * chunksize_… 100 const libxsmm_blasint thr_begin_ck = (ltid * chunksize_ck < work_ck) ? (ltid * chunksize_ck) : work… 101 const libxsmm_blasint thr_end_ck = ((ltid + 1) * chunksize_ck < work_ck) ? ((ltid + 1) * chunksize_… 108 const libxsmm_blasint thr_begin_kk = (ltid * chunksize_kk < work_kk) ? (ltid * chunksize_kk) : work… 115 const libxsmm_blasint k_thr_begin = (ltid * k_chunksize * 16 < K) ? (ltid * k_chunksize * 16) : K; 116 const libxsmm_blasint k_thr_end = ((ltid + 1) * k_chunksize * 16 < K) ? ((ltid + 1) * k_chunksize *… 123 const libxsmm_blasint thr_begin_k = (ltid * chunksize_k < K) ? (ltid * chunksize_k) : K; [all …]
|
H A D | libxsmm_dnn_rnncell_st_lstm_bwdupd_nc_ck_generic.tpl.c | 183 const libxsmm_blasint thr_begin_nk = (ltid * chunksize_nk < work_nk) ? (ltid * chunksize_nk) : work… 191 const libxsmm_blasint thr_begin_nc = (ltid * chunksize_nc < work_nc) ? (ltid * chunksize_nc) : work… 199 const libxsmm_blasint thr_begin_ck = (ltid * chunksize_ck < work_ck) ? (ltid * chunksize_ck) : work… 215 const libxsmm_blasint k_thr_begin = (ltid * k_chunksize * 16 < K) ? (ltid * k_chunksize * 16) : K; 222 const libxsmm_blasint thr_begin_k = (ltid * chunksize_k < K) ? (ltid * chunksize_k) : K; 223 const libxsmm_blasint thr_end_k = ((ltid + 1) * chunksize_k < K) ? ((ltid + 1) * chunksize_k) : K; 265 if (ltid == 0) _start = _rdtsc(); 295 if (ltid == 0) { 305 if (ltid == 0) _start = _rdtsc(); 339 if (ltid == 0) { [all …]
|
H A D | libxsmm_dnn_rnncell_st_lstm_bwdupd_nc_ck_generic_bf16.tpl.c | 187 const libxsmm_blasint thr_begin_nk = (ltid * chunksize_nk < work_nk) ? (ltid * chunksize_nk) : work… 195 const libxsmm_blasint thr_begin_nc = (ltid * chunksize_nc < work_nc) ? (ltid * chunksize_nc) : work… 202 const libxsmm_blasint thr_begin_ck = (ltid * chunksize_ck < work_ck) ? (ltid * chunksize_ck) : work… 217 const libxsmm_blasint k_thr_begin = (ltid * k_chunksize * 16 < K) ? (ltid * k_chunksize * 16) : K; 225 const libxsmm_blasint thr_begin_k = (ltid * chunksize_k < K) ? (ltid * chunksize_k) : K; 226 const libxsmm_blasint thr_end_k = ((ltid + 1) * chunksize_k < K) ? ((ltid + 1) * chunksize_k) : K; 269 if (ltid == 0) _start = _rdtsc(); 299 if (ltid == 0) { 309 if (ltid == 0) _start = _rdtsc(); 347 if (ltid == 0) { [all …]
|
H A D | libxsmm_dnn_rnncell_st_lstm_fwd_nc_ck_generic.tpl.c | 107 const libxsmm_blasint thr_begin = (ltid * chunksize < work) ? (ltid * chunksize) : work; 108 const libxsmm_blasint thr_end = ((ltid + 1) * chunksize < work) ? ((ltid + 1) * chunksize) : work; 115 const libxsmm_blasint thr_begin_ck = (ltid * chunksize_ck < work_ck) ? (ltid * chunksize_ck) : work… 116 const libxsmm_blasint thr_end_ck = ((ltid + 1) * chunksize_ck < work_ck) ? ((ltid + 1) * chunksize_… 123 const libxsmm_blasint thr_begin_kk = (ltid * chunksize_kk < work_kk) ? (ltid * chunksize_kk) : work… 124 const libxsmm_blasint thr_end_kk = ((ltid + 1) * chunksize_kk < work_kk) ? ((ltid + 1) * chunksize_… 134 libxsmm_barrier_init(handle->barrier, (int)ltid); 161 if (ltid == 0) reformat_start = _rdtsc(); 190 libxsmm_barrier_wait(handle->barrier, (int)ltid); 192 if (ltid == 0) { [all …]
|
H A D | libxsmm_dnn_rnncell_st_lstm_fwd_nc_kcck_diffused_bf16.tpl.c | 46 if (ltid == 0) { 61 if (ltid == 0) { 76 if (ltid == 0) { 92 if (ltid == 0) { 122 if (ltid == 0) { 135 if (ltid == 0) { 148 if (ltid == 0) { 161 if (ltid == 0) { 169 if (ltid == 0) { 208 if (ltid == 0) { [all …]
|
H A D | libxsmm_dnn_rnncell_st_lstm_fwd_nc_kcck_fused.tpl.c | 23 if (ltid == 0) gemm_start = _rdtsc(); 35 if (ltid == 0) { 59 if (ltid == 0) { 78 if (ltid == 0) { 102 if (ltid == 0) { 121 if (ltid == 0) { 145 if (ltid == 0) { 164 if (ltid == 0) { 188 if (ltid == 0) { 196 if (ltid == 0) { [all …]
|
H A D | libxsmm_dnn_rnncell_st_lstm_fwd_nc_kcck_diffused.tpl.c | 23 if (ltid == 0) gemm_start = _rdtsc(); 35 if (ltid == 0) { 55 if (ltid == 0) { 75 if (ltid == 0) { 95 if (ltid == 0) { 132 if (ltid == 0) { 157 if (ltid == 0) { 182 if (ltid == 0) { 206 if (ltid == 0) { 214 if (ltid == 0) { [all …]
|
H A D | libxsmm_dnn_optimizer_sgd_st_generic.tpl.c | 21 const int ltid = tid - start_thread; variable 28 const int thr_begin = (ltid * chunksize < work) ? (ltid * chunksize) : work; 29 const int thr_end = ((ltid + 1) * chunksize < work) ? ((ltid + 1) * chunksize) : work; 38 libxsmm_barrier_init( handle->barrier, ltid ); 90 libxsmm_barrier_wait( handle->barrier, ltid );
|
H A D | libxsmm_dnn_fusedgroupnorm_st_fwd_custom_f32_bf16_c16_avx512.tpl.c | 48 const int ltid = tid - start_thread; variable 54 const int thr_begin = (ltid * chunksize < work) ? (ltid * chunksize) : work; 55 const int thr_end = ((ltid + 1) * chunksize < work) ? ((ltid + 1) * chunksize) : work; 62 const int thr_begin2 = (ltid * chunksize2 < work2) ? (ltid * chunksize2) : work2; 63 const int thr_end2 = ((ltid + 1) * chunksize2 < work2) ? ((ltid + 1) * chunksize2) : work2; 96 libxsmm_barrier_init(handle->barrier, ltid); 124 libxsmm_barrier_wait(handle->barrier, ltid); 169 libxsmm_barrier_wait(handle->barrier, ltid); 226 libxsmm_barrier_wait(handle->barrier, ltid);
|
H A D | libxsmm_dnn_convolve_st_bwd_custom_custom_fallback_generic.tpl.c | 14 const int ltid = tid - start_thread; variable 21 const int thr_begin = (ltid * chunksize < work) ? (ltid * chunksize) : work; 22 const int thr_end = ((ltid + 1) * chunksize < work) ? ((ltid + 1) * chunksize) : work; 29 const int transpose_thr_begin = (ltid * transpose_chunksize < transpose_work) ? (ltid * transpose_c… 30 const int transpose_thr_end = ((ltid + 1) * transpose_chunksize < transpose_work) ? ((ltid + 1) * t… 45 …put_type*)((char*)handle->scratch + handle->bwd_packing_padding_scratch_offset) + ltid * size_tls1; 49 libxsmm_barrier_init(handle->barrier, ltid); 72 libxsmm_barrier_wait(handle->barrier, ltid); 177 libxsmm_barrier_wait(handle->barrier, ltid);
|
/dports/math/libxsmm/libxsmm-1.16.3/src/ |
H A D | libxsmm_dnn_elementwise.c | 29 const libxsmm_blasint thr_begin = (ltid * chunksize < size) ? (ltid * chunksize) : size; in libxsmm_internal_matrix_zero() 45 const libxsmm_blasint thr_begin = (ltid * chunksize < size) ? (ltid * chunksize) : size; in libxsmm_internal_matrix_add() 61 const libxsmm_blasint thr_begin = (ltid * chunksize < size) ? (ltid * chunksize) : size; in libxsmm_internal_matrix_eltwise_mult() 77 const libxsmm_blasint thr_begin = (ltid * chunksize < size) ? (ltid * chunksize) : size; in libxsmm_internal_matrix_sigmoid() 94 const libxsmm_blasint thr_begin = (ltid * chunksize < size) ? (ltid * chunksize) : size; in libxsmm_internal_matrix_tanh() 110 const libxsmm_blasint thr_begin = (ltid * chunksize < size) ? (ltid * chunksize) : size; in libxsmm_internal_matrix_relu() 126 const libxsmm_blasint thr_begin = (ltid * chunksize < size) ? (ltid * chunksize) : size; in libxsmm_internal_matrix_sigmoid_inverse() 263 const libxsmm_blasint thr_begin = (ltid * chunksize < m) ? (ltid * chunksize) : m; in libxsmm_internal_matrix_1D_2D() 296 if (ltid == 0) { in libxsmm_internal_recursive_step() 305 if (ltid == 0) { in libxsmm_internal_recursive_step() [all …]
|
/dports/math/libxsmm/libxsmm-1.16.3/samples/deeplearning/gxm/src/ |
H A D | Solver.cpp | 60 int tb = (ltid*jobs < len) ? ltid*jobs : len; in convert_bf16_f32() 61 int te = ((ltid+1)*jobs < len) ? (ltid+1)*jobs : len; in convert_bf16_f32() 133 int tb = (ltid * jobs < sn) ? (ltid * jobs) : sn; in applyUpdate() 134 int te = (ltid + 1)*jobs < sn ? (ltid + 1)*jobs : sn; in applyUpdate() 163 int tb = (ltid * jobs < sn) ? (ltid * jobs) : sn; in applyUpdate() 193 int tb = (ltid * jobs < sn) ? (ltid * jobs) : sn; in applyUpdate() 234 int tb = (ltid * jobs < sn) ? (ltid * jobs) : sn; in applyUpdate() 272 int tb = (ltid * jobs < sn) ? (ltid * jobs) : sn; in applyUpdate() 305 int tb = (ltid * jobs < sn) ? (ltid * jobs) : sn; in applyUpdate() 377 int tb = (ltid * jobs < sn) ? (ltid * jobs) : sn; in applyUpdate() [all …]
|
H A D | reduce_weight_grads.c | 5 int ltid = tid - n*ntps; variable 6 int tb = (ltid * jpt < jn) ? ltid*jpt : jn; 7 int te = ((ltid+1)*jpt < jn) ? (ltid+1)*jpt : jn;
|
/dports/net/openldap24-server/openldap-2.4.59/servers/slapd/back-bdb/ |
H A D | delete.c | 37 DB_TXN *ltid = NULL, *lt2; in bdb_delete() local 124 rs->sr_err = TXN_ABORT( ltid ); in bdb_delete() 125 ltid = NULL; in bdb_delete() 147 ltid->id(ltid), 0, 0 ); in bdb_delete() 159 opinfo.boi_txn = ltid; in bdb_delete() 513 bdb_last_id( op->o_bd, ltid ); in bdb_delete() 523 ltid = NULL; in bdb_delete() 538 rs->sr_err = TXN_COMMIT( ltid, 0 ); in bdb_delete() 540 ltid = NULL; in bdb_delete() 585 if( ltid != NULL ) { in bdb_delete() [all …]
|
/dports/net/openldap24-client/openldap-2.4.59/servers/slapd/back-bdb/ |
H A D | delete.c | 37 DB_TXN *ltid = NULL, *lt2; in bdb_delete() local 124 rs->sr_err = TXN_ABORT( ltid ); in bdb_delete() 125 ltid = NULL; in bdb_delete() 147 ltid->id(ltid), 0, 0 ); in bdb_delete() 159 opinfo.boi_txn = ltid; in bdb_delete() 513 bdb_last_id( op->o_bd, ltid ); in bdb_delete() 523 ltid = NULL; in bdb_delete() 538 rs->sr_err = TXN_COMMIT( ltid, 0 ); in bdb_delete() 540 ltid = NULL; in bdb_delete() 585 if( ltid != NULL ) { in bdb_delete() [all …]
|