/dports/math/libxsmm/libxsmm-1.16.3/src/template/ |
H A D | libxsmm_dnn_rnncell_st_lstm_bwdupd_nc_kcck_core_bf16.tpl.c | 164 …dout_ptr = (j > 0) ? (float*) &LIBXSMM_VLA_ACCESS(2, dout, in, ik, K) : (float*) &LIBXSMM_VLA_ACCE… 166 if (KB == 0) libxsmm_internal_matrix_zero_ld( bk, bn, K, dout_ptr); 170 dout_ptr, &blocks); 174 dout_ptr, &blocks); 178 dout_ptr, &blocks); 182 dout_ptr, &blocks); 186 … NATIVE_MATRIX_RNE_CVT_FP32_BFP16_LD(bk, bn, K, dout_ptr, &LIBXSMM_VLA_ACCESS(2, dhp, in, ik, K));
|
H A D | libxsmm_dnn_rnncell_st_lstm_bwdupd_nc_kcck_core.tpl.c | 239 …dout_ptr = (j > 0) ? (element_output_type*) &LIBXSMM_VLA_ACCESS(2, dout, in, ik, K) : (element_out… 241 if (KB == 0) libxsmm_internal_matrix_zero_ld( bk, bn, K, dout_ptr); 249 batchreduce_kerneld(A_array, B_array, dout_ptr, &blocks); 256 batchreduce_kerneld(A_array, B_array, dout_ptr, &blocks); 263 batchreduce_kerneld(A_array, B_array, dout_ptr, &blocks); 270 batchreduce_kerneld(A_array, B_array, dout_ptr, &blocks);
|
H A D | libxsmm_dnn_rnncell_st_gru_bwdupd_nc_kcck.tpl.c | 114 element_output_type *dout_ptr = NULL; variable 435 …dout_ptr = (j > 0) ? (element_output_type*) &LIBXSMM_VLA_ACCESS(2, dout, in, ik, K) : (element_out… 440 …, K, &LIBXSMM_VLA_ACCESS(2, t1, in, ik, K), &LIBXSMM_VLA_ACCESS(2, t2, in, ik, K), dout_ptr ); 450 batchreduce_kerneld(A_array, B_array, dout_ptr, &blocks); 457 batchreduce_kerneld(A_array, B_array, dout_ptr, &blocks);
|
H A D | libxsmm_dnn_rnncell_st_gru_bwdupd_nc_ck_generic.tpl.c | 129 element_output_type *dout_ptr = NULL; variable 415 …dout_ptr = (j > 0) ? (element_output_type*) &LIBXSMM_VLA_ACCESS(2, dout, in, ik, K) : (element_out… 420 …, K, &LIBXSMM_VLA_ACCESS(2, t1, in, ik, K), &LIBXSMM_VLA_ACCESS(2, t2, in, ik, K), dout_ptr ); 430 batchreduce_kerneld(A_array, B_array, dout_ptr, &blocks); 437 batchreduce_kerneld(A_array, B_array, dout_ptr, &blocks);
|
H A D | libxsmm_dnn_rnncell_st_lstm_bwdupd_nc_kcck.tpl.c | 144 element_output_type *dout_ptr = NULL; variable
|
H A D | libxsmm_dnn_rnncell_st_lstm_bwdupd_nc_ck_generic.tpl.c | 157 element_output_type *dout_ptr = NULL; variable
|
H A D | libxsmm_dnn_rnncell_st_lstm_bwdupd_nc_ck_generic_bf16.tpl.c | 174 float *dout_ptr = NULL; variable
|
H A D | libxsmm_dnn_rnncell_st_lstm_bwdupd_nc_kcck_bf16.tpl.c | 179 float *dout_ptr = NULL; variable
|
/dports/math/libxsmm/libxsmm-1.16.3/samples/deeplearning/gxm/src/ |
H A D | ConvXSMM.cpp | 495 dout_ptr[0] = deloutp->getBuffer(); in backPropagate() 497 dout_ptr[n] = dout_ptr[n-1] + imoff; in backPropagate() 530 libxsmm_deloutput[n] = libxsmm_dnn_link_tensor( libxsmm_layout, dout_ptr[n], &status ); in backPropagate() 551 …check_physical_pad( nname.c_str(), (float*)dout_ptr[0], conv_desc.N, nBOfm, ofh, ofw, VLEN, oph, o… in backPropagate() 553 …check_physical_pad( nname.c_str(), (libxsmm_bfloat16*)dout_ptr[0], conv_desc.N, nBOfm, ofh, ofw, V… in backPropagate() 608 …check_physical_pad( nname.c_str(), (float*)dout_ptr[0], conv_desc.N, nBOfm, ofh, ofw, VLEN, oph, o… in backPropagate() 610 …check_physical_pad( nname.c_str(), (libxsmm_bfloat16*)dout_ptr[0], conv_desc.N, nBOfm, ofh, ofw, V… in backPropagate() 657 dout_ptr[0] = deloutp->getBuffer(); in weightUpdate() 659 dout_ptr[n] = dout_ptr[n-1] + imoff; in weightUpdate() 688 libxsmm_deloutput[n] = libxsmm_dnn_link_tensor(libxsmm_layout, dout_ptr[n], &status ); in weightUpdate()
|
/dports/math/libxsmm/libxsmm-1.16.3/samples/deeplearning/gxm/include/ |
H A D | ConvXSMM.hpp | 53 void *din_ptr[NUM_NUMA_NODES] = {NULL}, *dout_ptr[NUM_NUMA_NODES] = {NULL}; member in ConvXSMM
|