/dports/math/gemmlowp/gemmlowp-dc69acd/meta/ |
H A D | multi_thread_gemm.h | 29 std::uint8_t* PrepareGemmTask(const Params& params, int kernel_m, int kernel_n, in PrepareGemmTask() argument 53 task, kernel_m, kernel_n, kernel_k); in PrepareGemmTask() 58 int kernel_m, int kernel_n, int kernel_k, in PrepareGemmTasks() argument 85 PrepareGemmTask<Executor, Params>(params, kernel_m, kernel_n, kernel_k, in PrepareGemmTasks() 92 params, kernel_m, kernel_n, kernel_k, scratch, 0, params.m, in PrepareGemmTasks() 104 template <typename Executor, typename Params, int kernel_m, int kernel_n, 110 Gemm<Executor, Params, kernel_m, kernel_n, kernel_k>(params); in Run() 119 int kernel_m, int kernel_n, int kernel_k> 122 typedef internal::GemmTaskRunner<Executor, Params, kernel_m, kernel_n, in MultiThreadGemm() 128 context, params, kernel_m, kernel_n, kernel_k, &task_params)) { in MultiThreadGemm() [all …]
|
H A D | single_thread_gemm.h | 24 template <typename Executor, typename Params, int kernel_m, int kernel_n, 31 static int EstimateScratchSize(const P& params, int kernel_m, int kernel_n, in EstimateScratchSize() argument 36 const int rhs_chunks = ((params.n + kernel_n - 1) / kernel_n); in EstimateScratchSize() 40 params.right_stream, kernel_n, kernel_k); in EstimateScratchSize() 220 static int EstimateScratchSize(const P& params, int kernel_m, int kernel_n, in EstimateScratchSize() argument 229 params.right_stream, kernel_n, kernel_k); in EstimateScratchSize() 441 static int EstimateScratchSize(const P& params, int kernel_m, int kernel_n, in EstimateScratchSize() argument 490 static int EstimateScratchSize(const P& params, int kernel_m, int kernel_n, in EstimateScratchSize() argument 676 template <typename Executor, typename Params, int kernel_m, int kernel_n, 679 internal::Dispatch3DStage1<Executor, Params, kernel_m, kernel_n, kernel_k, [all …]
|
H A D | base.h | 101 typename OutputStream, int kernel_m, int kernel_n, int pack_size>
|
/dports/math/gemmlowp/gemmlowp-dc69acd/meta/generators/ |
H A D | quantized_mul_kernels_common.py | 222 kernel_n): argument 435 for col in range(kernel_n): 436 index = row * kernel_n + col 439 for i in range(kernel_m * kernel_n): 452 assert kernel_n in [5, 6, 7, 8] 461 leftover = kernel_n - 4 501 if kernel_m is 3 and kernel_n is 3: 504 elif kernel_m is 2 and kernel_n is 4: 507 elif kernel_m is 1 and kernel_n is 8: 510 elif kernel_m is 1 and kernel_n > 4: [all …]
|
H A D | common.py | 95 def SpecializeMulKernel(self, in_type, out_type, kernel_m, kernel_n, argument 100 kernel_n, pack_size 112 self.EmitMultiply(in_type, out_type, kernel_m, kernel_n, pack_size)
|
/dports/graphics/gegl/gegl-0.4.34/gegl/opencl/ |
H A D | gegl-cl-init.c | 831 guint kernel_n = 0; in gegl_cl_compile_and_build() local 833 while (kernel_name[++kernel_n] != NULL); in gegl_cl_compile_and_build() 882 cl_data->kernel = g_new (cl_kernel, kernel_n); in gegl_cl_compile_and_build() 883 cl_data->work_group_size = g_new (size_t, kernel_n); in gegl_cl_compile_and_build() 885 for (i = 0; i < kernel_n; i++) in gegl_cl_compile_and_build()
|
/dports/math/py-arviz/arviz-0.11.4/arviz/stats/ |
H A D | density_utils.py | 705 kernel_n = int(bw * 2 * np.pi) 706 if kernel_n == 0: 707 kernel_n = 1 709 kernel = gaussian(kernel_n, bw)
|