Home
last modified time | relevance | path

Searched refs:CUDABackend (Results 1 – 23 of 23) sorted by relevance

/dports/misc/mnn/MNN-1.2.0/source/backend/cuda/core/
H A DCUDABackend.cpp21 std::map<OpType, CUDABackend::Creator*>* gCreator() { in gCreator()
67 return new CUDABackend(mBufferPool, mCUDARuntime); in onCreate()
74 CUDABackend::CUDABackend(std::shared_ptr<BufferAllocator> st, in CUDABackend() function in MNN::CUDA::CUDABackend
82 CUDABackend::~CUDABackend() { in ~CUDABackend()
88 CUDARuntime* CUDABackend::getCUDARuntime() { in getCUDARuntime()
135 bool CUDABackend::onClearBuffer() { in onClearBuffer()
139 size_t CUDABackend::realSize(const Tensor* tensor) { in realSize()
192 void CUDABackend::onResizeBegin() { in onResizeBegin()
195 void CUDABackend::onResizeEnd() { in onResizeEnd()
198 void CUDABackend::onExecuteBegin() const { in onExecuteBegin()
[all …]
H A DCUDABackend.hpp42 class CUDABackend final : public Backend { class
44 CUDABackend(std::shared_ptr<BufferAllocator> st, std::shared_ptr<CUDARuntime> rt);
45 ~CUDABackend();
92 CUDABackend::addCreator(type, t); in CUDACreatorRegister()
98 class TypedCreator : public CUDABackend::Creator {
/dports/misc/mnn/MNN-1.2.0/source/backend/cuda/execution/
H A DUnaryExecution.cu29 auto cudaBackend = static_cast<CUDABackend*>(backend); in UnaryExecution()
35 mCount = CUDABackend::realSize(inputs[0]); in onResize()
68 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
69 auto count = CUDABackend::realSize(inputs[0]); in onExecute()
98 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
99 auto count = CUDABackend::realSize(inputs[0]); in onExecute()
146 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
147 auto count = CUDABackend::realSize(inputs[0]); in onExecute()
186 class UnaryCreator : public CUDABackend::Creator {
H A DBinaryExecution.cu42 auto count = CUDABackend::realSize(outputs[0]); in onExecute()
43 auto inputS0 = CUDABackend::realSize(inputs[0]); in onExecute()
44 auto inputS1 = CUDABackend::realSize(inputs[1]); in onExecute()
47 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
65 class BinaryCreator : public CUDABackend::Creator {
H A DConvDepthWiseExecution.cu20 auto pool = static_cast<CUDABackend*>(bn)->getStaticBufferPool(); in ConvDepthWiseExecution()
44 auto pool = static_cast<CUDABackend*>(backend())->getStaticBufferPool(); in ~ConvDepthWiseExecution()
76 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onResize()
151 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
257 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onResize()
264 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
279 class ConvDepthWiseExecutionCreator : public CUDABackend::Creator {
H A DRasterExecution.cpp36 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
59 class RasterCreator : public CUDABackend::Creator {
H A DSoftmaxExecution.cu7 auto runtime = static_cast<CUDABackend*>(backend)->getCUDARuntime(); in SoftmaxExecution()
62 class SoftmaxCreator : public CUDABackend::Creator {
H A DArgMaxExecution.cu60 auto runtime = static_cast<CUDABackend *>(backend())->getCUDARuntime(); in onExecute()
72 class ArgMaxCreator : public CUDABackend::Creator {
H A DPReLUExecution.cu51 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
63 class PReLUCreator : public CUDABackend::Creator {
H A DMatMulExecution.cu37 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
91 class MatMulCreator : public CUDABackend::Creator {
H A DScaleExecution.cu69 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
81 class ScaleCreator : public CUDABackend::Creator {
H A DGatherV2Execution.cu58 auto runtime = static_cast<CUDABackend *>(backend())->getCUDARuntime(); in onExecute()
95 class GatherV2Creator : public CUDABackend::Creator {
H A DScatterNdExecution.cu76 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
93 class ScatterNdCreator : public CUDABackend::Creator {
H A DInterpExecution.cu79 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
96 class InterpCreator : public CUDABackend::Creator {
H A DPoolExecution.cu134 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
163 class PoolCreator : public CUDABackend::Creator {
H A DDeconvSingleInputExecution.cu68 auto runtime = static_cast<CUDABackend*>(backend)->getCUDARuntime(); in DeconvSingleInputExecution()
242 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
284 class CUDADeconvolutionCreator : public CUDABackend::Creator {
H A DConvSingleInputExecution.cu73 auto runtime = static_cast<CUDABackend*>(backend)->getCUDARuntime(); in ConvSingleInputExecution()
283 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
325 class CUDAConvolutionCreator : public CUDABackend::Creator {
H A DReductionExecution.cu97 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
159 class ReductionCreator : public CUDABackend::Creator {
H A DCUDALoop.cpp116 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
228 class LoopCreator : public CUDABackend::Creator {
H A DLayerNormExecution.cu311 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute()
340 class LayerNormCreator : public CUDABackend::Creator {
/dports/science/py-PyFR/pyfr-1.12.3/pyfr/backends/cuda/
H A D__init__.py3 from pyfr.backends.cuda.base import CUDABackend
H A Dbase.py9 class CUDABackend(BaseBackend): class
/dports/science/py-PyFR/pyfr-1.12.3/pyfr/backends/
H A D__init__.py4 from pyfr.backends.cuda import CUDABackend