/dports/misc/mnn/MNN-1.2.0/source/backend/cuda/core/ |
H A D | CUDABackend.cpp | 21 std::map<OpType, CUDABackend::Creator*>* gCreator() { in gCreator() 67 return new CUDABackend(mBufferPool, mCUDARuntime); in onCreate() 74 CUDABackend::CUDABackend(std::shared_ptr<BufferAllocator> st, in CUDABackend() function in MNN::CUDA::CUDABackend 82 CUDABackend::~CUDABackend() { in ~CUDABackend() 88 CUDARuntime* CUDABackend::getCUDARuntime() { in getCUDARuntime() 135 bool CUDABackend::onClearBuffer() { in onClearBuffer() 139 size_t CUDABackend::realSize(const Tensor* tensor) { in realSize() 192 void CUDABackend::onResizeBegin() { in onResizeBegin() 195 void CUDABackend::onResizeEnd() { in onResizeEnd() 198 void CUDABackend::onExecuteBegin() const { in onExecuteBegin() [all …]
|
H A D | CUDABackend.hpp | 42 class CUDABackend final : public Backend { class 44 CUDABackend(std::shared_ptr<BufferAllocator> st, std::shared_ptr<CUDARuntime> rt); 45 ~CUDABackend(); 92 CUDABackend::addCreator(type, t); in CUDACreatorRegister() 98 class TypedCreator : public CUDABackend::Creator {
|
/dports/misc/mnn/MNN-1.2.0/source/backend/cuda/execution/ |
H A D | UnaryExecution.cu | 29 auto cudaBackend = static_cast<CUDABackend*>(backend); in UnaryExecution() 35 mCount = CUDABackend::realSize(inputs[0]); in onResize() 68 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 69 auto count = CUDABackend::realSize(inputs[0]); in onExecute() 98 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 99 auto count = CUDABackend::realSize(inputs[0]); in onExecute() 146 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 147 auto count = CUDABackend::realSize(inputs[0]); in onExecute() 186 class UnaryCreator : public CUDABackend::Creator {
|
H A D | BinaryExecution.cu | 42 auto count = CUDABackend::realSize(outputs[0]); in onExecute() 43 auto inputS0 = CUDABackend::realSize(inputs[0]); in onExecute() 44 auto inputS1 = CUDABackend::realSize(inputs[1]); in onExecute() 47 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 65 class BinaryCreator : public CUDABackend::Creator {
|
H A D | ConvDepthWiseExecution.cu | 20 auto pool = static_cast<CUDABackend*>(bn)->getStaticBufferPool(); in ConvDepthWiseExecution() 44 auto pool = static_cast<CUDABackend*>(backend())->getStaticBufferPool(); in ~ConvDepthWiseExecution() 76 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onResize() 151 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 257 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onResize() 264 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 279 class ConvDepthWiseExecutionCreator : public CUDABackend::Creator {
|
H A D | RasterExecution.cpp | 36 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 59 class RasterCreator : public CUDABackend::Creator {
|
H A D | SoftmaxExecution.cu | 7 auto runtime = static_cast<CUDABackend*>(backend)->getCUDARuntime(); in SoftmaxExecution() 62 class SoftmaxCreator : public CUDABackend::Creator {
|
H A D | ArgMaxExecution.cu | 60 auto runtime = static_cast<CUDABackend *>(backend())->getCUDARuntime(); in onExecute() 72 class ArgMaxCreator : public CUDABackend::Creator {
|
H A D | PReLUExecution.cu | 51 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 63 class PReLUCreator : public CUDABackend::Creator {
|
H A D | MatMulExecution.cu | 37 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 91 class MatMulCreator : public CUDABackend::Creator {
|
H A D | ScaleExecution.cu | 69 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 81 class ScaleCreator : public CUDABackend::Creator {
|
H A D | GatherV2Execution.cu | 58 auto runtime = static_cast<CUDABackend *>(backend())->getCUDARuntime(); in onExecute() 95 class GatherV2Creator : public CUDABackend::Creator {
|
H A D | ScatterNdExecution.cu | 76 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 93 class ScatterNdCreator : public CUDABackend::Creator {
|
H A D | InterpExecution.cu | 79 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 96 class InterpCreator : public CUDABackend::Creator {
|
H A D | PoolExecution.cu | 134 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 163 class PoolCreator : public CUDABackend::Creator {
|
H A D | DeconvSingleInputExecution.cu | 68 auto runtime = static_cast<CUDABackend*>(backend)->getCUDARuntime(); in DeconvSingleInputExecution() 242 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 284 class CUDADeconvolutionCreator : public CUDABackend::Creator {
|
H A D | ConvSingleInputExecution.cu | 73 auto runtime = static_cast<CUDABackend*>(backend)->getCUDARuntime(); in ConvSingleInputExecution() 283 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 325 class CUDAConvolutionCreator : public CUDABackend::Creator {
|
H A D | ReductionExecution.cu | 97 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 159 class ReductionCreator : public CUDABackend::Creator {
|
H A D | CUDALoop.cpp | 116 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 228 class LoopCreator : public CUDABackend::Creator {
|
H A D | LayerNormExecution.cu | 311 auto runtime = static_cast<CUDABackend*>(backend())->getCUDARuntime(); in onExecute() 340 class LayerNormCreator : public CUDABackend::Creator {
|
/dports/science/py-PyFR/pyfr-1.12.3/pyfr/backends/cuda/ |
H A D | __init__.py | 3 from pyfr.backends.cuda.base import CUDABackend
|
H A D | base.py | 9 class CUDABackend(BaseBackend): class
|
/dports/science/py-PyFR/pyfr-1.12.3/pyfr/backends/ |
H A D | __init__.py | 4 from pyfr.backends.cuda import CUDABackend
|