/* * Copyright (C) 2018-2021 Intel Corporation * * SPDX-License-Identifier: MIT * */ #pragma once #include "shared/source/helpers/basic_math.h" #include "shared/source/helpers/constants.h" #include "opencl/extensions/public/cl_ext_private.h" #include "opencl/source/context/context_type.h" #include "opencl/source/mem_obj/mem_obj.h" #include "igfxfmid.h" #include "memory_properties_flags.h" #include namespace NEO { class Buffer; class ClDevice; class Device; class MemoryManager; struct EncodeSurfaceStateArgs; using BufferCreatFunc = Buffer *(*)(Context *context, MemoryProperties memoryProperties, cl_mem_flags flags, cl_mem_flags_intel flagsIntel, size_t size, void *memoryStorage, void *hostPtr, MultiGraphicsAllocation multiGraphicsAllocation, bool zeroCopy, bool isHostPtrSVM, bool isImageRedescribed); struct BufferFactoryFuncs { BufferCreatFunc createBufferFunction; }; extern BufferFactoryFuncs bufferFactory[IGFX_MAX_CORE]; namespace BufferFunctions { using ValidateInputAndCreateBufferFunc = std::function; extern ValidateInputAndCreateBufferFunc validateInputAndCreateBuffer; } // namespace BufferFunctions class Buffer : public MemObj { public: constexpr static size_t maxBufferSizeForReadWriteOnCpu = 10 * MB; constexpr static cl_ulong maskMagic = 0xFFFFFFFFFFFFFFFFLL; constexpr static cl_ulong objectMagic = MemObj::objectMagic | 0x02; bool forceDisallowCPUCopy = false; ~Buffer() override; static cl_mem validateInputAndCreateBuffer(cl_context context, const cl_mem_properties *properties, cl_mem_flags flags, cl_mem_flags_intel flagsIntel, size_t size, void *hostPtr, cl_int &retVal); static Buffer *create(Context *context, cl_mem_flags flags, size_t size, void *hostPtr, cl_int &errcodeRet); static Buffer *create(Context *context, MemoryProperties properties, cl_mem_flags flags, cl_mem_flags_intel flagsIntel, size_t size, void *hostPtr, cl_int &errcodeRet); static Buffer *createSharedBuffer(Context *context, cl_mem_flags flags, SharingHandler *sharingHandler, MultiGraphicsAllocation multiGraphicsAllocation); static Buffer *createBufferHw(Context *context, MemoryProperties memoryProperties, cl_mem_flags flags, cl_mem_flags_intel flagsIntel, size_t size, void *memoryStorage, void *hostPtr, MultiGraphicsAllocation multiGraphicsAllocation, bool zeroCopy, bool isHostPtrSVM, bool isImageRedescribed); static Buffer *createBufferHwFromDevice(const Device *device, cl_mem_flags flags, cl_mem_flags_intel flagsIntel, size_t size, void *memoryStorage, void *hostPtr, MultiGraphicsAllocation multiGraphicsAllocation, size_t offset, bool zeroCopy, bool isHostPtrSVM, bool isImageRedescribed); Buffer *createSubBuffer(cl_mem_flags flags, cl_mem_flags_intel flagsIntel, const cl_buffer_region *region, cl_int &errcodeRet); static void setSurfaceState(const Device *device, void *surfaceState, bool forceNonAuxMode, bool disableL3, size_t svmSize, void *svmPtr, size_t offset, GraphicsAllocation *gfxAlloc, cl_mem_flags flags, cl_mem_flags_intel flagsIntel, bool useGlobalAtomics, bool areMultipleSubDevicesInContext); static void provideCompressionHint(bool compressionEnabled, Context *context, Buffer *buffer); BufferCreatFunc createFunction = nullptr; bool isSubBuffer(); bool isValidSubBufferOffset(size_t offset); uint64_t setArgStateless(void *memory, uint32_t patchSize, uint32_t rootDeviceIndex, bool set32BitAddressing); virtual void setArgStateful(void *memory, bool forceNonAuxMode, bool disableL3, bool alignSizeForAuxTranslation, bool isReadOnly, const Device &device, bool useGlobalAtomics, bool areMultipleSubDevicesInContext) = 0; bool bufferRectPitchSet(const size_t *bufferOrigin, const size_t *region, size_t &bufferRowPitch, size_t &bufferSlicePitch, size_t &hostRowPitch, size_t &hostSlicePitch, bool isSrcBuffer); static size_t calculateHostPtrSize(const size_t *origin, const size_t *region, size_t rowPitch, size_t slicePitch); void transferDataToHostPtr(MemObjSizeArray ©Size, MemObjOffsetArray ©Offset) override; void transferDataFromHostPtr(MemObjSizeArray ©Size, MemObjOffsetArray ©Offset) override; bool isReadWriteOnCpuAllowed(const Device &device); bool isReadWriteOnCpuPreferred(void *ptr, size_t size, const Device &device); uint32_t getMocsValue(bool disableL3Cache, bool isReadOnlyArgument, uint32_t rootDeviceIndex) const; uint32_t getSurfaceSize(bool alignSizeForAuxTranslation, uint32_t rootDeviceIndex) const; uint64_t getBufferAddress(uint32_t rootDeviceIndex) const; bool isCompressed(uint32_t rootDeviceIndex) const; protected: Buffer(Context *context, MemoryProperties memoryProperties, cl_mem_flags flags, cl_mem_flags_intel flagsIntel, size_t size, void *memoryStorage, void *hostPtr, MultiGraphicsAllocation multiGraphicsAllocation, bool zeroCopy, bool isHostPtrSVM, bool isObjectRedescribed); Buffer(); static void checkMemory(MemoryProperties memoryProperties, size_t size, void *hostPtr, cl_int &errcodeRet, bool &isZeroCopy, bool ©MemoryFromHostPtr, MemoryManager *memMngr, uint32_t rootDeviceIndex, bool forceCopyHostPtr); static GraphicsAllocation::AllocationType getGraphicsAllocationTypeAndCompressionPreference(const MemoryProperties &properties, Context &context, bool &compressionEnabled, bool localMemoryEnabled); static bool isReadOnlyMemoryPermittedByFlags(const MemoryProperties &properties); void transferData(void *dst, void *src, size_t copySize, size_t copyOffset); void appendSurfaceStateArgs(EncodeSurfaceStateArgs &args); }; template class BufferHw : public Buffer { public: BufferHw(Context *context, MemoryProperties memoryProperties, cl_mem_flags flags, cl_mem_flags_intel flagsIntel, size_t size, void *memoryStorage, void *hostPtr, MultiGraphicsAllocation multiGraphicsAllocation, bool zeroCopy, bool isHostPtrSVM, bool isObjectRedescribed) : Buffer(context, memoryProperties, flags, flagsIntel, size, memoryStorage, hostPtr, std::move(multiGraphicsAllocation), zeroCopy, isHostPtrSVM, isObjectRedescribed) {} void setArgStateful(void *memory, bool forceNonAuxMode, bool disableL3, bool alignSizeForAuxTranslation, bool isReadOnlyArgument, const Device &device, bool useGlobalAtomics, bool areMultipleSubDevicesInContext) override; static Buffer *create(Context *context, MemoryProperties memoryProperties, cl_mem_flags flags, cl_mem_flags_intel flagsIntel, size_t size, void *memoryStorage, void *hostPtr, MultiGraphicsAllocation multiGraphicsAllocation, bool zeroCopy, bool isHostPtrSVM, bool isObjectRedescribed) { auto buffer = new BufferHw(context, memoryProperties, flags, flagsIntel, size, memoryStorage, hostPtr, std::move(multiGraphicsAllocation), zeroCopy, isHostPtrSVM, isObjectRedescribed); buffer->surfaceType = SURFACE_STATE::SURFACE_TYPE_SURFTYPE_1D; return buffer; } typedef typename GfxFamily::RENDER_SURFACE_STATE SURFACE_STATE; typename SURFACE_STATE::SURFACE_TYPE surfaceType; }; } // namespace NEO