Files
XCEngine/engine/third_party/physx/source/gpucommon/src/PxgCudaBuffer.cpp

165 lines
5.6 KiB
C++

// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions
// are met:
// * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
// * Redistributions in binary form must reproduce the above copyright
// notice, this list of conditions and the following disclaimer in the
// documentation and/or other materials provided with the distribution.
// * Neither the name of NVIDIA CORPORATION nor the names of its
// contributors may be used to endorse or promote products derived
// from this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ''AS IS'' AND ANY
// EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
// PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
// CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
// EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
// OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
//
// Copyright (c) 2008-2025 NVIDIA Corporation. All rights reserved.
// Copyright (c) 2004-2008 AGEIA Technologies, Inc. All rights reserved.
// Copyright (c) 2001-2004 NovodeX AG. All rights reserved.
#include "PxgCudaBuffer.h"
#include "foundation/PxMath.h"
#include "foundation/PxAssert.h"
#include "cudamanager/PxCudaContext.h"
#include "PxPhysXGpu.h"
#include "PxsKernelWrangler.h"
#include "common/PxPhysXCommonConfig.h"
#include "PxgMemoryManager.h"
#define MEMCHECK_SUPPORT 0
using namespace physx;
void PxgCudaBuffer::allocate(const PxU64 size, const char* filename, PxI32 line)
{
PX_ASSERT(mHeapMemoryAllocator);
if (mSize < size)
{
if (mSize > 0 && mPtr)
{
#if MEMCHECK_SUPPORT
PX_UNUSED(filename);
PX_UNUSED(line);
PxgCudaAllocatorCallbackBase* alloc = reinterpret_cast<PxgCudaAllocatorCallbackBase*>(mHeapMemoryAllocator->getAllocator());
PxU8* ptr = reinterpret_cast<PxU8*>(mPtr);
alloc->mContextManager->freeDeviceBuffer(ptr);
mPtr = NULL;
#else
mHeapMemoryAllocator->deallocate(reinterpret_cast<void*>(mPtr));
#endif
}
//Allocate either double current size or the requested size, depending on which is larger
mSize = PxMax(size, mSize * 2);
#if MEMCHECK_SUPPORT
PxgCudaAllocatorCallbackBase* alloc = reinterpret_cast<PxgCudaAllocatorCallbackBase*>(mHeapMemoryAllocator->getAllocator());
mPtr = CUdeviceptr(alloc->mContextManager->allocDeviceBuffer<PxU8>(PxU32(mSize)));
PX_ASSERT(mPtr);
#else
mPtr = reinterpret_cast<CUdeviceptr>(mHeapMemoryAllocator->allocate(mSize, mStatGroup, filename, line));
#endif
#if PX_STOMP_ALLOCATED_MEMORY
if (mPtr)
{
PxgCudaAllocatorCallbackBase* alloc = reinterpret_cast<PxgCudaAllocatorCallbackBase*>(mHeapMemoryAllocator->getAllocator());
PxCudaContextManager* ccm = alloc->mContextManager;
if (ccm)
{
PxScopedCudaLock scl(*ccm);
CUresult result = ccm->getCudaContext()->memsetD8(mPtr, static_cast<unsigned char>(0xcd), mSize);
if (result != 0)
PX_ASSERT(result == 0);
}
else
{
PxGetFoundation().error(physx::PxErrorCode::eDEBUG_WARNING, PX_FL,
"Not possible to stomp PxgCudaBufferMemory because not cuda context manager is available.");
}
}
#endif
}
}
void PxgCudaBuffer::allocateCopyOldDataAsync(const PxU64 size, PxCudaContext* cudaContext, CUstream stream, const char* filename, PxI32 line)
{
PX_ASSERT(mHeapMemoryAllocator);
PxU64 oldSize = mSize;
//Allocate either double current size or the requested size, depending on which is larger
mSize = (oldSize < size) ? PxMax(size, mSize * 2) : mSize;
if (oldSize < size)
{
CUdeviceptr oldPtr = mPtr;
#if MEMCHECK_SUPPORT
PX_UNUSED(filename);
PX_UNUSED(line);
PxgCudaAllocatorCallbackBase* alloc = reinterpret_cast<PxgCudaAllocatorCallbackBase*>(mHeapMemoryAllocator->getAllocator());
mPtr = CUdeviceptr(alloc->mContextManager->allocDeviceBuffer<PxU8>(PxU32(mSize)));
PX_ASSERT(mPtr);
#else
mPtr = reinterpret_cast<CUdeviceptr>(mHeapMemoryAllocator->allocate(mSize, mStatGroup, filename, line));
#endif
if (oldSize > 0 && oldPtr)
{
cudaContext->memcpyDtoDAsync(mPtr, oldPtr, oldSize, stream);
//Defer deletion. This makes sure nothing else gets this memory until after the memcopy has completed
#if MEMCHECK_SUPPORT
//Since MEMCHECK_SUPPORT is only active for invalid memory access debugging, let it leak for now
#else
mHeapMemoryAllocator->deallocateDeferred(reinterpret_cast<void*>(oldPtr));
#endif
}
}
}
void PxgCudaBuffer::deallocate()
{
PX_ASSERT(mHeapMemoryAllocator);
if (mSize && mPtr)
{
#if MEMCHECK_SUPPORT
PxgCudaAllocatorCallbackBase* alloc = reinterpret_cast<PxgCudaAllocatorCallbackBase*>(mHeapMemoryAllocator->getAllocator());
PxU8* ptr = reinterpret_cast<PxU8*>(mPtr);
alloc->mContextManager->freeDeviceBuffer(ptr);
#else
mHeapMemoryAllocator->deallocate(reinterpret_cast<void*>(mPtr));
#endif
mPtr = 0;
mSize = 0;
}
}
void PxgCudaBuffer::deallocateDeferred()
{
#if MEMCHECK_SUPPORT
//Since MEMCHECK_SUPPORT is only active for invalid memory access debugging, let it leak for now
#else
PX_ASSERT(mHeapMemoryAllocator);
if (mSize && mPtr)
mHeapMemoryAllocator->deallocateDeferred(reinterpret_cast<void*>(mPtr));
#endif
}
PxgCudaBuffer::~PxgCudaBuffer()
{
deallocate();
}