diff --git a/src/Bullet3OpenCL/ParallelPrimitives/b3OpenCLArray.h b/src/Bullet3OpenCL/ParallelPrimitives/b3OpenCLArray.h index 36ecd6126..7497ba70d 100644 --- a/src/Bullet3OpenCL/ParallelPrimitives/b3OpenCLArray.h +++ b/src/Bullet3OpenCL/ParallelPrimitives/b3OpenCLArray.h @@ -7,8 +7,8 @@ template class b3OpenCLArray { - int m_size; - int m_capacity; + size_t m_size; + size_t m_capacity; cl_mem m_clBuffer; cl_context m_clContext; @@ -30,14 +30,14 @@ class b3OpenCLArray b3OpenCLArray& operator=(const b3OpenCLArray& src); - B3_FORCE_INLINE int allocSize(int size) + B3_FORCE_INLINE size_t allocSize(size_t size) { return (size ? size*2 : 1); } public: - b3OpenCLArray(cl_context ctx, cl_command_queue queue, int initialCapacity=0, bool allowGrowingCapacity=true) + b3OpenCLArray(cl_context ctx, cl_command_queue queue, size_t initialCapacity=0, bool allowGrowingCapacity=true) :m_size(0), m_capacity(0),m_clBuffer(0), m_clContext(ctx),m_commandQueue(queue), m_ownsMemory(true),m_allowGrowingCapacity(true) @@ -50,7 +50,7 @@ public: } ///this is an error-prone method with no error checking, be careful! - void setFromOpenCLBuffer(cl_mem buffer, int sizeInElements) + void setFromOpenCLBuffer(cl_mem buffer, size_t sizeInElements) { deallocate(); m_ownsMemory = false; @@ -81,18 +81,20 @@ public: m_capacity=0; } - B3_FORCE_INLINE void push_back(const T& _Val,bool waitForCompletion=true) + B3_FORCE_INLINE bool push_back(const T& _Val,bool waitForCompletion=true) { - int sz = size(); + bool result = true; + size_t sz = size(); if( sz == capacity() ) { - reserve( allocSize(size()) ); + result = reserve( allocSize(size()) ); } copyFromHostPointer(&_Val, 1, sz, waitForCompletion); m_size++; + return result; } - B3_FORCE_INLINE T forcedAt(int n) const + B3_FORCE_INLINE T forcedAt(size_t n) const { b3Assert(n>=0); b3Assert(n=0); b3Assert(n size()) { - reserve(newsize,copyOldContents); + result = reserve(newsize,copyOldContents); } //leave new data uninitialized (init in debug mode?) - //for (int i=curSize;i0); b3Assert(numElements<=m_size); - int srcOffsetBytes = sizeof(T)*firstElem; - int dstOffsetInBytes = sizeof(T)*dstOffsetInElems; + size_t srcOffsetBytes = sizeof(T)*firstElem; + size_t dstOffsetInBytes = sizeof(T)*dstOffsetInElems; status = clEnqueueCopyBuffer( m_commandQueue, m_clBuffer, destination, srcOffsetBytes, dstOffsetInBytes, sizeof(T)*numElements, 0, 0, 0 ); @@ -214,7 +228,7 @@ public: void copyFromHost(const b3AlignedObjectArray& srcArray, bool waitForCompletion=true) { - int newSize = srcArray.size(); + size_t newSize = srcArray.size(); bool copyOldContents = false; resize (newSize,copyOldContents); @@ -223,12 +237,12 @@ public: } - void copyFromHostPointer(const T* src, int numElems, int destFirstElem= 0, bool waitForCompletion=true) + void copyFromHostPointer(const T* src, size_t numElems, size_t destFirstElem= 0, bool waitForCompletion=true) { b3Assert(numElems+destFirstElem <= capacity()); cl_int status = 0; - int sizeInBytes=sizeof(T)*numElems; + size_t sizeInBytes=sizeof(T)*numElems; status = clEnqueueWriteBuffer( m_commandQueue, m_clBuffer, 0, sizeof(T)*destFirstElem, sizeInBytes, src, 0,0,0 ); b3Assert(status == CL_SUCCESS ); @@ -245,7 +259,7 @@ public: copyToHostPointer(&destArray[0], size(),0,waitForCompletion); } - void copyToHostPointer(T* destPtr, int numElem, int srcFirstElem=0, bool waitForCompletion=true) const + void copyToHostPointer(T* destPtr, size_t numElem, size_t srcFirstElem=0, bool waitForCompletion=true) const { b3Assert(numElem+srcFirstElem <= capacity()); @@ -260,7 +274,7 @@ public: void copyFromOpenCLArray(const b3OpenCLArray& src) { - int newSize = src.size(); + size_t newSize = src.size(); resize(newSize); if (size()) { diff --git a/src/Bullet3OpenCL/RigidBody/b3Config.h b/src/Bullet3OpenCL/RigidBody/b3Config.h index 2886f6a7c..1d46f8f17 100644 --- a/src/Bullet3OpenCL/RigidBody/b3Config.h +++ b/src/Bullet3OpenCL/RigidBody/b3Config.h @@ -19,22 +19,17 @@ struct b3Config int m_maxTriConvexPairCapacity; b3Config() -#ifdef __APPLE__ - :m_maxConvexBodies(32*1024), -#else - :m_maxConvexBodies(32*1024), -#endif - m_maxConvexShapes(81920), + :m_maxConvexBodies(128*1024), m_maxVerticesPerFace(64), - m_maxFacesPerShape(64), - m_maxConvexVertices(8192000), - m_maxConvexIndices(8192000), - m_maxConvexUniqueEdges(819200), - m_maxCompoundChildShapes(81920), - m_maxTriConvexPairCapacity(512*1024) - //m_maxTriConvexPairCapacity(256*1024) + m_maxFacesPerShape(12), + m_maxConvexVertices(8192), + m_maxConvexIndices(81920), + m_maxConvexUniqueEdges(8192), + m_maxCompoundChildShapes(8192), + m_maxTriConvexPairCapacity(256*1024) { - m_maxBroadphasePairs = 16*m_maxConvexBodies; + m_maxConvexShapes = m_maxConvexBodies; + m_maxBroadphasePairs = 8*m_maxConvexBodies; m_maxContactCapacity = m_maxBroadphasePairs; } }; diff --git a/test/OpenCL/BasicInitialize/main.cpp b/test/OpenCL/BasicInitialize/main.cpp index c85234125..5ead2bb9c 100644 --- a/test/OpenCL/BasicInitialize/main.cpp +++ b/test/OpenCL/BasicInitialize/main.cpp @@ -16,6 +16,8 @@ subject to the following restrictions: ///original author: Erwin Coumans #include "Bullet3OpenCL/Initialize/b3OpenCLUtils.h" +#include "Bullet3OpenCL/ParallelPrimitives/b3OpenCLArray.h" + #include cl_context g_cxMainContext; @@ -71,6 +73,27 @@ int main(int argc, char* argv[]) b3OpenCLDeviceInfo devInfo; b3OpenCLUtils::getDeviceInfo(dev,&devInfo); b3OpenCLUtils::printDeviceInfo(dev); + + + b3OpenCLArray memTester(g_cxMainContext,g_cqCommandQue,0,true); + int maxMem = 8192; + bool result=true; + for (size_t i=1;result;i++) + { + size_t numBytes = i*1024*1024; + result = memTester.resize(numBytes,false); + + if (result) + { + printf("allocated %d MB successfully\n",i); + } else + { + printf("allocated %d MB failed\n", i); + } + } + + + } clReleaseContext(context); @@ -101,6 +124,24 @@ int main(int argc, char* argv[]) oclCHECKERROR(ciErrNum, CL_SUCCESS); //normally you would create and execute kernels using this command queue + b3OpenCLArray memTester(g_cxMainContext,g_cqCommandQue,0,true); + int maxMem = 8192; + bool result=true; + for (size_t i=1;result;i++) + { + size_t numBytes = i*1024*1024; + result = memTester.resize(numBytes,false); + + if (result) + { + printf("allocated %d MB successfully\n",i); + } else + { + printf("allocated %d MB failed\n", i); + } + } + + clReleaseCommandQueue(g_cqCommandQue); }