Only disable fastScan in the radix sort on __APPLE__; this should improve Linux performance (previously Linux also went through the slower, non-fast-scan path).
This commit is contained in:
@@ -319,10 +319,10 @@ void b3RadixSort32CL::execute(b3OpenCLArray<b3SortData>& keyValuesInOut, int sor
|
|||||||
|
|
||||||
|
|
||||||
//fast prefix scan is not working properly on Mac OSX yet
|
//fast prefix scan is not working properly on Mac OSX yet
|
||||||
#ifdef _WIN32
|
#ifdef __APPLE__
|
||||||
bool fastScan=!m_deviceCPU;//only use fast scan on GPU
|
|
||||||
#else
|
|
||||||
bool fastScan=false;
|
bool fastScan=false;
|
||||||
|
#else
|
||||||
|
bool fastScan=!m_deviceCPU;//only use fast scan on GPU
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
if (fastScan)
|
if (fastScan)
|
||||||
@@ -653,11 +653,10 @@ void b3RadixSort32CL::execute(b3OpenCLArray<unsigned int>& keysInOut, int sortBi
|
|||||||
|
|
||||||
|
|
||||||
//fast prefix scan is not working properly on Mac OSX yet
|
//fast prefix scan is not working properly on Mac OSX yet
|
||||||
#ifdef _WIN32
|
#ifdef __APPLE__
|
||||||
bool fastScan=!m_deviceCPU;
|
|
||||||
|
|
||||||
#else
|
|
||||||
bool fastScan=false;
|
bool fastScan=false;
|
||||||
|
#else
|
||||||
|
bool fastScan=!m_deviceCPU;
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
if (fastScan)
|
if (fastScan)
|
||||||
|
|||||||
Reference in New Issue
Block a user