fix out-of-bounds in AMD version of VectorAdd

2010-06-25 00:40:20 +00:00
parent 5db1c008bd
commit b83e16b7ff
3 changed files with 6 additions and 1 deletions
--- a/Demos/VectorAdd_OpenCL/MiniCL_VectorAdd.cpp
+++ b/Demos/VectorAdd_OpenCL/MiniCL_VectorAdd.cpp
@@ -300,9 +300,10 @@ int main(int argc, char **argv)
 		{
 			num_t++;
 			//this can cause problems -> processing outside of the buffer
 			//make sure to check kernel
 		}
-		size_t globalThreads[] = {actualGlobalSize};//num_t * workgroupSize};
+		size_t globalThreads[] = {num_t * workgroupSize};
 		size_t localThreads[] = {workgroupSize};
--- a/Demos/VectorAdd_OpenCL/VectorAddKernels.cl
+++ b/Demos/VectorAdd_OpenCL/VectorAddKernels.cl
@@ -24,6 +24,8 @@ __kernel void VectorAdd(__global const float8* a, __global const float8* b, __gl
 {
    // get oct-float index into global data array
    int iGID = get_global_id(0);
 	if (iGID>=100000)
 		return;
    // read inputs into registers
    float8 f8InA = a[iGID];
--- a/src/LinearMath/btMinMax.h
+++ b/src/LinearMath/btMinMax.h
@@ -17,6 +17,8 @@ subject to the following restrictions:
 #ifndef GEN_MINMAX_H
 #define GEN_MINMAX_H
 #include "btScalar.h"
 template <class T>
 SIMD_FORCE_INLINE const T& btMin(const T& a, const T& b) 
 {