Initial commit:

PhysX 3.4.0 Update @ 21294896 APEX 1.4.0 Update @ 21275617 [CL 21300167]
author: git perforce import user <a@b> 2016-10-25 12:29:14 -0600
committer: Sheikh Dawood Abdul Ajees <Sheikh Dawood Abdul Ajees> 2016-10-25 18:56:37 -0500
commit: 3dfe2108cfab31ba3ee5527e217d0d8e99a51162 (patch)
tree: fa6485c169e50d7415a651bf838f5bcd0fd3bfbd /APEX_1.4/common/include/RandState.h
download: physx-3.4-3dfe2108cfab31ba3ee5527e217d0d8e99a51162.tar.xz
physx-3.4-3dfe2108cfab31ba3ee5527e217d0d8e99a51162.zip
1 files changed, 185 insertions, 0 deletions
diff --git a/APEX_1.4/common/include/RandState.h b/APEX_1.4/common/include/RandState.h
new file mode 100644
index 00000000..315adde0
--- /dev/null
+++ b/APEX_1.4/common/include/RandState.h
@@ -0,0 +1,185 @@
+/*
+ * Copyright (c) 2008-2015, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * NVIDIA CORPORATION and its licensors retain all intellectual property
+ * and proprietary rights in and to this software, related documentation
+ * and any modifications thereto.  Any use, reproduction, disclosure or
+ * distribution of this software and related documentation without an express
+ * license agreement from NVIDIA CORPORATION is strictly prohibited.
+ */
+
+
+#ifndef RAND_STATE_H
+#define RAND_STATE_H
+
+// This is shared by legacy IOFX and shaders
+
+namespace nvidia
+{
+namespace apex
+{
+
+// One linear congruential step, stored as the affine map x -> x * a + c and
+// evaluated in unsigned int arithmetic (so every product and sum wraps).
+// Maps compose through operator*=, which lets a single LCG_PRNG stand for
+// many consecutive steps of another one (see leapFrog).
+struct LCG_PRNG
+{
+	unsigned int a, c;	// multiplier and increment of the map
+
+	// Intentionally does nothing: a and c are left uninitialized.
+	PX_CUDA_CALLABLE PX_INLINE LCG_PRNG()
+	{
+	}
+	// Builds the map x -> x * a + c.
+	PX_CUDA_CALLABLE PX_INLINE LCG_PRNG(unsigned int a, unsigned int c)
+	{
+		this->a = a;
+		this->c = c;
+	}
+
+	// The map x -> x (a == 1, c == 0); neutral element for operator*=.
+	static PX_CUDA_CALLABLE PX_INLINE LCG_PRNG getIdentity()
+	{
+		return LCG_PRNG(1, 0);
+	}
+
+	// The generator used by RandState: x -> x * 1103515245 + 12345.
+	static PX_CUDA_CALLABLE PX_INLINE LCG_PRNG getDefault()
+	{
+		return LCG_PRNG(1103515245u, 12345u);
+	}
+
+	// Composes in place so that afterwards (*this)(x) equals rhs(old(x)):
+	//     a' = a * rhs.a,  c' = c * rhs.a + rhs.c
+	// rhs is read completely before *this is modified, so rhs may alias *this
+	// (x *= x squares the map).
+	PX_CUDA_CALLABLE PX_INLINE LCG_PRNG& operator *= (const LCG_PRNG& rhs)
+	{
+		const unsigned int rhsA = rhs.a;
+		const unsigned int rhsC = rhs.c;
+		a *= rhsA;
+		c = c * rhsA + rhsC;
+		return *this;
+	}
+
+	// Returns the map equal to applying *this `leap` times (identity for leap == 0).
+	// Uses repeated squaring: one round per bit of `leap` instead of `leap`
+	// compositions. Powers of one map commute with each other, so the order in
+	// which the selected powers are folded into the result does not matter.
+	PX_CUDA_CALLABLE PX_INLINE LCG_PRNG leapFrog(unsigned int leap) const
+	{
+		LCG_PRNG ret = getIdentity();
+		LCG_PRNG power = *this;	// (*this) applied 2^k times in round k
+		for (; leap != 0; leap >>= 1)
+		{
+			if (leap & 1u)
+			{
+				ret *= power;
+			}
+			power *= power;
+		}
+		return ret;
+	}
+
+	// Applies the map to x.
+	PX_CUDA_CALLABLE PX_INLINE unsigned int operator()(unsigned int x) const
+	{
+		return x * a + c;
+	}
+};
+
+// Sequential pseudo-random stream that advances its state with LCG_PRNG::getDefault().
+struct RandState
+{
+	// Stores seed as the current state; the first next() returns the LCG step applied to it.
+	explicit PX_CUDA_CALLABLE PX_INLINE RandState(unsigned int seed)
+		: curr(seed)
+	{
+	}
+
+	// Advances the state by one LCG step and returns the new state.
+	PX_CUDA_CALLABLE PX_INLINE unsigned int next()
+	{
+		const LCG_PRNG step = LCG_PRNG::getDefault();
+		curr = step(curr);
+		return curr;
+	}
+
+	// Returns next() scaled by 2^-32.
+	// Assuming a 32-bit unsigned int, the result lies in [0, 1]; 1.0f itself is
+	// reachable because converting the largest states to float can round up to 2^32.
+	PX_CUDA_CALLABLE PX_INLINE float nextFloat()
+	{
+		const float scale = 0.00000000023283064365386962890625f;	// 2^-32
+		return float(next()) * scale;
+	}
+	// Returns min + nextFloat() * (max - min); consumes one state step.
+	PX_CUDA_CALLABLE PX_INLINE float nextFloat(float min, float max)
+	{
+		const float unit = nextFloat();
+		return min + unit * (max - min);
+	}
+
+private:
+	unsigned int curr;	// current LCG state
+};
+
+// For CUDA PRNG
+// Parameter bundle for the CUDA PRNG. Only the field types are visible in this
+// header; the roles noted below are inferred from the names and must be
+// confirmed against the code that fills and consumes this struct.
+// NOTE(review): LCG_PRNG is declared in nvidia::apex in this file but is named
+// here as nvidia::LCG_PRNG, which resolves only if namespace nvidia re-exports
+// apex (for example through a using-directive elsewhere) - confirm.
+struct PRNGInfo
+{
+	unsigned int* g_stateSpawnSeed;	// presumably a seed/state buffer in device global memory - TODO confirm
+	nvidia::LCG_PRNG* g_randBlock;	// presumably per-block LCG maps in device global memory - TODO confirm
+	unsigned int seed;	// presumably the base seed of the run - TODO confirm
+	nvidia::LCG_PRNG randThread;	// presumably the per-thread leap map - TODO confirm
+	nvidia::LCG_PRNG randGrid;	// presumably the per-grid leap map - TODO confirm
+};
+
+// For CUDA PRNG: device part
+#ifdef __CUDACC__
+//*
+// Warp barrier used by RAND_SCAN_OP. Toolkits from CUDA 9 on provide __syncwarp();
+// older toolkits get an empty expansion and keep relying on lock-step warp execution.
+#if defined(__CUDACC_VER_MAJOR__) && (__CUDACC_VER_MAJOR__ >= 9)
+#define RAND_SCAN_SYNC() __syncwarp()
+#else
+#define RAND_SCAN_SYNC()
+#endif
+
+// One step of an in-place scan over LCG maps kept in two parallel arrays.
+// Expects `scanIdx`, `aData` and `cData` in the enclosing scope and replaces
+// element [scanIdx] by its composition with element [scanIdx - ofs]:
+//     a' = a * aOfs,  c' = c * aOfs + cOfs
+// (the same formula as LCG_PRNG::operator*=).
+// Each lane reads a neighbour's slot and then overwrites its own, so the reads
+// must observe the writes of the previous step and must complete before the
+// writes of this step. Devices with independent thread scheduling do not
+// guarantee that ordering implicitly, hence the two barriers.
+// All lanes of the warp have to reach this macro together (full default mask).
+#define RAND_SCAN_OP(ofs) \
+	{ \
+		RAND_SCAN_SYNC(); \
+		unsigned int a = aData[scanIdx], c = cData[scanIdx]; \
+		unsigned int aOfs = aData[scanIdx - ofs], cOfs = cData[scanIdx - ofs]; \
+		RAND_SCAN_SYNC(); \
+		aData[scanIdx] = a * aOfs; \
+		cData[scanIdx] = c * aOfs + cOfs; \
+	}
+/*/
+//THIS CODE CRASHES ON CUDA 5.0.35
+#define RAND_SCAN_OP(ofs) \
+	{ \
+		nvidia::LCG_PRNG val(aData[scanIdx], cData[scanIdx]); \
+		nvidia::LCG_PRNG valOfs(aData[scanIdx - ofs], cData[scanIdx - ofs]); \
+		val *= valOfs; \
+		aData[scanIdx] = val.a; cData[scanIdx] = val.c; \
+	}
+//*/
+// Applies RAND_SCAN_OP to element [scanIdx] with offsets 1, 2, 4, 8 and 16, in that order.
+// Each step reads slot [scanIdx - offset], so the 16 slots below scanIdx must be
+// valid; randScanBlock arranges this by placing identity maps in front of every
+// warp's values.
+// NOTE(review): this function contains no explicit barrier of its own; whether
+// lanes are ordered between steps depends on the definition of RAND_SCAN_OP.
+PX_INLINE __device__ void randScanWarp(unsigned int scanIdx, volatile unsigned int* aData, volatile unsigned int* cData)
+{
+	// The offset doubles every round: 1, 2, 4, 8, 16.
+	#pragma unroll
+	for (unsigned int ofs = 1; ofs <= 16; ofs <<= 1)
+	{
+		RAND_SCAN_OP(ofs);
+	}
+}
+
+// Block-wide inclusive scan of LCG maps under composition, ordered by threadIdx.x.
+// Returns, for the calling thread, the composition of the `val` maps passed by
+// threads 0..threadIdx.x (maps of higher-indexed threads are applied first).
+//
+// Preconditions visible from the code:
+//  - only threadIdx.x is used, so a 1D thread block is assumed;
+//  - every thread of the block must call this function (it contains __syncthreads());
+//  - aData and cData are scratch arrays that each provide 2 * WARP_SIZE slots per
+//    warp of the block (presumably shared memory - TODO confirm at the call site);
+//  - warp totals are staged in slots [WARP_SIZE, 2 * WARP_SIZE), so the block may
+//    hold at most WARP_SIZE warps;
+//  - randScanWarp hard-codes offsets up to 16, i.e. WARP_SIZE is presumably 32.
+// No barrier follows the final scratch reads, so callers that reuse the scratch
+// arrays right afterwards need their own synchronization.
+PX_INLINE __device__ nvidia::LCG_PRNG randScanBlock(nvidia::LCG_PRNG val, volatile unsigned int* aData, volatile unsigned int* cData)
+{
+	const unsigned int idx = threadIdx.x;
+	const unsigned int idxInWarp = idx & (WARP_SIZE-1);
+	const unsigned int warpIdx = (idx >> LOG2_WARP_SIZE);
+
+	// Set up the scan: each warp owns 2 * WARP_SIZE consecutive slots.
+	unsigned int scanIdx = (warpIdx << (LOG2_WARP_SIZE + 1)) + idxInWarp;
+	// Lower half of the warp's slots: identity maps, read by the low lanes during the scan.
+	aData[scanIdx] = 1;
+	cData[scanIdx] = 0;
+
+	scanIdx += WARP_SIZE;
+	// Upper half of the warp's slots: this thread's own map.
+	aData[scanIdx] = val.a;
+	cData[scanIdx] = val.c;
+
+	// Phase 1: inclusive scan inside each warp.
+	randScanWarp(scanIdx, aData, cData);
+
+	// Read back this thread's prefix within its warp.
+	val.a = aData[scanIdx]; 
+	val.c = cData[scanIdx]; 
+
+	// Everyone must have read its result before warp 0's slots are overwritten below.
+	__syncthreads();
+
+	// The last lane of each warp holds that warp's total; stage it in the slots
+	// that warp 0 scans next (warp 0's upper half).
+	if (idxInWarp == WARP_SIZE-1)
+	{
+		const unsigned int idxWrite = warpIdx + WARP_SIZE;
+		aData[idxWrite] = val.a;
+		cData[idxWrite] = val.c;
+	}
+	__syncthreads();
+
+	// Phase 2: warp 0 scans the staged warp totals (its scanIdx is WARP_SIZE + lane).
+	if (warpIdx == 0)
+	{
+		randScanWarp(scanIdx, aData, cData);
+	}
+	__syncthreads();
+
+	// Phase 3: every warp but the first appends the combined total of all preceding warps.
+	if (warpIdx > 0)
+	{
+		const unsigned int idxRead = warpIdx + WARP_SIZE - 1;
+		const nvidia::LCG_PRNG valWarp(aData[idxRead], cData[idxRead]);
+		val *= valWarp;
+	}
+	return val;
+}
+
+#endif
+
+}
+} // nvidia::apex::
+
+#endif
+\ No newline at end of file
author	git perforce import user <a@b>	2016-10-25 12:29:14 -0600
committer	Sheikh Dawood Abdul Ajees <Sheikh Dawood Abdul Ajees>	2016-10-25 18:56:37 -0500
commit	3dfe2108cfab31ba3ee5527e217d0d8e99a51162 (patch)
tree	fa6485c169e50d7415a651bf838f5bcd0fd3bfbd /APEX_1.4/common/include/RandState.h
download	physx-3.4-3dfe2108cfab31ba3ee5527e217d0d8e99a51162.tar.xz physx-3.4-3dfe2108cfab31ba3ee5527e217d0d8e99a51162.zip