@@ -255,7 +255,7 @@ UVec4 UVec4::operator * (UVec4Arg inV2) const
 #endif
 }

-UVec4 UVec4::operator + (UVec4Arg inV2)
+UVec4 UVec4::operator + (UVec4Arg inV2) const
 {
 #if defined(JPH_USE_SSE)
 	return _mm_add_epi32(mValue, inV2.mValue);
@@ -282,6 +282,33 @@ UVec4 &UVec4::operator += (UVec4Arg inV2)
 	return *this;
 }

+UVec4 UVec4::operator - (UVec4Arg inV2) const
+{
+#if defined(JPH_USE_SSE)
+	return _mm_sub_epi32(mValue, inV2.mValue);
+#elif defined(JPH_USE_NEON)
+	return vsubq_u32(mValue, inV2.mValue);
+#else
+	return UVec4(mU32[0] - inV2.mU32[0],
+				 mU32[1] - inV2.mU32[1],
+				 mU32[2] - inV2.mU32[2],
+				 mU32[3] - inV2.mU32[3]);
+#endif
+}
+
+UVec4 &UVec4::operator -= (UVec4Arg inV2)
+{
+#if defined(JPH_USE_SSE)
+	mValue = _mm_sub_epi32(mValue, inV2.mValue);
+#elif defined(JPH_USE_NEON)
+	mValue = vsubq_u32(mValue, inV2.mValue);
+#else
+	for (int i = 0; i < 4; ++i)
+		mU32[i] -= inV2.mU32[i];
+#endif
+	return *this;
+}
+
 UVec4 UVec4::SplatX() const
 {
 #if defined(JPH_USE_SSE)
@@ -348,6 +375,34 @@ Vec4 UVec4::ReinterpretAsFloat() const
 #endif
 }

+UVec4 UVec4::DotV(UVec4Arg inV2) const
+{
+#if defined(JPH_USE_SSE4_1)
+	__m128i mul = _mm_mullo_epi32(mValue, inV2.mValue);
+	__m128i sum = _mm_add_epi32(mul, _mm_shuffle_epi32(mul, _MM_SHUFFLE(2, 3, 0, 1)));
+	return _mm_add_epi32(sum, _mm_shuffle_epi32(sum, _MM_SHUFFLE(1, 0, 3, 2)));
+#elif defined(JPH_USE_NEON)
+	uint32x4_t mul = vmulq_u32(mValue, inV2.mValue);
+	return vdupq_n_u32(vaddvq_u32(mul));
+#else
+	return UVec4::sReplicate(mU32[0] * inV2.mU32[0] + mU32[1] * inV2.mU32[1] + mU32[2] * inV2.mU32[2] + mU32[3] * inV2.mU32[3]);
+#endif
+}
+
+uint32 UVec4::Dot(UVec4Arg inV2) const
+{
+#if defined(JPH_USE_SSE4_1)
+	__m128i mul = _mm_mullo_epi32(mValue, inV2.mValue);
+	__m128i sum = _mm_add_epi32(mul, _mm_shuffle_epi32(mul, _MM_SHUFFLE(2, 3, 0, 1)));
+	return _mm_cvtsi128_si32(_mm_add_epi32(sum, _mm_shuffle_epi32(sum, _MM_SHUFFLE(1, 0, 3, 2))));
+#elif defined(JPH_USE_NEON)
+	uint32x4_t mul = vmulq_u32(mValue, inV2.mValue);
+	return vaddvq_u32(mul);
+#else
+	return mU32[0] * inV2.mU32[0] + mU32[1] * inV2.mU32[1] + mU32[2] * inV2.mU32[2] + mU32[3] * inV2.mU32[3];
+#endif
+}
+
 void UVec4::StoreInt4(uint32 *outV) const
 {
 #if defined(JPH_USE_SSE)
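
Editor's note on the SSE4.1 path: DotV and Dot reduce the four lane products with two shuffle-and-add steps instead of extracting lanes serially. The scalar sketch below is an editorial addition, not part of the patch; each array models one __m128i register, and the initializers spell out which lanes _MM_SHUFFLE(2, 3, 0, 1) and _MM_SHUFFLE(1, 0, 3, 2) select.

// Scalar model of the two-shuffle horizontal add used by DotV/Dot (sketch only).
#include <cstdint>
#include <cstdio>

int main()
{
	uint32_t mul[4] = { 1, 2, 3, 4 };                 // stands in for _mm_mullo_epi32(mValue, inV2.mValue)

	// _mm_shuffle_epi32(mul, _MM_SHUFFLE(2, 3, 0, 1)) swaps lanes within each pair
	uint32_t swp[4] = { mul[1], mul[0], mul[3], mul[2] };
	uint32_t sum[4];
	for (int i = 0; i < 4; ++i)
		sum[i] = mul[i] + swp[i];                     // (m0+m1, m0+m1, m2+m3, m2+m3)

	// _mm_shuffle_epi32(sum, _MM_SHUFFLE(1, 0, 3, 2)) swaps the low and high halves
	uint32_t hlf[4] = { sum[2], sum[3], sum[0], sum[1] };
	uint32_t dot[4];
	for (int i = 0; i < 4; ++i)
		dot[i] = sum[i] + hlf[i];                     // full dot product in every lane

	std::printf("%u\n", dot[0]);                      // prints 10 (= 1 + 2 + 3 + 4)
	return 0;
}

DotV keeps that sum in all four lanes, which is useful when the result feeds further SIMD work; Dot extracts lane 0 with _mm_cvtsi128_si32.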
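
A minimal usage sketch of the newly added operations follows. The four-component constructor and sReplicate are visible in the patch itself; the include paths, the JPH namespace, and the demo function name are assumptions based on the Jolt codebase.

// Hypothetical usage of the operations added by this patch (include paths assumed).
#include <Jolt/Jolt.h>
#include <Jolt/Math/UVec4.h>

using namespace JPH;

void UVec4Demo()
{
	UVec4 a(1, 2, 3, 4);
	UVec4 b = UVec4::sReplicate(10);

	UVec4 sum = a + b;           // (11, 12, 13, 14)
	UVec4 dif = b - a;           // (9, 8, 7, 6); unsigned subtraction wraps on underflow
	a -= UVec4::sReplicate(1);   // a becomes (0, 1, 2, 3)

	uint32 d = a.Dot(b);         // 0*10 + 1*10 + 2*10 + 3*10 = 60
	UVec4 dv = a.DotV(b);        // (60, 60, 60, 60): the same sum broadcast to all lanes
	(void)sum; (void)dif; (void)d; (void)dv;
}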