| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164 |
- // zlib open source license
- //
- // Copyright (c) 2025 David Forsgren Piuva
- //
- // This software is provided 'as-is', without any express or implied
- // warranty. In no event will the authors be held liable for any damages
- // arising from the use of this software.
- //
- // Permission is granted to anyone to use this software for any purpose,
- // including commercial applications, and to alter it and redistribute it
- // freely, subject to the following restrictions:
- //
- // 1. The origin of this software must not be misrepresented; you must not
- // claim that you wrote the original software. If you use this software
- // in a product, an acknowledgment in the product documentation would be
- // appreciated but is not required.
- //
- // 2. Altered source versions must be plainly marked as such, and must not be
- // misrepresented as being the original software.
- //
- // 3. This notice may not be removed or altered from any source
- // distribution.
- // Functions used to simplify template programming when using functions both with and without simd.h.
- #ifndef DFPSR_NO_SIMD
- #define DFPSR_NO_SIMD
- #include <stdint.h>
- #include <cmath>
- #include "SafePointer.h"
- #include "DsrTraits.h"
- namespace dsr {
- // Type conversions.
// Converts a float to a signed 32-bit integer by discarding the fraction, which rounds toward zero.
// The result is only defined when the truncated value fits inside of int32_t.
inline int32_t truncateToI32(float value) {
	return static_cast<int32_t>(value);
}
// Converts a float to an unsigned 32-bit integer by discarding the fraction.
// The result is only defined when the truncated value fits inside of uint32_t, so negative input should be avoided.
inline uint32_t truncateToU32(float value) {
	return static_cast<uint32_t>(value);
}
// Converts a signed 32-bit integer to the float representing it.
// Integers that need more precision than a float can store are rounded by the conversion.
inline float floatFromI32(int32_t value) {
	return static_cast<float>(value);
}
// Converts an unsigned 32-bit integer to the float representing it.
// Integers that need more precision than a float can store are rounded by the conversion.
inline float floatFromU32(uint32_t value) {
	return static_cast<float>(value);
}
// Converts an unsigned 32-bit integer to a signed 32-bit integer using a plain integer conversion.
// Values that fit inside of int32_t are returned unchanged.
inline int32_t I32FromU32(uint32_t value) {
	return static_cast<int32_t>(value);
}
// Converts a signed 32-bit integer to an unsigned 32-bit integer.
// Negative input wraps around modulo 2 to the power of 32, so that -1 becomes 0xFFFFFFFF.
inline uint32_t U32FromI32(int32_t value) {
	return static_cast<uint32_t>(value);
}
- // Memory read operations.
- inline uint32_t gather_U32(dsr::SafePointer<const uint32_t> data, const uint32_t &elementOffset) { return data[elementOffset]; }
- inline int32_t gather_I32(dsr::SafePointer<const int32_t> data, const uint32_t &elementOffset) { return data[elementOffset]; }
- inline float gather_F32(dsr::SafePointer<const float> data, const uint32_t &elementOffset) { return data[elementOffset]; }
- // Comparisons between all lanes, which is one lane for scalar types.
// Equality for scalar types, where each scalar counts as a single lane.
// The integer overloads return true when left and right are exactly equal.
inline bool allLanesEqual(const uint8_t& left, const uint8_t& right) { return left == right; }
inline bool allLanesEqual(const uint16_t& left, const uint16_t& right) { return left == right; }
inline bool allLanesEqual(const uint32_t& left, const uint32_t& right) { return left == right; }
inline bool allLanesEqual(const int32_t& left, const int32_t& right) { return left == right; }
// The float overload returns true when the absolute difference is below the tolerance 0.0001.
// std::abs is called explicitly, because an unqualified abs may resolve to the integer abs from the C library,
//   which would truncate the difference to a whole number before the comparison and treat 0.0 and 0.5 as equal.
inline bool allLanesEqual(const float& left, const float& right) { return std::abs(left - right) < 0.0001f; }
// Inequality for scalar types, where each scalar counts as a single lane.
// The integer overloads return true when left and right differ.
inline bool allLanesNotEqual(const uint8_t& left, const uint8_t& right) { return left != right; }
inline bool allLanesNotEqual(const uint16_t& left, const uint16_t& right) { return left != right; }
inline bool allLanesNotEqual(const uint32_t& left, const uint32_t& right) { return left != right; }
inline bool allLanesNotEqual(const int32_t& left, const int32_t& right) { return left != right; }
// The float overload returns true when the absolute difference is at least the tolerance 0.0001.
// std::abs is called explicitly, because an unqualified abs may resolve to the integer abs from the C library,
//   which would truncate the difference to a whole number before the comparison and miss differences smaller than one.
inline bool allLanesNotEqual(const float& left, const float& right) { return std::abs(left - right) >= 0.0001f; }
// Strictly greater comparison for scalar types, where each scalar counts as a single lane.
// Returns true when left is larger than right.
inline bool allLanesGreater(const uint8_t& left, const uint8_t& right) {
	return left > right;
}
inline bool allLanesGreater(const uint16_t& left, const uint16_t& right) {
	return left > right;
}
inline bool allLanesGreater(const uint32_t& left, const uint32_t& right) {
	return left > right;
}
inline bool allLanesGreater(const int32_t& left, const int32_t& right) {
	return left > right;
}
inline bool allLanesGreater(const float& left, const float& right) {
	return left > right;
}
// Greater or equal comparison for scalar types, where each scalar counts as a single lane.
// Returns true when left is at least as large as right.
inline bool allLanesGreaterOrEqual(const uint8_t& left, const uint8_t& right) {
	return left >= right;
}
inline bool allLanesGreaterOrEqual(const uint16_t& left, const uint16_t& right) {
	return left >= right;
}
inline bool allLanesGreaterOrEqual(const uint32_t& left, const uint32_t& right) {
	return left >= right;
}
inline bool allLanesGreaterOrEqual(const int32_t& left, const int32_t& right) {
	return left >= right;
}
inline bool allLanesGreaterOrEqual(const float& left, const float& right) {
	return left >= right;
}
// Strictly lesser comparison for scalar types, where each scalar counts as a single lane.
// Returns true when left is smaller than right.
inline bool allLanesLesser(const uint8_t& left, const uint8_t& right) {
	return left < right;
}
inline bool allLanesLesser(const uint16_t& left, const uint16_t& right) {
	return left < right;
}
inline bool allLanesLesser(const uint32_t& left, const uint32_t& right) {
	return left < right;
}
inline bool allLanesLesser(const int32_t& left, const int32_t& right) {
	return left < right;
}
inline bool allLanesLesser(const float& left, const float& right) {
	return left < right;
}
// Lesser or equal comparison for scalar types, where each scalar counts as a single lane.
// Returns true when left is at most as large as right.
inline bool allLanesLesserOrEqual(const uint8_t& left, const uint8_t& right) {
	return left <= right;
}
inline bool allLanesLesserOrEqual(const uint16_t& left, const uint16_t& right) {
	return left <= right;
}
inline bool allLanesLesserOrEqual(const uint32_t& left, const uint32_t& right) {
	return left <= right;
}
inline bool allLanesLesserOrEqual(const int32_t& left, const int32_t& right) {
	return left <= right;
}
inline bool allLanesLesserOrEqual(const float& left, const float& right) {
	return left <= right;
}
// Shifts the bits of a 32-bit unsigned integer to the left by a compile-time constant number of bits.
// bitOffset must be in the range 0..31, which is checked at compile time.
// Bits shifted out past the most significant bit are discarded.
template <uint32_t bitOffset>
inline uint32_t bitShiftLeftImmediate(const uint32_t& left) {
	static_assert(bitOffset < 32u, "Immediate left shift of 32-bit values may not shift more than 31 bits!");
	const uint32_t shifted = left << bitOffset;
	return shifted;
}
// Shifts the bits of a 32-bit unsigned integer to the right by a compile-time constant number of bits.
// bitOffset must be in the range 0..31, which is checked at compile time.
// Zeroes are shifted in from the most significant side, because the type is unsigned.
template <uint32_t bitOffset>
inline uint32_t bitShiftRightImmediate(const uint32_t& left) {
	static_assert(bitOffset < 32u, "Immediate right shift of 32-bit values may not shift more than 31 bits!");
	const uint32_t shifted = left >> bitOffset;
	return shifted;
}
// Shifts the bits of a 16-bit unsigned integer to the left by a compile-time constant number of bits.
// bitOffset must be in the range 0..15, which is checked at compile time.
template <uint16_t bitOffset>
inline uint16_t bitShiftLeftImmediate(const uint16_t& left) {
	static_assert(bitOffset < 16u, "Immediate left shift of 16-bit values may not shift more than 15 bits!");
	// The shift is evaluated on a promoted integer, so the result is explicitly cut down to the lower 16 bits.
	return static_cast<uint16_t>(left << bitOffset);
}
// Shifts the bits of a 16-bit unsigned integer to the right by a compile-time constant number of bits.
// bitOffset must be in the range 0..15, which is checked at compile time.
template <uint16_t bitOffset>
inline uint16_t bitShiftRightImmediate(const uint16_t& left) {
	static_assert(bitOffset < 16u, "Immediate right shift of 16-bit values may not shift more than 15 bits!");
	// The shift is evaluated on a promoted integer, so the result is explicitly converted back to 16 bits.
	return static_cast<uint16_t>(left >> bitOffset);
}
// Shifts the bits of an 8-bit unsigned integer to the left by a compile-time constant number of bits.
// bitOffset must be in the range 0..7, which is checked at compile time.
template <uint8_t bitOffset>
inline uint8_t bitShiftLeftImmediate(const uint8_t& left) {
	static_assert(bitOffset < 8u, "Immediate left shift of 8-bit values may not shift more than 7 bits!");
	// The shift is evaluated on a promoted integer, so the result is explicitly cut down to the lower 8 bits.
	return static_cast<uint8_t>(left << bitOffset);
}
// Shifts the bits of an 8-bit unsigned integer to the right by a compile-time constant number of bits.
// bitOffset must be in the range 0..7, which is checked at compile time.
template <uint8_t bitOffset>
inline uint8_t bitShiftRightImmediate(const uint8_t& left) {
	static_assert(bitOffset < 8u, "Immediate right shift of 8-bit values may not shift more than 7 bits!");
	// The shift is evaluated on a promoted integer, so the result is explicitly converted back to 8 bits.
	return static_cast<uint8_t>(left >> bitOffset);
}
- // A minimum function that can take more than two arguments.
- // Post-condition: Returns the smallest of all given values, which must be comparable using the < operator and have the same type.
- template <typename T, DSR_ENABLE_IF(DSR_CHECK_PROPERTY(DsrTrait_Scalar, T))>
- inline T min(const T &a, const T &b) {
- return (a < b) ? a : b;
- }
- template <typename T, typename... TAIL, DSR_ENABLE_IF(DSR_CHECK_PROPERTY(DsrTrait_Scalar, T))>
- inline T min(const T &a, const T &b, TAIL... tail) {
- return min(min(a, b), tail...);
- }
- // A maximum function that can take more than two arguments.
- // Post-condition: Returns the largest of all given values, which must be comparable using the > operator and have the same type.
- template <typename T, DSR_ENABLE_IF(DSR_CHECK_PROPERTY(DsrTrait_Scalar, T))>
- inline T max(const T &a, const T &b) {
- return (a > b) ? a : b;
- }
- template <typename T, typename... TAIL, DSR_ENABLE_IF(DSR_CHECK_PROPERTY(DsrTrait_Scalar, T))>
- inline T max(const T &a, const T &b, TAIL... tail) {
- return max(max(a, b), tail...);
- }
- // TODO: Implement min and max for integer vectors in simd.h.
- // Start by implementing vectorized comparisons and blend functions as a fallback for unsupported types.
- // Pre-condition: minValue <= maxValue
- // Post-condition: Returns value clamped from minValue to maxValue.
- template <typename T, DSR_ENABLE_IF(DSR_CHECK_PROPERTY(DsrTrait_Any, T))>
- inline T clamp(const T &minValue, const T &value, const T &maxValue) {
- return max(minValue, min(value, maxValue));
- }
- // Post-condition: Returns value clamped to minValue.
- template <typename T, DSR_ENABLE_IF(DSR_CHECK_PROPERTY(DsrTrait_Any, T))>
- inline T clampLower(const T &minValue, const T &value) {
- return max(minValue, value);
- }
- // Post-condition: Returns value clamped to maxValue.
- template <typename T, DSR_ENABLE_IF(DSR_CHECK_PROPERTY(DsrTrait_Any, T))>
- inline T clampUpper(const T &value, const T &maxValue) {
- return min(value, maxValue);
- }
// Returns one divided by value, computed with a regular float division.
inline float reciprocal(float value) {
	const float one = 1.0f;
	return one / value;
}
// Returns one divided by the square root of value.
// std::sqrt is called explicitly to select the float overload from <cmath>.
//   An unqualified sqrt may bind to the double version from the C library, which silently
//   promotes the calculation to double and makes the precision depend on the standard library.
inline float reciprocalSquareRoot(float value) { return 1.0f / std::sqrt(value); }
// Returns the square root of value.
// std::sqrt is called explicitly to select the float overload from <cmath>,
//   instead of relying on a global sqrt that may only exist for double.
inline float squareRoot(float value) { return std::sqrt(value); }
- // TODO: Add more functions from simd.h.
- }
- #endif
|