// Copyright 2022 The SwiftShader Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//    http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#ifndef rr_SIMD_hpp
#define rr_SIMD_hpp

#include "Reactor.hpp"

#include <functional>
#include <vector>

namespace rr {

namespace scalar {
using Int = rr::Int;
using UInt = rr::UInt;
using Float = rr::Float;
template<class T>
using Pointer = rr::Pointer<T>;
}  // namespace scalar

namespace packed {
using Int4 = rr::Int4;
using UInt4 = rr::UInt4;
using Float4 = rr::Float4;
}  // namespace packed

namespace SIMD {

extern const int Width;

class Int;
class UInt;
class Float;
class Pointer;

class Int : public LValue<SIMD::Int>,
            public XYZW<SIMD::Int>  // TODO(b/214583550): Eliminate and replace with SwizzleQuad() and/or other intrinsics.
{
public:
    explicit Int(RValue<SIMD::Float> cast);

    Int();
    Int(int broadcast);
    Int(int x, int y, int z, int w);
    Int(std::vector<int> v);
    Int(std::function<scalar::Int(int)> LaneValueProducer);
    Int(RValue<SIMD::Int> rhs);
    Int(const Int &rhs);
    Int(const Reference<SIMD::Int> &rhs);
    Int(RValue<SIMD::UInt> rhs);
    Int(const UInt &rhs);
    Int(const Reference<SIMD::UInt> &rhs);
    Int(RValue<scalar::Int> rhs);
    Int(const scalar::Int &rhs);
    Int(const Reference<scalar::Int> &rhs);

    template<int T>
    Int(const SwizzleMask1<packed::Int4, T> &rhs);

    RValue<SIMD::Int> operator=(int broadcast);
    RValue<SIMD::Int> operator=(RValue<SIMD::Int> rhs);
    RValue<SIMD::Int> operator=(const Int &rhs);
    RValue<SIMD::Int> operator=(const Reference<SIMD::Int> &rhs);

    static Type *type();
    static int element_count() { return SIMD::Width; }
};

class UInt : public LValue<SIMD::UInt>,
             public XYZW<SIMD::UInt>  // TODO(b/214583550): Eliminate and replace with SwizzleQuad() and/or other intrinsics.
{
public:
    explicit UInt(RValue<SIMD::Float> cast);

    UInt();
    UInt(int broadcast);
    UInt(int x, int y, int z, int w);
    UInt(std::vector<int> v);
    UInt(std::function<scalar::UInt(int)> LaneValueProducer);
    UInt(RValue<SIMD::UInt> rhs);
    UInt(const UInt &rhs);
    UInt(const Reference<SIMD::UInt> &rhs);
    UInt(RValue<SIMD::Int> rhs);
    UInt(const Int &rhs);
    UInt(const Reference<SIMD::Int> &rhs);
    UInt(RValue<scalar::UInt> rhs);
    UInt(const scalar::UInt &rhs);
    UInt(const Reference<scalar::UInt> &rhs);

    RValue<SIMD::UInt> operator=(RValue<SIMD::UInt> rhs);
    RValue<SIMD::UInt> operator=(const UInt &rhs);
    RValue<SIMD::UInt> operator=(const Reference<SIMD::UInt> &rhs);

    static Type *type();
    static int element_count() { return SIMD::Width; }
};
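// Illustrative sketch (not part of the API above): SIMD::Width is only known
// at runtime, so code using these classes is written width-agnostically, for
// example through the broadcast and lane-producer constructors declared on
// SIMD::Int and SIMD::UInt. Assuming the producer receives the lane index, a
// vector of ascending lane indices could be built as:
//
//     SIMD::Int laneIndex([](int lane) { return scalar::Int(lane); });
//
// while SIMD::Int(0) broadcasts zero to every lane regardless of Width.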
class Float : public LValue<SIMD::Float>,
              public XYZW<SIMD::Float>  // TODO(b/214583550): Eliminate and replace with SwizzleQuad() and/or other intrinsics.
{
public:
    explicit Float(RValue<SIMD::Int> cast);
    explicit Float(RValue<SIMD::UInt> cast);

    Float();
    Float(float broadcast);
    Float(float x, float y, float z, float w);
    Float(std::vector<float> v);
    Float(std::function<scalar::Float(int)> LaneValueProducer);
    Float(RValue<SIMD::Float> rhs);
    Float(const Float &rhs);
    Float(const Reference<SIMD::Float> &rhs);
    Float(RValue<scalar::Float> rhs);
    Float(const scalar::Float &rhs);
    Float(const Reference<scalar::Float> &rhs);

    Float(RValue<packed::Float4> rhs);
    RValue<SIMD::Float> operator=(RValue<packed::Float4> rhs);

    template<int T>
    Float(const SwizzleMask1<packed::Float4, T> &rhs);

    RValue<SIMD::Float> operator=(float broadcast);
    RValue<SIMD::Float> operator=(RValue<SIMD::Float> rhs);
    RValue<SIMD::Float> operator=(const Float &rhs);
    RValue<SIMD::Float> operator=(const Reference<SIMD::Float> &rhs);
    RValue<SIMD::Float> operator=(RValue<scalar::Float> rhs);
    RValue<SIMD::Float> operator=(const scalar::Float &rhs);
    RValue<SIMD::Float> operator=(const Reference<scalar::Float> &rhs);

    static SIMD::Float infinity();

    static Type *type();
    static int element_count() { return SIMD::Width; }
};

class Pointer
{
public:
    Pointer(scalar::Pointer<Byte> base, scalar::Int limit);
    Pointer(scalar::Pointer<Byte> base, unsigned int limit);
    Pointer(scalar::Pointer<Byte> base, scalar::Int limit, SIMD::Int offset);
    Pointer(scalar::Pointer<Byte> base, unsigned int limit, SIMD::Int offset);
    Pointer(std::vector<scalar::Pointer<Byte>> pointers);
    explicit Pointer(SIMD::UInt cast);                          // Cast from 32-bit integers to 32-bit pointers
    explicit Pointer(SIMD::UInt castLow, SIMD::UInt castHigh);  // Cast from pairs of 32-bit integers to 64-bit pointers

    Pointer &operator+=(SIMD::Int i);
    Pointer operator+(SIMD::Int i);
    Pointer &operator+=(int i);
    Pointer operator+(int i);

    SIMD::Int offsets() const;

    SIMD::Int isInBounds(unsigned int accessSize, OutOfBoundsBehavior robustness) const;
    bool isStaticallyInBounds(unsigned int accessSize, OutOfBoundsBehavior robustness) const;

    Int limit() const;

    // Returns true if all offsets are compile-time static and sequential
    // (N+0*step, N+1*step, N+2*step, N+3*step)
    bool hasStaticSequentialOffsets(unsigned int step) const;

    // Returns true if all offsets are compile-time static and equal
    // (N, N, N, N)
    bool hasStaticEqualOffsets() const;

    template<typename T>
    inline T Load(OutOfBoundsBehavior robustness, SIMD::Int mask, bool atomic = false, std::memory_order order = std::memory_order_relaxed, int alignment = sizeof(float));

    template<typename T>
    inline void Store(T val, OutOfBoundsBehavior robustness, SIMD::Int mask, bool atomic = false, std::memory_order order = std::memory_order_relaxed);

    template<typename T>
    inline void Store(RValue<T> val, OutOfBoundsBehavior robustness, SIMD::Int mask, bool atomic = false, std::memory_order order = std::memory_order_relaxed);

    scalar::Pointer<Byte> getUniformPointer() const;
    scalar::Pointer<Byte> getPointerForLane(int lane) const;
    static Pointer IfThenElse(SIMD::Int condition, const Pointer &lhs, const Pointer &rhs);

    void castTo(SIMD::UInt &bits) const;                              // Cast from 32-bit pointers to 32-bit integers
    void castTo(SIMD::UInt &lowerBits, SIMD::UInt &upperBits) const;  // Cast from 64-bit pointers to pairs of 32-bit integers

#ifdef ENABLE_RR_PRINT
    std::vector<rr::Value *> getPrintValues() const;
#endif

private:
    // Base address for the pointer, common across all lanes.
    scalar::Pointer<Byte> base;
    // Per-lane address for dealing with non-uniform data.
    std::vector<scalar::Pointer<Byte>> pointers;

public:
    // Upper (non-inclusive) limit for offsets from base.
    scalar::Int dynamicLimit;  // If hasDynamicLimit is false, dynamicLimit is zero.
    unsigned int staticLimit = 0;

    // Per-lane offsets from base.
    SIMD::Int dynamicOffsets;  // If hasDynamicOffsets is false, all dynamicOffsets are zero.
    std::vector<int> staticOffsets;

    bool hasDynamicLimit = false;    // True if dynamicLimit is non-zero.
    bool hasDynamicOffsets = false;  // True if any dynamicOffsets are non-zero.
    bool isBasePlusOffset = false;   // True if this uses base+offset. False if this is a collection of Pointers.
};
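// Illustrative sketch (not part of the API above): a typical use of
// SIMD::Pointer is a bounds-checked, masked load/store through a byte base
// pointer. The names buffer, bufferSize, elementIndex and activeLanes below
// are hypothetical:
//
//     SIMD::Pointer ptr(buffer /* scalar::Pointer<Byte> */, bufferSize);
//     ptr += elementIndex * SIMD::Int(4);  // 4 == sizeof(float)
//     SIMD::Float x = ptr.Load<SIMD::Float>(OutOfBoundsBehavior::Nullify, activeLanes);
//     ptr.Store(x * SIMD::Float(2.0f), OutOfBoundsBehavior::Nullify, activeLanes);
//
// Lanes whose mask bit is zero are not written, and with Nullify robustness
// out-of-bounds lanes read back as zero.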
}  // namespace SIMD

RValue<SIMD::Int> operator+(RValue<SIMD::Int> lhs, RValue<SIMD::Int> rhs);
RValue<SIMD::Int> operator-(RValue<SIMD::Int> lhs, RValue<SIMD::Int> rhs);
RValue<SIMD::Int> operator*(RValue<SIMD::Int> lhs, RValue<SIMD::Int> rhs);
RValue<SIMD::Int> operator/(RValue<SIMD::Int> lhs, RValue<SIMD::Int> rhs);
RValue<SIMD::Int> operator%(RValue<SIMD::Int> lhs, RValue<SIMD::Int> rhs);
RValue<SIMD::Int> operator&(RValue<SIMD::Int> lhs, RValue<SIMD::Int> rhs);
RValue<SIMD::Int> operator|(RValue<SIMD::Int> lhs, RValue<SIMD::Int> rhs);
RValue<SIMD::Int> operator^(RValue<SIMD::Int> lhs, RValue<SIMD::Int> rhs);
RValue<SIMD::Int> operator<<(RValue<SIMD::Int> lhs, unsigned char rhs);
RValue<SIMD::Int> operator>>(RValue<SIMD::Int> lhs, unsigned char rhs);
RValue<SIMD::Int> operator<<(RValue<SIMD::Int> lhs, RValue<SIMD::Int> rhs);
RValue<SIMD::Int> operator>>(RValue<SIMD::Int> lhs, RValue<SIMD::Int> rhs);
RValue<SIMD::Int> operator+=(SIMD::Int &lhs, RValue<SIMD::Int> rhs);
RValue<SIMD::Int> operator-=(SIMD::Int &lhs, RValue<SIMD::Int> rhs);
RValue<SIMD::Int> operator*=(SIMD::Int &lhs, RValue<SIMD::Int> rhs);
//	RValue<SIMD::Int> operator/=(SIMD::Int &lhs, RValue<SIMD::Int> rhs);
//	RValue<SIMD::Int> operator%=(SIMD::Int &lhs, RValue<SIMD::Int> rhs);
RValue<SIMD::Int> operator&=(SIMD::Int &lhs, RValue<SIMD::Int> rhs);
RValue<SIMD::Int> operator|=(SIMD::Int &lhs, RValue<SIMD::Int> rhs);
RValue<SIMD::Int> operator^=(SIMD::Int &lhs, RValue<SIMD::Int> rhs);
RValue<SIMD::Int> operator<<=(SIMD::Int &lhs, unsigned char rhs);
RValue<SIMD::Int> operator>>=(SIMD::Int &lhs, unsigned char rhs);
RValue<SIMD::Int> operator+(RValue<SIMD::Int> val);
RValue<SIMD::Int> operator-(RValue<SIMD::Int> val);
RValue<SIMD::Int> operator~(RValue<SIMD::Int> val);
//	RValue<SIMD::Int> operator++(SIMD::Int &val, int);   // Post-increment
//	const Int &operator++(SIMD::Int &val);   // Pre-increment
//	RValue<SIMD::Int> operator--(SIMD::Int &val, int);   // Post-decrement
//	const Int &operator--(SIMD::Int &val);   // Pre-decrement
//	RValue<Bool> operator<(RValue<SIMD::Int> lhs, RValue<SIMD::Int> rhs);
//	RValue<Bool> operator<=(RValue<SIMD::Int> lhs, RValue<SIMD::Int> rhs);
//	RValue<Bool> operator>(RValue<SIMD::Int> lhs, RValue<SIMD::Int> rhs);
//	RValue<Bool> operator>=(RValue<SIMD::Int> lhs, RValue<SIMD::Int> rhs);
//	RValue<Bool> operator!=(RValue<SIMD::Int> lhs, RValue<SIMD::Int> rhs);
//	RValue<Bool> operator==(RValue<SIMD::Int> lhs, RValue<SIMD::Int> rhs);

RValue<SIMD::Int> CmpEQ(RValue<SIMD::Int> x, RValue<SIMD::Int> y);
RValue<SIMD::Int> CmpLT(RValue<SIMD::Int> x, RValue<SIMD::Int> y);
RValue<SIMD::Int> CmpLE(RValue<SIMD::Int> x, RValue<SIMD::Int> y);
RValue<SIMD::Int> CmpNEQ(RValue<SIMD::Int> x, RValue<SIMD::Int> y);
RValue<SIMD::Int> CmpNLT(RValue<SIMD::Int> x, RValue<SIMD::Int> y);
RValue<SIMD::Int> CmpNLE(RValue<SIMD::Int> x, RValue<SIMD::Int> y);
inline RValue<SIMD::Int> CmpGT(RValue<SIMD::Int> x, RValue<SIMD::Int> y) { return CmpNLE(x, y); }
inline RValue<SIMD::Int> CmpGE(RValue<SIMD::Int> x, RValue<SIMD::Int> y) { return CmpNLT(x, y); }
RValue<SIMD::Int> Abs(RValue<SIMD::Int> x);
RValue<SIMD::Int> Max(RValue<SIMD::Int> x, RValue<SIMD::Int> y);
RValue<SIMD::Int> Min(RValue<SIMD::Int> x, RValue<SIMD::Int> y);
// Convert to nearest integer. If a converted value is outside of the integer
// range, the returned result is undefined.
RValue<SIMD::Int> RoundInt(RValue<SIMD::Float> cast);
// Rounds to the nearest integer, but clamps very large values to an
// implementation-dependent range.
// Specifically, on x86, values larger than 2147483583.0 are converted to
// 2147483583 (0x7FFFFFBF) instead of producing 0x80000000.
RValue<SIMD::Int> RoundIntClamped(RValue<SIMD::Float> cast);
RValue<scalar::Int> Extract(RValue<SIMD::Int> val, int i);
RValue<SIMD::Int> Insert(RValue<SIMD::Int> val, RValue<scalar::Int> element, int i);
RValue<packed::Int4> Extract128(RValue<SIMD::Int> val, int i);
RValue<SIMD::Int> Insert128(RValue<SIMD::Int> val, RValue<packed::Int4> element, int i);

RValue<SIMD::UInt> operator+(RValue<SIMD::UInt> lhs, RValue<SIMD::UInt> rhs);
RValue<SIMD::UInt> operator-(RValue<SIMD::UInt> lhs, RValue<SIMD::UInt> rhs);
RValue<SIMD::UInt> operator*(RValue<SIMD::UInt> lhs, RValue<SIMD::UInt> rhs);
RValue<SIMD::UInt> operator/(RValue<SIMD::UInt> lhs, RValue<SIMD::UInt> rhs);
RValue<SIMD::UInt> operator%(RValue<SIMD::UInt> lhs, RValue<SIMD::UInt> rhs);
RValue<SIMD::UInt> operator&(RValue<SIMD::UInt> lhs, RValue<SIMD::UInt> rhs);
RValue<SIMD::UInt> operator|(RValue<SIMD::UInt> lhs, RValue<SIMD::UInt> rhs);
RValue<SIMD::UInt> operator^(RValue<SIMD::UInt> lhs, RValue<SIMD::UInt> rhs);
RValue<SIMD::UInt> operator<<(RValue<SIMD::UInt> lhs, unsigned char rhs);
RValue<SIMD::UInt> operator>>(RValue<SIMD::UInt> lhs, unsigned char rhs);
RValue<SIMD::UInt> operator<<(RValue<SIMD::UInt> lhs, RValue<SIMD::UInt> rhs);
RValue<SIMD::UInt> operator>>(RValue<SIMD::UInt> lhs, RValue<SIMD::UInt> rhs);
RValue<SIMD::UInt> operator+=(SIMD::UInt &lhs, RValue<SIMD::UInt> rhs);
RValue<SIMD::UInt> operator-=(SIMD::UInt &lhs, RValue<SIMD::UInt> rhs);
RValue<SIMD::UInt> operator*=(SIMD::UInt &lhs, RValue<SIMD::UInt> rhs);
//	RValue<SIMD::UInt> operator/=(SIMD::UInt &lhs, RValue<SIMD::UInt> rhs);
//	RValue<SIMD::UInt> operator%=(SIMD::UInt &lhs, RValue<SIMD::UInt> rhs);
RValue<SIMD::UInt> operator&=(SIMD::UInt &lhs, RValue<SIMD::UInt> rhs);
RValue<SIMD::UInt> operator|=(SIMD::UInt &lhs, RValue<SIMD::UInt> rhs);
RValue<SIMD::UInt> operator^=(SIMD::UInt &lhs, RValue<SIMD::UInt> rhs);
RValue<SIMD::UInt> operator<<=(SIMD::UInt &lhs, unsigned char rhs);
RValue<SIMD::UInt> operator>>=(SIMD::UInt &lhs, unsigned char rhs);
RValue<SIMD::UInt> operator+(RValue<SIMD::UInt> val);
RValue<SIMD::UInt> operator-(RValue<SIMD::UInt> val);
RValue<SIMD::UInt> operator~(RValue<SIMD::UInt> val);
//	RValue<SIMD::UInt> operator++(SIMD::UInt &val, int);   // Post-increment
//	const UInt &operator++(SIMD::UInt &val);   // Pre-increment
//	RValue<SIMD::UInt> operator--(SIMD::UInt &val, int);   // Post-decrement
//	const UInt &operator--(SIMD::UInt &val);   // Pre-decrement
//	RValue<Bool> operator<(RValue<SIMD::UInt> lhs, RValue<SIMD::UInt> rhs);
//	RValue<Bool> operator<=(RValue<SIMD::UInt> lhs, RValue<SIMD::UInt> rhs);
//	RValue<Bool> operator>(RValue<SIMD::UInt> lhs, RValue<SIMD::UInt> rhs);
//	RValue<Bool> operator>=(RValue<SIMD::UInt> lhs, RValue<SIMD::UInt> rhs);
//	RValue<Bool> operator!=(RValue<SIMD::UInt> lhs, RValue<SIMD::UInt> rhs);
//	RValue<Bool> operator==(RValue<SIMD::UInt> lhs, RValue<SIMD::UInt> rhs);

RValue<SIMD::UInt> CmpEQ(RValue<SIMD::UInt> x, RValue<SIMD::UInt> y);
RValue<SIMD::UInt> CmpLT(RValue<SIMD::UInt> x, RValue<SIMD::UInt> y);
RValue<SIMD::UInt> CmpLE(RValue<SIMD::UInt> x, RValue<SIMD::UInt> y);
RValue<SIMD::UInt> CmpNEQ(RValue<SIMD::UInt> x, RValue<SIMD::UInt> y);
RValue<SIMD::UInt> CmpNLT(RValue<SIMD::UInt> x, RValue<SIMD::UInt> y);
RValue<SIMD::UInt> CmpNLE(RValue<SIMD::UInt> x, RValue<SIMD::UInt> y);
inline RValue<SIMD::UInt> CmpGT(RValue<SIMD::UInt> x, RValue<SIMD::UInt> y) { return CmpNLE(x, y); }
inline RValue<SIMD::UInt> CmpGE(RValue<SIMD::UInt> x, RValue<SIMD::UInt> y) { return CmpNLT(x, y); }
RValue<SIMD::UInt> Max(RValue<SIMD::UInt> x, RValue<SIMD::UInt> y);
RValue<SIMD::UInt> Min(RValue<SIMD::UInt> x, RValue<SIMD::UInt> y);
RValue<scalar::UInt> Extract(RValue<SIMD::UInt> val, int i);
RValue<SIMD::UInt> Insert(RValue<SIMD::UInt> val, RValue<scalar::UInt> element, int i);
RValue<packed::UInt4> Extract128(RValue<SIMD::UInt> val, int i);
RValue<SIMD::UInt> Insert128(RValue<SIMD::UInt> val, RValue<packed::UInt4> element, int i);
//	RValue<SIMD::UInt> RoundInt(RValue<SIMD::Float> cast);

RValue<SIMD::Float> operator+(RValue<SIMD::Float> lhs, RValue<SIMD::Float> rhs);
RValue<SIMD::Float> operator-(RValue<SIMD::Float> lhs, RValue<SIMD::Float> rhs);
RValue<SIMD::Float> operator*(RValue<SIMD::Float> lhs, RValue<SIMD::Float> rhs);
RValue<SIMD::Float> operator/(RValue<SIMD::Float> lhs, RValue<SIMD::Float> rhs);
RValue<SIMD::Float> operator%(RValue<SIMD::Float> lhs, RValue<SIMD::Float> rhs);
RValue<SIMD::Float> operator+=(SIMD::Float &lhs, RValue<SIMD::Float> rhs);
RValue<SIMD::Float> operator-=(SIMD::Float &lhs, RValue<SIMD::Float> rhs);
RValue<SIMD::Float> operator*=(SIMD::Float &lhs, RValue<SIMD::Float> rhs);
RValue<SIMD::Float> operator/=(SIMD::Float &lhs, RValue<SIMD::Float> rhs);
RValue<SIMD::Float> operator%=(SIMD::Float &lhs, RValue<SIMD::Float> rhs);
RValue<SIMD::Float> operator+(RValue<SIMD::Float> val);
RValue<SIMD::Float> operator-(RValue<SIMD::Float> val);

// Computes `x * y + z`, which may be fused into one operation to produce a higher-precision result.
RValue<SIMD::Float> MulAdd(RValue<SIMD::Float> x, RValue<SIMD::Float> y, RValue<SIMD::Float> z);
// Computes a fused `x * y + z` operation. Caps::fmaIsFast indicates whether it emits an FMA instruction.
RValue<SIMD::Float> FMA(RValue<SIMD::Float> x, RValue<SIMD::Float> y, RValue<SIMD::Float> z);

RValue<SIMD::Float> Abs(RValue<SIMD::Float> x);
RValue<SIMD::Float> Max(RValue<SIMD::Float> x, RValue<SIMD::Float> y);
RValue<SIMD::Float> Min(RValue<SIMD::Float> x, RValue<SIMD::Float> y);

RValue<SIMD::Float> Rcp(RValue<SIMD::Float> x, bool relaxedPrecision, bool exactAtPow2 = false);
RValue<SIMD::Float> RcpSqrt(RValue<SIMD::Float> x, bool relaxedPrecision);
RValue<SIMD::Float> Sqrt(RValue<SIMD::Float> x);
RValue<SIMD::Float> Insert(RValue<SIMD::Float> val, RValue<scalar::Float> element, int i);
RValue<scalar::Float> Extract(RValue<SIMD::Float> x, int i);
RValue<packed::Float4> Extract128(RValue<SIMD::Float> val, int i);
RValue<SIMD::Float> Insert128(RValue<SIMD::Float> val, RValue<packed::Float4> element, int i);

// Ordered comparison functions
RValue<SIMD::Int> CmpEQ(RValue<SIMD::Float> x, RValue<SIMD::Float> y);
RValue<SIMD::Int> CmpLT(RValue<SIMD::Float> x, RValue<SIMD::Float> y);
RValue<SIMD::Int> CmpLE(RValue<SIMD::Float> x, RValue<SIMD::Float> y);
RValue<SIMD::Int> CmpNEQ(RValue<SIMD::Float> x, RValue<SIMD::Float> y);
RValue<SIMD::Int> CmpNLT(RValue<SIMD::Float> x, RValue<SIMD::Float> y);
RValue<SIMD::Int> CmpNLE(RValue<SIMD::Float> x, RValue<SIMD::Float> y);
inline RValue<SIMD::Int> CmpGT(RValue<SIMD::Float> x, RValue<SIMD::Float> y) { return CmpNLE(x, y); }
inline RValue<SIMD::Int> CmpGE(RValue<SIMD::Float> x, RValue<SIMD::Float> y) { return CmpNLT(x, y); }

// Unordered comparison functions
RValue<SIMD::Int> CmpUEQ(RValue<SIMD::Float> x, RValue<SIMD::Float> y);
RValue<SIMD::Int> CmpULT(RValue<SIMD::Float> x, RValue<SIMD::Float> y);
RValue<SIMD::Int> CmpULE(RValue<SIMD::Float> x, RValue<SIMD::Float> y);
RValue<SIMD::Int> CmpUNEQ(RValue<SIMD::Float> x, RValue<SIMD::Float> y);
RValue<SIMD::Int> CmpUNLT(RValue<SIMD::Float> x, RValue<SIMD::Float> y);
RValue<SIMD::Int> CmpUNLE(RValue<SIMD::Float> x, RValue<SIMD::Float> y);
inline RValue<SIMD::Int> CmpUGT(RValue<SIMD::Float> x, RValue<SIMD::Float> y) { return CmpUNLE(x, y); }
inline RValue<SIMD::Int> CmpUGE(RValue<SIMD::Float> x, RValue<SIMD::Float> y) { return CmpUNLT(x, y); }

RValue<SIMD::Int> IsInf(RValue<SIMD::Float> x);
RValue<SIMD::Int> IsNan(RValue<SIMD::Float> x);
RValue<SIMD::Float> Round(RValue<SIMD::Float> x);
RValue<SIMD::Float> Trunc(RValue<SIMD::Float> x);
RValue<SIMD::Float> Frac(RValue<SIMD::Float> x);
RValue<SIMD::Float> Floor(RValue<SIMD::Float> x);
RValue<SIMD::Float> Ceil(RValue<SIMD::Float> x);

// Trigonometric functions
RValue<SIMD::Float> Sin(RValue<SIMD::Float> x);
RValue<SIMD::Float> Cos(RValue<SIMD::Float> x);
RValue<SIMD::Float> Tan(RValue<SIMD::Float> x);
RValue<SIMD::Float> Asin(RValue<SIMD::Float> x);
RValue<SIMD::Float> Acos(RValue<SIMD::Float> x);
RValue<SIMD::Float> Atan(RValue<SIMD::Float> x);
RValue<SIMD::Float> Sinh(RValue<SIMD::Float> x);
RValue<SIMD::Float> Cosh(RValue<SIMD::Float> x);
RValue<SIMD::Float> Tanh(RValue<SIMD::Float> x);
RValue<SIMD::Float> Asinh(RValue<SIMD::Float> x);
RValue<SIMD::Float> Acosh(RValue<SIMD::Float> x);
RValue<SIMD::Float> Atanh(RValue<SIMD::Float> x);
RValue<SIMD::Float> Atan2(RValue<SIMD::Float> x, RValue<SIMD::Float> y);

// Exponential functions
RValue<SIMD::Float> Pow(RValue<SIMD::Float> x, RValue<SIMD::Float> y);
RValue<SIMD::Float> Exp(RValue<SIMD::Float> x);
RValue<SIMD::Float> Log(RValue<SIMD::Float> x);
RValue<SIMD::Float> Exp2(RValue<SIMD::Float> x);
RValue<SIMD::Float> Log2(RValue<SIMD::Float> x);

RValue<scalar::Int> SignMask(RValue<SIMD::Int> x);
RValue<SIMD::UInt> Ctlz(RValue<SIMD::UInt> x, bool isZeroUndef);
RValue<SIMD::UInt> Cttz(RValue<SIMD::UInt> x, bool isZeroUndef);
RValue<SIMD::Int> MulHigh(RValue<SIMD::Int> x, RValue<SIMD::Int> y);
RValue<SIMD::UInt> MulHigh(RValue<SIMD::UInt> x, RValue<SIMD::UInt> y);

RValue<Bool> AnyTrue(const RValue<SIMD::Int> &bools);
RValue<Bool> AnyFalse(const RValue<SIMD::Int> &bools);
RValue<Bool> Divergent(const RValue<SIMD::Int> &ints);

RValue<SIMD::Int> Swizzle(RValue<SIMD::Int> x, uint16_t select);
RValue<SIMD::UInt> Swizzle(RValue<SIMD::UInt> x, uint16_t select);
RValue<SIMD::Float> Swizzle(RValue<SIMD::Float> x, uint16_t select);

RValue<SIMD::Int> Shuffle(RValue<SIMD::Int> x, RValue<SIMD::Int> y, uint16_t select);
RValue<SIMD::UInt> Shuffle(RValue<SIMD::UInt> x, RValue<SIMD::UInt> y, uint16_t select);
RValue<SIMD::Float> Shuffle(RValue<SIMD::Float> x, RValue<SIMD::Float> y, uint16_t select);

RValue<SIMD::Float> Gather(RValue<Pointer<Float>> base, RValue<SIMD::Int> offsets, RValue<SIMD::Int> mask, unsigned int alignment, bool zeroMaskedLanes = false);
RValue<SIMD::Int> Gather(RValue<Pointer<Int>> base, RValue<SIMD::Int> offsets, RValue<SIMD::Int> mask, unsigned int alignment, bool zeroMaskedLanes = false);
void Scatter(RValue<Pointer<Float>> base, RValue<SIMD::Float> val, RValue<SIMD::Int> offsets, RValue<SIMD::Int> mask, unsigned int alignment);
void Scatter(RValue<Pointer<Int>> base, RValue<SIMD::Int> val, RValue<SIMD::Int> offsets, RValue<SIMD::Int> mask, unsigned int alignment);

template<>
inline RValue<SIMD::Int>::RValue(int i)
    : val(broadcast(i, SIMD::Int::type()))
{
    RR_DEBUG_INFO_EMIT_VAR(val);
}

template<>
inline RValue<SIMD::UInt>::RValue(unsigned int i)
    : val(broadcast(int(i), SIMD::UInt::type()))
{
    RR_DEBUG_INFO_EMIT_VAR(val);
}

template<>
inline RValue<SIMD::Float>::RValue(float f)
    : val(broadcast(f, SIMD::Float::type()))
{
    RR_DEBUG_INFO_EMIT_VAR(val);
}

template<int T>
SIMD::Int::Int(const SwizzleMask1<packed::Int4, T> &rhs)
    : XYZW(this)
{
    *this = rhs.operator RValue<scalar::Int>();
}

template<int T>
SIMD::Float::Float(const SwizzleMask1<packed::Float4, T> &rhs)
    : XYZW(this)
{
    *this = rhs.operator RValue<scalar::Float>();
}
template<typename T>
inline T SIMD::Pointer::Load(OutOfBoundsBehavior robustness, SIMD::Int mask, bool atomic /* = false */, std::memory_order order /* = std::memory_order_relaxed */, int alignment /* = sizeof(float) */)
{
    using EL = typename Scalar<T>::Type;

    if(!isBasePlusOffset)
    {
        T out = T(0);
        for(int i = 0; i < SIMD::Width; i++)
        {
            If(Extract(mask, i) != 0)
            {
                auto el = rr::Load(scalar::Pointer<EL>(pointers[i]), alignment, atomic, order);
                out = Insert(out, el, i);
            }
        }
        return out;
    }

    if(isStaticallyInBounds(sizeof(float), robustness))
    {
        // All elements are statically known to be in-bounds.
        // We can avoid costly conditional on masks.

        if(hasStaticSequentialOffsets(sizeof(float)))
        {
            // Offsets are sequential. Perform regular load.
            return rr::Load(scalar::Pointer<T>(base + staticOffsets[0]), alignment, atomic, order);
        }

        if(hasStaticEqualOffsets())
        {
            // Load one, replicate.
            return T(*scalar::Pointer<EL>(base + staticOffsets[0], alignment));
        }
    }
    else
    {
        switch(robustness)
        {
        case OutOfBoundsBehavior::Nullify:
        case OutOfBoundsBehavior::RobustBufferAccess:
        case OutOfBoundsBehavior::UndefinedValue:
            mask &= isInBounds(sizeof(float), robustness);  // Disable out-of-bounds reads.
            break;
        case OutOfBoundsBehavior::UndefinedBehavior:
            // Nothing to do. Application/compiler must guarantee no out-of-bounds accesses.
            break;
        }
    }

    auto offs = offsets();

    if(!atomic && order == std::memory_order_relaxed)
    {
        if(hasStaticEqualOffsets())
        {
            // Load one, replicate.
            // Be careful of the case where the post-bounds-check mask
            // is 0, in which case we must not load.
            T out = T(0);
            If(AnyTrue(mask))
            {
                EL el = *scalar::Pointer<EL>(base + staticOffsets[0], alignment);
                out = T(el);
            }
            return out;
        }

        bool zeroMaskedLanes = true;
        switch(robustness)
        {
        case OutOfBoundsBehavior::Nullify:
        case OutOfBoundsBehavior::RobustBufferAccess:  // Must either return an in-bounds value, or zero.
            zeroMaskedLanes = true;
            break;
        case OutOfBoundsBehavior::UndefinedValue:
        case OutOfBoundsBehavior::UndefinedBehavior:
            zeroMaskedLanes = false;
            break;
        }

        // TODO(b/195446858): Optimize static sequential offsets case by using masked load.

        return Gather(scalar::Pointer<EL>(base), offs, mask, alignment, zeroMaskedLanes);
    }
    else
    {
        T out;
        auto anyLanesDisabled = AnyFalse(mask);
        If(hasStaticEqualOffsets() && !anyLanesDisabled)
        {
            // Load one, replicate.
            auto offset = Extract(offs, 0);
            out = T(rr::Load(scalar::Pointer<EL>(&base[offset]), alignment, atomic, order));
        }
        Else If(hasStaticSequentialOffsets(sizeof(float)) && !anyLanesDisabled)
        {
            // Load all elements in a single SIMD instruction.
            auto offset = Extract(offs, 0);
            out = rr::Load(scalar::Pointer<T>(&base[offset]), alignment, atomic, order);
        }
        Else
        {
            // Divergent offsets or masked lanes.
            out = T(0);
            for(int i = 0; i < SIMD::Width; i++)
            {
                If(Extract(mask, i) != 0)
                {
                    auto offset = Extract(offs, i);
                    auto el = rr::Load(scalar::Pointer<EL>(&base[offset]), alignment, atomic, order);
                    out = Insert(out, el, i);
                }
            }
        }
        return out;
    }
}

template<>
inline SIMD::Pointer SIMD::Pointer::Load(OutOfBoundsBehavior robustness, SIMD::Int mask, bool atomic /* = false */, std::memory_order order /* = std::memory_order_relaxed */, int alignment /* = sizeof(float) */)
{
    std::vector<scalar::Pointer<Byte>> pointers(SIMD::Width);

    for(int i = 0; i < SIMD::Width; i++)
    {
        If(Extract(mask, i) != 0)
        {
            pointers[i] = rr::Load(scalar::Pointer<scalar::Pointer<Byte>>(getPointerForLane(i)), alignment, atomic, order);
        }
    }

    return SIMD::Pointer(pointers);
}

template<typename T>
inline void SIMD::Pointer::Store(T val, OutOfBoundsBehavior robustness, SIMD::Int mask, bool atomic /* = false */, std::memory_order order /* = std::memory_order_relaxed */)
{
    using EL = typename Scalar<T>::Type;
    constexpr size_t alignment = sizeof(float);

    if(!isBasePlusOffset)
    {
        for(int i = 0; i < SIMD::Width; i++)
        {
            If(Extract(mask, i) != 0)
            {
                rr::Store(Extract(val, i), scalar::Pointer<EL>(pointers[i]), alignment, atomic, order);
            }
        }
        return;
    }

    auto offs = offsets();
    switch(robustness)
    {
    case OutOfBoundsBehavior::Nullify:
    case OutOfBoundsBehavior::RobustBufferAccess:       // TODO: Allows writing anywhere within bounds. Could be faster than masking.
    case OutOfBoundsBehavior::UndefinedValue:           // Should not be used for store operations. Treat as robust buffer access.
        mask &= isInBounds(sizeof(float), robustness);  // Disable out-of-bounds writes.
        break;
    case OutOfBoundsBehavior::UndefinedBehavior:
        // Nothing to do. Application/compiler must guarantee no out-of-bounds accesses.
        break;
    }

    if(!atomic && order == std::memory_order_relaxed)
    {
        if(hasStaticEqualOffsets())
        {
            If(AnyTrue(mask))
            {
                assert(SIMD::Width == 4);

                // All equal. One of these writes will win -- elect the winning lane.
                auto v0111 = SIMD::Int(0, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF);
                auto elect = mask & ~(v0111 & (mask.xxyz | mask.xxxy | mask.xxxx));
                auto maskedVal = As<SIMD::Int>(val) & elect;
                auto scalarVal = Extract(maskedVal, 0) |
                                 Extract(maskedVal, 1) |
                                 Extract(maskedVal, 2) |
                                 Extract(maskedVal, 3);
                *scalar::Pointer<EL>(base + staticOffsets[0], alignment) = As<EL>(scalarVal);
            }
        }
        else if(hasStaticSequentialOffsets(sizeof(float)) &&
                isStaticallyInBounds(sizeof(float), robustness))
        {
            // TODO(b/195446858): Optimize using masked store.
            // Pointer has no elements OOB, and the store is not atomic.
            // Perform a read-modify-write.
            auto p = scalar::Pointer<SIMD::Int>(base + staticOffsets[0], alignment);
            auto prev = *p;
            *p = (prev & ~mask) | (As<SIMD::Int>(val) & mask);
        }
        else
        {
            Scatter(scalar::Pointer<EL>(base), val, offs, mask, alignment);
        }
    }
    else
    {
        auto anyLanesDisabled = AnyFalse(mask);
        If(hasStaticSequentialOffsets(sizeof(float)) && !anyLanesDisabled)
        {
            // Store all elements in a single SIMD instruction.
            auto offset = Extract(offs, 0);
            rr::Store(val, scalar::Pointer<T>(&base[offset]), alignment, atomic, order);
        }
        Else
        {
            // Divergent offsets or masked lanes.
            for(int i = 0; i < SIMD::Width; i++)
            {
                If(Extract(mask, i) != 0)
                {
                    auto offset = Extract(offs, i);
                    rr::Store(Extract(val, i), scalar::Pointer<EL>(&base[offset]), alignment, atomic, order);
                }
            }
        }
    }
}

template<>
inline void SIMD::Pointer::Store(SIMD::Pointer val, OutOfBoundsBehavior robustness, SIMD::Int mask, bool atomic /* = false */, std::memory_order order /* = std::memory_order_relaxed */)
{
    constexpr size_t alignment = sizeof(void *);

    for(int i = 0; i < SIMD::Width; i++)
    {
        If(Extract(mask, i) != 0)
        {
            rr::Store(val.getPointerForLane(i), scalar::Pointer<scalar::Pointer<Byte>>(getPointerForLane(i)), alignment, atomic, order);
        }
    }
}

template<typename T>
inline void SIMD::Pointer::Store(RValue<T> val, OutOfBoundsBehavior robustness, SIMD::Int mask, bool atomic /* = false */, std::memory_order order /* = std::memory_order_relaxed */)
{
    Store(T(val), robustness, mask, atomic, order);
}

}  // namespace rr

#endif  // rr_SIMD_hpp