api/ssevector_8h_source.html

 /*

     This file is part of Mitsuba, a physically based rendering system.


     Copyright (c) 2007-2014 by Wenzel Jakob and others.


     Mitsuba is free software; you can redistribute it and/or modify

     it under the terms of the GNU General Public License Version 3

     as published by the Free Software Foundation.


     Mitsuba is distributed in the hope that it will be useful,

     but WITHOUT ANY WARRANTY; without even the implied warranty of

     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

     GNU General Public License for more details.


     You should have received a copy of the GNU General Public License

     along with this program. If not, see <http://www.gnu.org/licenses/>.

 */


 /*============================================================================

   HDRITools - High Dynamic Range Image Tools

   Copyright 2008-2012 Program of Computer Graphics, Cornell University


   Permission is hereby granted, free of charge, to any person obtaining a copy

   of this software and associated documentation files (the "Software"), to deal

   in the Software without restriction, including without limitation the rights

   to use, copy, modify, merge, publish, distribute, sublicense, and/or sell

   copies of the Software, and to permit persons to whom the Software is

   furnished to do so, subject to the following conditions:


   The above copyright notice and this permission notice shall be included in

   all copies or substantial portions of the Software.


   THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR

   IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,

   FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE

   AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER

   LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,

   OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN

   THE SOFTWARE.

  -----------------------------------------------------------------------------

  Primary author:

      Edgar Velazquez-Armendariz <cs#cornell#edu - eva5>

 ============================================================================*/


 #pragma once

 #if !defined(__MITSUBA_CORE_SSEVECTOR_H_)

 #define __MITSUBA_CORE_SSEVECTOR_H_


 #include <mitsuba/core/platform.h>

 #include <mitsuba/core/sse.h>


 #if !MTS_SSE

 # error "This header requires SSE support"

 #endif


 MTS_NAMESPACE_BEGIN


 namespace math

 {


 // Forward declarations, required by Clang and ICL 12.1.
 // Both vector wrappers are declared here so that the free-standing
 // shuffle templates below (also defined as friends inside SSEVector4f)
 // are visible to ordinary name lookup.
 struct SSEVector4f;
 struct SSEVector4i;

 /// Two-source shuffle: low 64 bits taken from \c low, high 64 bits from \c hi
 template <int idx3, int idx2, int idx1, int idx0>
 SSEVector4f shuffle(const SSEVector4f& low, const SSEVector4f& hi);

 /// Single-source shuffle of the elements of \c a
 template <int idx3, int idx2, int idx1, int idx0>
 SSEVector4f shuffle(const SSEVector4f& a);


 /**
  * \brief Thin value wrapper around a \c __m128 register holding four
  * packed single-precision values.
  *
  * All operations act lane-wise. Comparison functions and operators do
  * not return \c bool: they return a vector mask whose lanes are all-ones
  * where the predicate holds and all-zeros otherwise, suitable for use
  * with \ref select.
  */
 struct SSEVector4f
 {
 private:
         __m128 xmm;

 public:
         /// Default constructor: the contents are left uninitialized
         SSEVector4f() {}
         /// Copy constructor
         SSEVector4f(const SSEVector4f& other) : xmm(other.xmm) {}
         /// Implicitly wrap a raw \c __m128 value
         SSEVector4f(__m128 val) : xmm(val) {}
         /// Broadcast \c val to all four lanes
         explicit SSEVector4f(float val) : xmm(_mm_set1_ps(val)) {}
         /// Set the lanes individually; \c f0 is the lowest lane, \c f3 the highest
         SSEVector4f(float f3, float f2, float f1, float f0) :
         xmm(_mm_set_ps(f3, f2, f1, f0))
         {}

         /// Broadcast \c val to all four lanes
         inline SSEVector4f& operator= (float val) {
                 xmm = _mm_set1_ps(val);
                 return *this;
         }

         /// Vector with all lanes set to zero
         inline static SSEVector4f zero() {
                 return _mm_setzero_ps();
         }

         /// Implicit access to the underlying register
         operator __m128() const {
                 return xmm;
         }

         /// Bitwise a & b
         friend SSEVector4f operator& (const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_and_ps(a.xmm, b.xmm);
         }
         /// Bitwise a | b
         friend SSEVector4f operator| (const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_or_ps(a.xmm, b.xmm);
         }
         /// Bitwise a ^ b
         friend SSEVector4f operator^ (const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_xor_ps(a.xmm, b.xmm);
         }
         /// ~a & b
         friend SSEVector4f andnot(const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_andnot_ps(a.xmm, b.xmm);
         }

         SSEVector4f& operator&= (const SSEVector4f& a) {
                 xmm = _mm_and_ps(xmm, a.xmm);
                 return *this;
         }
         SSEVector4f& operator|= (const SSEVector4f& a) {
                 xmm = _mm_or_ps(xmm, a.xmm);
                 return *this;
         }
         SSEVector4f& operator^= (const SSEVector4f& a) {
                 xmm = _mm_xor_ps(xmm, a.xmm);
                 return *this;
         }

         /// Lane-wise a + b
         friend SSEVector4f operator+ (const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_add_ps(a.xmm, b.xmm);
         }
         /// Lane-wise a - b
         friend SSEVector4f operator- (const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_sub_ps(a.xmm, b.xmm);
         }
         /// Lane-wise a * b
         friend SSEVector4f operator* (const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_mul_ps(a.xmm, b.xmm);
         }
         /// Lane-wise a / b
         friend SSEVector4f operator/ (const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_div_ps(a.xmm, b.xmm);
         }

         SSEVector4f& operator+= (const SSEVector4f& a) {
                 xmm = _mm_add_ps(xmm, a.xmm);
                 return *this;
         }
         SSEVector4f& operator-= (const SSEVector4f& a) {
                 xmm = _mm_sub_ps(xmm, a.xmm);
                 return *this;
         }
         SSEVector4f& operator*= (const SSEVector4f& a) {
                 xmm = _mm_mul_ps(xmm, a.xmm);
                 return *this;
         }
         SSEVector4f& operator/= (const SSEVector4f& a) {
                 xmm = _mm_div_ps(xmm, a.xmm);
                 return *this;
         }

         /**
          * \brief Newton-Raphson Reciprocal:
          * \f[ 2 * rcp(x) - (x * rcp(x) * rcp(x)) \f]
          *
          * Refines the hardware reciprocal estimate with one
          * Newton-Raphson iteration.
          */
         friend inline SSEVector4f rcp_nr(const SSEVector4f& v) {
                 __m128 x0 = _mm_rcp_ps(v.xmm);
                 return _mm_sub_ps(_mm_add_ps(x0,x0),
                         _mm_mul_ps(_mm_mul_ps(x0,v.xmm), x0));
         }

         /// Approximate reciprocal (hardware estimate, see \c _mm_rcp_ps)
         friend inline SSEVector4f rcp(const SSEVector4f& v) {
                 return _mm_rcp_ps(v.xmm);
         }

         /// Lane-wise minimum
         friend SSEVector4f min(const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_min_ps(a.xmm, b.xmm);
         }
         /// Lane-wise maximum
         friend SSEVector4f max(const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_max_ps(a.xmm, b.xmm);
         }

         /// Mask of the lanes of \c a which are NaN
         friend SSEVector4f isnan(const SSEVector4f& a) {
                 return _mm_cmpunord_ps(a.xmm, a.xmm);
         }
         /// Mask of the lanes where either \c a or \c b is NaN
         friend SSEVector4f isnan(const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_cmpunord_ps(a.xmm, b.xmm);
         }

         /**
          * \brief Moves either of the values of \c low into the low 64-bits
          * of the result, and either of the values of \c hi into
          * the high 64-bits of the result. Each index in the
          * template is an index in the range [0,3] to choose a value from the
          * source, 0 being the lowest and 3 the highest.
          *
          * \c idx0 and \c idx1 select from \c low, \c idx2 and \c idx3
          * select from \c hi.
          */
         template <int idx3, int idx2, int idx1, int idx0>
         friend SSEVector4f shuffle(const SSEVector4f& low, const SSEVector4f& hi) {
                 return _mm_shuffle_ps(low.xmm,hi.xmm,_MM_SHUFFLE(idx3,idx2,idx1,idx0));
         }

         /// Shuffles the elements of the given vector using the indices [0,3]
         template <int idx3, int idx2, int idx1, int idx0>
         friend SSEVector4f shuffle(const SSEVector4f& a) {
                 return _mm_shuffle_ps(a.xmm, a.xmm, _MM_SHUFFLE(idx3,idx2,idx1,idx0));
         }

         /// a == b
         friend SSEVector4f cmpeq(const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_cmpeq_ps(a.xmm, b.xmm);
         }
         /// a < b
         friend SSEVector4f cmplt(const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_cmplt_ps(a.xmm, b.xmm);
         }
         /// a <= b
         friend SSEVector4f cmple(const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_cmple_ps(a.xmm, b.xmm);
         }
         /// a > b
         friend SSEVector4f cmpgt(const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_cmpgt_ps(a.xmm, b.xmm);
         }
         /// a >= b
         friend SSEVector4f cmpge(const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_cmpge_ps(a.xmm, b.xmm);
         }
         /// a != b
         friend SSEVector4f cmpneq(const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_cmpneq_ps(a.xmm, b.xmm);
         }
         /// !(a < b)
         friend SSEVector4f cmpnlt(const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_cmpnlt_ps(a.xmm, b.xmm);
         }
         /// !(a <= b)
         friend SSEVector4f cmpnle(const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_cmpnle_ps(a.xmm, b.xmm);
         }
         /// !(a > b)
         friend SSEVector4f cmpngt(const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_cmpngt_ps(a.xmm, b.xmm);
         }
         /// !(a >= b)
         friend SSEVector4f cmpnge(const SSEVector4f& a, const SSEVector4f& b) {
                 return _mm_cmpnge_ps(a.xmm, b.xmm);
         }

         /// Lane mask of a == b (not a \c bool)
         friend SSEVector4f operator==(const SSEVector4f& a, const SSEVector4f& b) {
                 return cmpeq(a, b);
         }
         /// Lane mask of a != b (not a \c bool)
         friend SSEVector4f operator!=(const SSEVector4f& a, const SSEVector4f& b) {
                 return cmpneq(a, b);
         }
         /// Lane mask of a < b (not a \c bool)
         friend SSEVector4f operator<(const SSEVector4f& a, const SSEVector4f& b) {
                 return cmplt(a, b);
         }
         /// Lane mask of a <= b (not a \c bool)
         friend SSEVector4f operator<=(const SSEVector4f& a, const SSEVector4f& b) {
                 return cmple(a, b);
         }
         /// Lane mask of a > b (not a \c bool)
         friend SSEVector4f operator>(const SSEVector4f& a, const SSEVector4f& b) {
                 return cmpgt(a, b);
         }
         /// Lane mask of a >= b (not a \c bool)
         friend SSEVector4f operator>=(const SSEVector4f& a, const SSEVector4f& b) {
                 return cmpge(a, b);
         }

         /**
          * \brief Select/blend operation <tt>(mask) ? a : b</tt>
          *
          * The selection is bitwise: every set bit of \c mask picks the
          * corresponding bit of \c a, every cleared bit picks \c b.
          */
         friend inline SSEVector4f select(const SSEVector4f& mask,
                 const SSEVector4f& a, const SSEVector4f& b) {
                 // Alternative method by Jim Conyngham/Wikipedia MD5 page, via
                 // http://markplusplus.wordpress.com/2007/03/14/fast-sse-select-operation/ [July 2012]
                 return _mm_xor_ps(b.xmm, _mm_and_ps(mask.xmm, _mm_xor_ps(a.xmm, b.xmm)));
         }

         /**
          * \brief Round \c a towards zero
          *
          * Lanes whose magnitude is at least 2^23 (as well as NaN and
          * infinities) are returned unchanged: such single-precision
          * values have no fractional part, and passing them through the
          * 32-bit integer conversion would overflow for |a| >= 2^31 and
          * yield -2147483648 instead of the input.
          */
         friend inline SSEVector4f roundTruncate(const SSEVector4f& a) {
                 // Clear the sign bit to obtain |a|
                 const __m128 absMask = _mm_castsi128_ps(_mm_set1_epi32(0x7FFFFFFF));
                 const __m128 magnitude = _mm_and_ps(a.xmm, absMask);
                 // True only where a fractional part may exist; false for NaN
                 const __m128 hasFraction =
                         _mm_cmplt_ps(magnitude, _mm_set1_ps(8388608.0f));
                 const __m128 truncated = _mm_cvtepi32_ps(_mm_cvttps_epi32(a.xmm));
                 // hasFraction ? truncated : a
                 return _mm_xor_ps(a.xmm,
                         _mm_and_ps(hasFraction, _mm_xor_ps(truncated, a.xmm)));
         }

         /// Save to \c dest without polluting the cache (\c _mm_stream_ps requires 16-byte alignment)
         friend inline void stream(SSEVector4f* dest, const SSEVector4f& value) {
                 _mm_stream_ps(reinterpret_cast<float*>(dest), value.xmm);
         }
         /// Save to \c dest without polluting the cache (\c _mm_stream_ps requires 16-byte alignment)
         friend inline void stream(__m128* dest, const SSEVector4f& value) {
                 _mm_stream_ps(reinterpret_cast<float*>(dest), value.xmm);
         }
         /// Save to \c dest without polluting the cache (\c _mm_stream_ps requires 16-byte alignment)
         friend inline void stream(float* dest, const SSEVector4f& value) {
                 _mm_stream_ps(dest, value.xmm);
         }
 };


 /**
  * \brief Value wrapper around a \c __m128i register interpreted as four
  * packed 32-bit integers.
  *
  * Comparisons return a lane mask (all bits set where the predicate
  * holds, zero elsewhere) rather than a \c bool.
  */
 struct SSEVector4i
 {
 private:
         __m128i xmm;

 public:
         /// Default constructor: the lanes are left uninitialized
         SSEVector4i() {}
         /// Copy the register held by \c val
         SSEVector4i(const SSEVector4i& val) : xmm(val.xmm) {}
         /// Implicitly wrap a raw \c __m128i value
         SSEVector4i(__m128i val) : xmm(val) {}
         /// Replicate \c val into all four lanes
         explicit SSEVector4i(int32_t val) : xmm(_mm_set1_epi32(val)) {}
         /// Set each lane; \c i0 is the lowest lane and \c i3 the highest
         SSEVector4i(int32_t i3, int32_t i2, int32_t i1, int32_t i0) :
         xmm(_mm_set_epi32(i3, i2, i1, i0))
         {}

         /// Replicate \c val into all four lanes
         SSEVector4i& operator= (int32_t val) {
                 const __m128i broadcast = _mm_set1_epi32(val);
                 xmm = broadcast;
                 return *this;
         }

         /// Vector with every lane equal to zero
         inline static SSEVector4i zero() {
                 return SSEVector4i(_mm_setzero_si128());
         }

         /// Implicit access to the underlying register
         operator __m128i() const {
                 return xmm;
         }

         /// Bitwise a & b
         friend SSEVector4i operator& (const SSEVector4i& a, const SSEVector4i& b) {
                 return SSEVector4i(_mm_and_si128(a.xmm, b.xmm));
         }
         /// Bitwise a | b
         friend SSEVector4i operator| (const SSEVector4i& a, const SSEVector4i& b) {
                 return SSEVector4i(_mm_or_si128(a.xmm, b.xmm));
         }
         /// Bitwise a ^ b
         friend SSEVector4i operator^ (const SSEVector4i& a, const SSEVector4i& b) {
                 return SSEVector4i(_mm_xor_si128(a.xmm, b.xmm));
         }
         /// ~a & b
         friend SSEVector4i andnot(const SSEVector4i& a, const SSEVector4i& b) {
                 return SSEVector4i(_mm_andnot_si128(a.xmm, b.xmm));
         }

         /// In-place bitwise AND
         SSEVector4i& operator&= (const SSEVector4i& a) {
                 const __m128i combined = _mm_and_si128(xmm, a.xmm);
                 xmm = combined;
                 return *this;
         }
         /// In-place bitwise OR
         SSEVector4i& operator|= (const SSEVector4i& a) {
                 const __m128i combined = _mm_or_si128(xmm, a.xmm);
                 xmm = combined;
                 return *this;
         }
         /// In-place bitwise XOR
         SSEVector4i& operator^= (const SSEVector4i& a) {
                 const __m128i combined = _mm_xor_si128(xmm, a.xmm);
                 xmm = combined;
                 return *this;
         }

         /// Lane-wise a + b
         friend SSEVector4i operator+ (const SSEVector4i& a, const SSEVector4i& b) {
                 return SSEVector4i(_mm_add_epi32(a.xmm, b.xmm));
         }
         /// Lane-wise a - b
         friend SSEVector4i operator- (const SSEVector4i& a, const SSEVector4i& b) {
                 return SSEVector4i(_mm_sub_epi32(a.xmm, b.xmm));
         }

         /// In-place lane-wise addition
         SSEVector4i& operator+= (const SSEVector4i& a) {
                 const __m128i sum = _mm_add_epi32(xmm, a.xmm);
                 xmm = sum;
                 return *this;
         }
         /// In-place lane-wise subtraction
         SSEVector4i& operator-= (const SSEVector4i& a) {
                 const __m128i difference = _mm_sub_epi32(xmm, a.xmm);
                 xmm = difference;
                 return *this;
         }

         /// Test if all elements are zero
         inline bool isZero() const {
                 // Each lane equal to zero contributes four set bits to the
                 // byte mask, so all 16 bits are set only if every lane is zero
                 const __m128i zeroLanes = _mm_cmpeq_epi32(xmm, _mm_setzero_si128());
                 const int byteMask = _mm_movemask_epi8(zeroLanes);
                 return byteMask == 0xFFFF;
         }

         /// a == b
         friend SSEVector4i cmpeq(const SSEVector4i& a, const SSEVector4i& b) {
                 return SSEVector4i(_mm_cmpeq_epi32(a.xmm, b.xmm));
         }
         /// a < b
         friend SSEVector4i cmplt(const SSEVector4i& a, const SSEVector4i& b) {
                 return SSEVector4i(_mm_cmplt_epi32(a.xmm, b.xmm));
         }
         /// a > b
         friend SSEVector4i cmpgt(const SSEVector4i& a, const SSEVector4i& b) {
                 return SSEVector4i(_mm_cmpgt_epi32(a.xmm, b.xmm));
         }

         /// Lane mask of a == b (not a \c bool)
         friend SSEVector4i operator==(const SSEVector4i& a, const SSEVector4i& b) {
                 return SSEVector4i(_mm_cmpeq_epi32(a.xmm, b.xmm));
         }
         /// Lane mask of a < b (not a \c bool)
         friend SSEVector4i operator<(const SSEVector4i& a, const SSEVector4i& b) {
                 return SSEVector4i(_mm_cmplt_epi32(a.xmm, b.xmm));
         }
         /// Lane mask of a > b (not a \c bool)
         friend SSEVector4i operator>(const SSEVector4i& a, const SSEVector4i& b) {
                 return SSEVector4i(_mm_cmpgt_epi32(a.xmm, b.xmm));
         }

         /**
          * \brief Select/blend: <tt>(mask) ? a : b</tt>
          *
          * Works bit by bit: set bits of \c mask take the bit from \c a,
          * cleared bits take it from \c b.
          */
         friend inline SSEVector4i select(const SSEVector4i& mask,
                 const SSEVector4i& a, const SSEVector4i& b) {
                 // Alternative method by Jim Conyngham/Wikipedia MD5 page, via
                 // http://markplusplus.wordpress.com/2007/03/14/fast-sse-select-operation/ [July 2012]
                 const __m128i differing = _mm_xor_si128(a.xmm, b.xmm);
                 const __m128i chosen = _mm_and_si128(mask.xmm, differing);
                 return SSEVector4i(_mm_xor_si128(b.xmm, chosen));
         }

         /**
          * \brief Reference to a statically stored constant whose lanes
          * are given as template arguments (\c i0 is the lowest lane)
          */
         template <int32_t i3, int32_t i2, int32_t i1, int32_t i0>
         static const __m128i& constant() {
                 static const union {
                         int32_t lanes[4];
                         __m128i reg;
                 } storage = {{i0, i1, i2, i3}};
                 return storage.reg;
         }

         /**
          * \brief Reference to a statically stored constant with all four
          * lanes equal to \c value
          */
         template <int32_t value>
         static const __m128i& constant() {
                 static const union {
                         int32_t lanes[4];
                         __m128i reg;
                 } storage = {{value, value, value, value}};
                 return storage.reg;
         }

         /// Shift right by \c count bits while shifting in zeros
         friend inline SSEVector4i srl(const SSEVector4i& a, int count) {
                 return SSEVector4i(_mm_srli_epi32(a.xmm, count));
         }

         /// Shift left by \c count bits while shifting in zeros
         friend inline SSEVector4i sll(const SSEVector4i& a, int count) {
                 return SSEVector4i(_mm_slli_epi32(a.xmm, count));
         }

         /// Save to \c dest without polluting the cache
         friend inline void stream(SSEVector4i* dest, const SSEVector4i& value) {
                 __m128i* const target = &(dest->xmm);
                 _mm_stream_si128(target, value.xmm);
         }
         /// Save to \c dest without polluting the cache
         friend inline void stream(__m128i* dest, const SSEVector4i& value) {
                 _mm_stream_si128(dest, value.xmm);
         }
 };


 /// Reinterprets the bits of \c a as a \c SSEVector4i (no numeric conversion)
 inline SSEVector4i castAsInt(const SSEVector4f& a) {
         const __m128 bits = a;
         return SSEVector4i(_mm_castps_si128(bits));
 }

 /// Converts each lane of \c a to a 32-bit integer, truncating towards zero
 inline SSEVector4i toInt(const SSEVector4f& a) {
         const __m128 values = a;
         return SSEVector4i(_mm_cvttps_epi32(values));
 }

 /**
  * \brief Converts each lane of \c a to a 32-bit integer using rounding
  *
  * The rounding follows the current SSE rounding mode (as performed by
  * \c _mm_cvtps_epi32).
  */
 inline SSEVector4i roundToInt(const SSEVector4f& a) {
         const __m128 values = a;
         return SSEVector4i(_mm_cvtps_epi32(values));
 }


 /// Reinterprets the bits of \c a as a \c SSEVector4f (no numeric conversion)
 inline SSEVector4f castAsFloat(const SSEVector4i& a) {
         const __m128i bits = a;
         return SSEVector4f(_mm_castsi128_ps(bits));
 }

 /// Converts each 32-bit integer lane of \c a to single-precision floating point
 inline SSEVector4f toFloat(const SSEVector4i& a) {
         const __m128i values = a;
         return SSEVector4f(_mm_cvtepi32_ps(values));
 }


 /**
  * \brief In-place transposition of a 4-by-4 matrix given by its rows.
  *
  * On entry <tt>row0</tt>, <tt>row1</tt>, <tt>row2</tt> and <tt>row3</tt>
  * hold the rows of the matrix. On return \c row0 holds column 0 of the
  * original matrix, \c row1 holds column 1, and so on.
  * \author Intel Intrinsics Guide for AVX2
  */
 FINLINE void transpose(SSEVector4f& row0, SSEVector4f& row1,
         SSEVector4f& row2, SSEVector4f& row3) {
         // Interleave the row pairs (0,1) and (2,3): the "lo" results hold
         // elements of columns 0 and 1, the "hi" results those of columns 2 and 3
         const __m128 lo01 = _mm_unpacklo_ps(row0, row1);
         const __m128 hi01 = _mm_unpackhi_ps(row0, row1);
         const __m128 lo23 = _mm_unpacklo_ps(row2, row3);
         const __m128 hi23 = _mm_unpackhi_ps(row2, row3);

         // Combine matching 64-bit halves into complete columns
         row0 = _mm_movelh_ps(lo01, lo23);
         row1 = _mm_movehl_ps(lo23, lo01);
         row2 = _mm_movelh_ps(hi01, hi23);
         row3 = _mm_movehl_ps(hi23, hi01);
 }


 } // namespace math


 MTS_NAMESPACE_END


 #endif /* __MITSUBA_CORE_SSEVECTOR_H_ */

mitsuba::math::SSEVector4i::SSEVector4i
SSEVector4i(int32_t i3, int32_t i2, int32_t i1, int32_t i0)
Definition: ssevector.h:302

mitsuba::math::SSEVector4i::SSEVector4i
SSEVector4i(int32_t val)
Definition: ssevector.h:301

sse.h

mitsuba::math::SSEVector4f::cmple
friend SSEVector4f cmple(const SSEVector4f &a, const SSEVector4f &b)
a <= b
Definition: ssevector.h:211

mitsuba::math::castAsInt
SSEVector4i castAsInt(const SSEVector4f &a)
Reinterprets a as a SSEVector4i.
Definition: ssevector.h:436

mitsuba::math::SSEVector4f::select
friend SSEVector4f select(const SSEVector4f &mask, const SSEVector4f &a, const SSEVector4f &b)
Select/blend operation (mask) ? a : b
Definition: ssevector.h:263

mitsuba::math::SSEVector4i::isZero
bool isZero() const
Test if all elements are zero.
Definition: ssevector.h:361

mitsuba::math::castAsFloat
SSEVector4f castAsFloat(const SSEVector4i &a)
Reinterprets a as a SSEVector4f.
Definition: ssevector.h:449

mitsuba::math::SSEVector4f::max
friend SSEVector4f max(const SSEVector4f &a, const SSEVector4f &b)
Definition: ssevector.h:173

mitsuba::operator*
Matrix< M1, N2, T > operator*(const Matrix< M1, N1, T > &mat1, const Matrix< M2, N2, T > &mat2)
Matrix multiplication (creates a temporary)
Definition: matrix.h:745

mitsuba::math::SSEVector4f::cmpnlt
friend SSEVector4f cmpnlt(const SSEVector4f &a, const SSEVector4f &b)
!(a < b)
Definition: ssevector.h:227

mitsuba::math::SSEVector4i::SSEVector4i
SSEVector4i()
Definition: ssevector.h:298

mitsuba::math::SSEVector4i::stream
friend void stream(SSEVector4i *dest, const SSEVector4i &value)
Save to dest without polluting the cache.
Definition: ssevector.h:426

mitsuba::math::SSEVector4i::select
friend SSEVector4i select(const SSEVector4i &mask, const SSEVector4i &a, const SSEVector4i &b)
Select/blend: (mask) ? a : b
Definition: ssevector.h:389

mitsuba::math::SSEVector4i::cmpeq
friend SSEVector4i cmpeq(const SSEVector4i &a, const SSEVector4i &b)
a == b
Definition: ssevector.h:367

mitsuba::math::SSEVector4i::operator>
friend SSEVector4i operator>(const SSEVector4i &a, const SSEVector4i &b)
Definition: ssevector.h:384

mitsuba::math::SSEVector4f::SSEVector4f
SSEVector4f(float val)
Definition: ssevector.h:81

mitsuba::math::SSEVector4f::cmpnle
friend SSEVector4f cmpnle(const SSEVector4f &a, const SSEVector4f &b)
!(a <= b)
Definition: ssevector.h:231

mitsuba::math::SSEVector4f
Definition: ssevector.h:72

mitsuba::math::SSEVector4f::operator<
friend SSEVector4f operator<(const SSEVector4f &a, const SSEVector4f &b)
Definition: ssevector.h:249

mitsuba::math::SSEVector4i::SSEVector4i
SSEVector4i(__m128i val)
Definition: ssevector.h:300

platform.h

mitsuba::math::SSEVector4f::stream
friend void stream(__m128 *dest, const SSEVector4f &value)
Save to dest without polluting the cache.
Definition: ssevector.h:281

mitsuba::math::SSEVector4f::cmpge
friend SSEVector4f cmpge(const SSEVector4f &a, const SSEVector4f &b)
a >= b
Definition: ssevector.h:219

mitsuba::math::SSEVector4i
Definition: ssevector.h:292

mitsuba::math::SSEVector4i::constant
static const __m128i & constant()
Definition: ssevector.h:398

mitsuba::math::SSEVector4f::operator==
friend SSEVector4f operator==(const SSEVector4f &a, const SSEVector4f &b)
Definition: ssevector.h:243

MTS_NAMESPACE_BEGIN
#define MTS_NAMESPACE_BEGIN
Definition: platform.h:137

mitsuba::math::SSEVector4i::operator==
friend SSEVector4i operator==(const SSEVector4i &a, const SSEVector4i &b)
Definition: ssevector.h:378

mitsuba::math::transpose
FINLINE void transpose(SSEVector4f &row0, SSEVector4f &row1, SSEVector4f &row2, SSEVector4f &row3)
The arguments row0, row1, row2 and row3 are __m128 values whose elements form the corresponding rows ...
Definition: ssevector.h:466

mitsuba::math::toFloat
SSEVector4f toFloat(const SSEVector4i &a)
Convert a to floating point.
Definition: ssevector.h:453

mitsuba::math::SSEVector4f::rcp
friend SSEVector4f rcp(const SSEVector4f &v)
Definition: ssevector.h:166

mitsuba::math::SSEVector4f::cmpeq
friend SSEVector4f cmpeq(const SSEVector4f &a, const SSEVector4f &b)
a == b
Definition: ssevector.h:203

mitsuba::math::SSEVector4f::operator!=
friend SSEVector4f operator!=(const SSEVector4f &a, const SSEVector4f &b)
Definition: ssevector.h:246

mitsuba::math::SSEVector4f::rcp_nr
friend SSEVector4f rcp_nr(const SSEVector4f &v)
Newton-Raphson reciprocal: 2 * rcp(x) - (x * rcp(x) * rcp(x)).
Definition: ssevector.h:160

mitsuba::math::SSEVector4f::cmplt
friend SSEVector4f cmplt(const SSEVector4f &a, const SSEVector4f &b)
a < b
Definition: ssevector.h:207

mitsuba::math::SSEVector4f::operator>
friend SSEVector4f operator>(const SSEVector4f &a, const SSEVector4f &b)
Definition: ssevector.h:255

mitsuba::math::SSEVector4i::SSEVector4i
SSEVector4i(const SSEVector4i &val)
Definition: ssevector.h:299

mitsuba::math::SSEVector4f::min
friend SSEVector4f min(const SSEVector4f &a, const SSEVector4f &b)
Definition: ssevector.h:170

mitsuba::math::SSEVector4f::cmpnge
friend SSEVector4f cmpnge(const SSEVector4f &a, const SSEVector4f &b)
!(a >= b)
Definition: ssevector.h:239

mitsuba::math::shuffle
SSEVector4f shuffle(const SSEVector4f &a)
Definition: ssevector.h:198

mitsuba::math::SSEVector4f::stream
friend void stream(SSEVector4f *dest, const SSEVector4f &value)
Save to dest without polluting the cache.
Definition: ssevector.h:277

mitsuba::math::toInt
SSEVector4i toInt(const SSEVector4f &a)
Convert a to integer using truncate.
Definition: ssevector.h:440

mitsuba::math::SSEVector4f::cmpgt
friend SSEVector4f cmpgt(const SSEVector4f &a, const SSEVector4f &b)
a > b
Definition: ssevector.h:215

mitsuba::math::SSEVector4f::SSEVector4f
SSEVector4f(const SSEVector4f &other)
Definition: ssevector.h:79

mitsuba::math::SSEVector4f::roundTruncate
friend SSEVector4f roundTruncate(const SSEVector4f &a)
Round a towards zero.
Definition: ssevector.h:271

mitsuba::math::SSEVector4f::cmpneq
friend SSEVector4f cmpneq(const SSEVector4f &a, const SSEVector4f &b)
a != b
Definition: ssevector.h:223

mitsuba::math::SSEVector4f::SSEVector4f
SSEVector4f()
Definition: ssevector.h:78

mitsuba::math::SSEVector4f::andnot
friend SSEVector4f andnot(const SSEVector4f &a, const SSEVector4f &b)
~a & b
Definition: ssevector.h:109

mitsuba::math::SSEVector4i::cmplt
friend SSEVector4i cmplt(const SSEVector4i &a, const SSEVector4i &b)
a < b
Definition: ssevector.h:371

mitsuba::math::SSEVector4f::operator<=
friend SSEVector4f operator<=(const SSEVector4f &a, const SSEVector4f &b)
Definition: ssevector.h:252

mitsuba::math::SSEVector4f::SSEVector4f
SSEVector4f(__m128 val)
Definition: ssevector.h:80

mitsuba::math::SSEVector4i::operator<
friend SSEVector4i operator<(const SSEVector4i &a, const SSEVector4i &b)
Definition: ssevector.h:381

mitsuba::math::SSEVector4i::srl
friend SSEVector4i srl(const SSEVector4i &a, int count)
Shift right by count bits while shifting in zeros.
Definition: ssevector.h:416

mitsuba::math::SSEVector4i::constant
static const __m128i & constant()
Definition: ssevector.h:407

mitsuba::math::SSEVector4i::andnot
friend SSEVector4i andnot(const SSEVector4i &a, const SSEVector4i &b)
~a & b
Definition: ssevector.h:329

mitsuba::math::SSEVector4f::zero
static SSEVector4f zero()
Definition: ssevector.h:91

mitsuba::math::SSEVector4i::cmpgt
friend SSEVector4i cmpgt(const SSEVector4i &a, const SSEVector4i &b)
a > b
Definition: ssevector.h:375

mitsuba::math::SSEVector4f::isnan
friend SSEVector4f isnan(const SSEVector4f &a)
Definition: ssevector.h:177

mitsuba::math::SSEVector4f::isnan
friend SSEVector4f isnan(const SSEVector4f &a, const SSEVector4f &b)
Definition: ssevector.h:180

math::roundToInt
int roundToInt(float value)
Integer round function (single precision)
Definition: math.h:106

mitsuba::math::SSEVector4i::stream
friend void stream(__m128i *dest, const SSEVector4i &value)
Save to dest without polluting the cache.
Definition: ssevector.h:430

mitsuba::math::SSEVector4f::cmpngt
friend SSEVector4f cmpngt(const SSEVector4f &a, const SSEVector4f &b)
!(a > b)
Definition: ssevector.h:235

mitsuba::math::SSEVector4i::sll
friend SSEVector4i sll(const SSEVector4i &a, int count)
Shift left by count bits while shifting in zeros.
Definition: ssevector.h:421

MTS_NAMESPACE_END
#define MTS_NAMESPACE_END
Definition: platform.h:138

mitsuba::math::SSEVector4f::operator>=
friend SSEVector4f operator>=(const SSEVector4f &a, const SSEVector4f &b)
Definition: ssevector.h:258

mitsuba::math::SSEVector4i::zero
static SSEVector4i zero()
Definition: ssevector.h:311

mitsuba::math::SSEVector4f::stream
friend void stream(float *dest, const SSEVector4f &value)
Save to dest without polluting the cache.
Definition: ssevector.h:285

mitsuba::math::SSEVector4f::SSEVector4f
SSEVector4f(float f3, float f2, float f1, float f0)
Definition: ssevector.h:82