nebula-doc/vec3_8h_source.html

#pragma once

//------------------------------------------------------------------------------

#include "core/types.h"

#include "math/scalar.h"

#include "core/simd.h"


//------------------------------------------------------------------------------

namespace Math

{

struct mat4;

struct vec3;


/// Shared SIMD constants. Arguments to set_f32x4 are given in x, y, z, w lane order.
/// NOTE: these are `static const` in a header, so every translation unit gets its own copy.

/// unit vector along x: (1, 0, 0, 0)
static const f32x4 _id_x = set_f32x4(1.0f, 0.0f, 0.0f, 0.0f);

/// unit vector along y: (0, 1, 0, 0)
static const f32x4 _id_y = set_f32x4(0.0f, 1.0f, 0.0f, 0.0f);

/// unit vector along z: (0, 0, 1, 0)
static const f32x4 _id_z = set_f32x4(0.0f, 0.0f, 1.0f, 0.0f);

/// unit vector along w: (0, 0, 0, 1)
static const f32x4 _id_w = set_f32x4(0.0f, 0.0f, 0.0f, 1.0f);

/// -1 in all four lanes
static const f32x4 _minus1 = set_f32x4(-1.0f, -1.0f, -1.0f, -1.0f);

/// +1 in all four lanes
static const f32x4 _plus1 = set_f32x4(1.0f, 1.0f, 1.0f, 1.0f);

/// 0 in all four lanes
static const f32x4 _zero = set_f32x4(0.0f, 0.0f, 0.0f, 0.0f);

/// 0x80000000 in every integer lane (the sign bit of an IEEE-754 single-precision float)
static const i32x4 _sign = set_i32x4(0x80000000, 0x80000000, 0x80000000, 0x80000000);

/// bit mask with all bits set in the x, y and z lanes and no bits set in the w lane
static const f32x4 _mask_xyz = cast_i32x4_to_f32x4(set_i32x4( 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0 ));


/// A 3D vector backed by a 4-lane SIMD register (f32x4). Only x, y and z are
/// treated as components; the fourth lane (__w) exists for storage only.
struct NEBULA_ALIGN16 vec3

{

public:

    /// default constructor, NOTE: does NOT setup components!
    vec3() = default;


    /// construct from three component values
    vec3(scalar x, scalar y, scalar z);


    /// construct from a float3
    vec3(float3 f3);


    /// construct with x, y and z all set to v
    explicit vec3(scalar v);

    /// copy constructor
    vec3(const vec3& rhs) = default;


    /// construct from a SIMD register (implicit, so f32x4 results convert to vec3)
    vec3(const f32x4& rhs);


    /// assign from a SIMD register
    void operator=(const f32x4& rhs);

    /// inplace add
    void operator+=(const vec3& rhs);

    /// inplace sub
    void operator-=(const vec3& rhs);

    /// inplace scalar multiply
    void operator*=(scalar s);

    /// multiply by a vector component-wise
    void operator*=(const vec3& rhs);

    /// divide by a vector component-wise
    void operator/=(const vec3& rhs);

    /// equality operator (compares x, y and z)
    bool operator==(const vec3& rhs) const;

    /// inequality operator (compares x, y and z)
    bool operator!=(const vec3& rhs) const;


    /// load content from 16-byte-aligned memory
    void load(const scalar* ptr);

    /// load content from unaligned memory
    void loadu(const scalar* ptr);

    /// write the three components to memory (store_f32x3)
    void store(scalar* ptr) const;

    /// write the three components to memory; the definition uses the same store_f32x3 call as store()
    void storeu(scalar* ptr) const;

    /// stream content to memory; the definition in this file forwards to store()
    void stream(scalar* ptr) const;


    /// set content
    void set(scalar x, scalar y, scalar z);


    /// read/write access to indexed component (index 0..2)
    scalar& operator[](const int index);

    /// read-only access to indexed component (index 0..2)
    scalar operator[](const int index) const;


    /// three views onto the same 16 bytes: named components, the raw register, and an indexable array
    union

    {

        struct

        {

            // we can access __w to check it, but we don't actually use it

            float x, y, z, __w;

        };

        /// raw SIMD register holding x, y, z and the unused fourth lane
        f32x4 vec;

        /// array view of x, y, z (used by operator[])
        float v[3];

    };

};


//------------------------------------------------------------------------------

/**
    Build a vector from its three components; the fourth SIMD lane is
    filled with 0.
*/
__forceinline
vec3::vec3(scalar x, scalar y, scalar z)
{
    const f32x4 packed = set_f32x4(x, y, z, 0);
    this->vec = packed;
}


//------------------------------------------------------------------------------

/**
    Build a vector from a float3; the fourth SIMD lane is filled with 0.

    Uses the set_f32x4 wrapper (same x, y, z, w argument order as the other
    constructors) instead of a raw SSE intrinsic, so this constructor goes
    through the same SIMD abstraction as the rest of the class.
*/
__forceinline
vec3::vec3(float3 f3)
{
    this->vec = set_f32x4(f3.x, f3.y, f3.z, 0);
}


//------------------------------------------------------------------------------

/**
    Build a vector whose x, y and z all equal v; the fourth SIMD lane is
    filled with 0.
*/
__forceinline
vec3::vec3(scalar v)
{
    const f32x4 broadcast = set_f32x4(v, v, v, 0.0f);
    this->vec = broadcast;
}


//------------------------------------------------------------------------------

/**
    Build a vector from a raw SIMD register. The register is passed through
    set_last_f32x4(rhs, 0) before being stored (judging by its name, that
    overwrites the last lane with 0).
*/
__forceinline
vec3::vec3(const f32x4& rhs)
{
    const f32x4 sanitized = set_last_f32x4(rhs, 0);
    this->vec = sanitized;
}


//------------------------------------------------------------------------------

/**
    Assign from a raw SIMD register; the value goes through
    set_last_f32x4(rhs, 0) exactly like the converting constructor.
*/
__forceinline void
vec3::operator=(const f32x4& rhs)
{
    const f32x4 sanitized = set_last_f32x4(rhs, 0);
    this->vec = sanitized;
}


//------------------------------------------------------------------------------

/**
    True when x, y and z all compare equal. The fourth lane is masked out of
    the comparison result (only the low three movemask bits are inspected).
*/
__forceinline bool
vec3::operator==(const vec3& rhs) const
{
    const int equalLanes = _mm_movemask_ps(_mm_cmpeq_ps(this->vec, rhs.vec)) & 7;
    return equalLanes == 7;
}


//------------------------------------------------------------------------------

/**
    True when at least one of x, y, z does not compare equal. The fourth
    lane is ignored.
*/
__forceinline bool
vec3::operator!=(const vec3 &rhs) const
{
    const int equalLanes = _mm_movemask_ps(_mm_cmpeq_ps(this->vec, rhs.vec)) & 7;
    return equalLanes != 7;
}


//------------------------------------------------------------------------------

/**
    Read the vector from ptr via load_aligned_f32x3.
*/
__forceinline void
vec3::load(const scalar* ptr)
{
    const f32x4 loaded = load_aligned_f32x3(ptr);
    this->vec = loaded;
}


//------------------------------------------------------------------------------

/**
    Read the vector from ptr via load_unaligned_f32x3.
*/
__forceinline void
vec3::loadu(const scalar* ptr)
{
    const f32x4 loaded = load_unaligned_f32x3(ptr);
    this->vec = loaded;
}


//------------------------------------------------------------------------------

/**
    Write the vector to ptr via store_f32x3.
*/
__forceinline void
vec3::store(scalar* ptr) const
{
    const f32x4& source = this->vec;
    store_f32x3(source, ptr);
}


//------------------------------------------------------------------------------

/**
    Write the vector to ptr. Uses the same store_f32x3 call as store().
*/
__forceinline void
vec3::storeu(scalar* ptr) const
{
    const f32x4& source = this->vec;
    store_f32x3(source, ptr);
}


//------------------------------------------------------------------------------

/**
    Write the vector to ptr. Currently a plain forward to store(); no
    dedicated streaming path is used here.
*/
__forceinline void
vec3::stream(scalar* ptr) const
{
    store(ptr);
}


//------------------------------------------------------------------------------

/**
    Unary minus: returns lhs with its register passed through
    flip_sign_f32x4.
*/
__forceinline vec3
operator-(const vec3& lhs)
{
    const f32x4 negated = flip_sign_f32x4(lhs.vec);
    return vec3(negated);
}


//------------------------------------------------------------------------------

/**
    Multiply every component of lhs by the scalar t.

    The scalar is broadcast with splat_f32x4, the same wrapper the in-place
    operator*=(scalar) uses, rather than a raw SSE intrinsic.
*/
__forceinline vec3
operator*(const vec3& lhs, scalar t)
{
    return mul_f32x4(lhs.vec, splat_f32x4(t));
}


//------------------------------------------------------------------------------

/**
    Component-wise product of lhs and rhs.
*/
__forceinline vec3
operator*(const vec3& lhs, const vec3& rhs)
{
    const f32x4 product = mul_f32x4(lhs.vec, rhs.vec);
    return vec3(product);
}


//------------------------------------------------------------------------------

/**
    Divide every component of lhs by the scalar t.

    Uses the splat_f32x4 / div_f32x4 wrappers (as operator*=(scalar) and
    operator/=(vec3) do) instead of raw SSE types and intrinsics.
*/
__forceinline vec3
operator/(const vec3& lhs, scalar t)
{
    return div_f32x4(lhs.vec, splat_f32x4(t));
}


//------------------------------------------------------------------------------

/**
    In-place component-wise multiply by rhs.
*/
__forceinline void
vec3::operator*=(const vec3& rhs)
{
    const f32x4 product = mul_f32x4(this->vec, rhs.vec);
    this->vec = product;
}


//------------------------------------------------------------------------------

/**
    In-place component-wise divide by rhs.
*/
__forceinline void
vec3::operator/=(const vec3& rhs)
{
    const f32x4 quotient = div_f32x4(this->vec, rhs.vec);
    this->vec = quotient;
}


//------------------------------------------------------------------------------

/**
    In-place component-wise add of rhs.
*/
__forceinline void
vec3::operator+=(const vec3& rhs)
{
    const f32x4 sum = add_f32x4(this->vec, rhs.vec);
    this->vec = sum;
}


//------------------------------------------------------------------------------

/**
    In-place component-wise subtract of rhs.
*/
__forceinline void
vec3::operator-=(const vec3& rhs)
{
    const f32x4 difference = sub_f32x4(this->vec, rhs.vec);
    this->vec = difference;
}


//------------------------------------------------------------------------------

/**
    In-place multiply of every component by the scalar s.
*/
__forceinline void
vec3::operator*=(scalar s)
{
    this->vec = mul_f32x4(this->vec, splat_f32x4(s));
}


//------------------------------------------------------------------------------

/**
    Component-wise sum of lhs and rhs.
*/
__forceinline vec3
operator+(const vec3& lhs, const vec3& rhs)
{
    const f32x4 sum = add_f32x4(lhs.vec, rhs.vec);
    return vec3(sum);
}


//------------------------------------------------------------------------------

/**
    Component-wise difference lhs - rhs.
*/
__forceinline vec3
operator-(const vec3& lhs, const vec3& rhs)
{
    const f32x4 difference = sub_f32x4(lhs.vec, rhs.vec);
    return vec3(difference);
}


//------------------------------------------------------------------------------

/**
    Overwrite the three components; the fourth SIMD lane is set to 0.
*/
__forceinline void
vec3::set(scalar x, scalar y, scalar z)
{
    const f32x4 packed = set_f32x4(x, y, z, 0);
    this->vec = packed;
}


//------------------------------------------------------------------------------

/**
    Read/write access to component `index` (0 = x, 1 = y, 2 = z).

    The index is a signed int, so the assertion checks both bounds; a
    negative index would otherwise pass the `< 3` test and read before the
    start of the array.
*/
__forceinline scalar&
vec3::operator[]( const int index )
{
    n_assert(index >= 0 && index < 3);
    return this->v[index];
}


//------------------------------------------------------------------------------

/**
    Read-only access to component `index` (0 = x, 1 = y, 2 = z); returns a
    copy of the value.

    The index is a signed int, so the assertion checks both bounds; a
    negative index would otherwise pass the `< 3` test and read before the
    start of the array.
*/
__forceinline scalar
vec3::operator[](const int index) const
{
    n_assert(index >= 0 && index < 3);
    return this->v[index];
}


//------------------------------------------------------------------------------

/**
    Length of v: square root of dot_f32x3(v, v).
*/
__forceinline scalar
length(const vec3& v)
{
    const scalar lengthSquared = dot_f32x3(v.vec, v.vec);
    return sqrt(lengthSquared);
}


//------------------------------------------------------------------------------

/**
    Squared length of v: dot_f32x3(v, v), without the square root.
*/
__forceinline scalar
lengthsq(const vec3& v)
{
    const f32x4& reg = v.vec;
    return dot_f32x3(reg, reg);
}


//------------------------------------------------------------------------------

/**
    Component-wise reciprocal, computed as a full division of _plus1 by v.
*/
__forceinline vec3
reciprocal(const vec3& v)
{
    const f32x4 inverse = div_f32x4(_plus1, v.vec);
    return vec3(inverse);
}


//------------------------------------------------------------------------------

/**
    Component-wise reciprocal computed with rcp_f32x4.
*/
__forceinline vec3
reciprocalapprox(const vec3& v)
{
    const f32x4 inverse = rcp_f32x4(v.vec);
    return vec3(inverse);
}


//------------------------------------------------------------------------------

/**
    Component-wise product v0 * v1.
*/
__forceinline vec3
multiply(const vec3& v0, const vec3& v1)
{
    const f32x4 product = mul_f32x4(v0.vec, v1.vec);
    return vec3(product);
}


//------------------------------------------------------------------------------

/**
    Combines v0, v1 and v2 with fma_f32x4(v0, v1, v2).
*/
__forceinline vec3
multiplyadd(const vec3& v0, const vec3& v1, const vec3& v2)
{
    const f32x4 fused = fma_f32x4(v0.vec, v1.vec, v2.vec);
    return vec3(fused);
}


//------------------------------------------------------------------------------

/**
    Component-wise quotient v0 / v1.
*/
__forceinline vec3
divide(const vec3& v0, const vec3& v1)
{
    const f32x4 quotient = div_f32x4(v0.vec, v1.vec);
    return vec3(quotient);
}


//------------------------------------------------------------------------------

/**
    Component-wise absolute value via abs_f32x4.
*/
__forceinline vec3
abs(const vec3& v)
{
    const f32x4 magnitude = abs_f32x4(v.vec);
    return vec3(magnitude);
}


//------------------------------------------------------------------------------

/**
    Cross product of v0 and v1, computed as the difference of two products
    of lane-shuffled copies of the inputs.
*/
__forceinline vec3
cross(const vec3& v0, const vec3& v1)
{
    // first product: v0 and v1 shuffled with complementary lane patterns
    const f32x4 lhsA = shuffle_f32x4(v0.vec, v0.vec, 3, 0, 2, 1);
    const f32x4 rhsA = shuffle_f32x4(v1.vec, v1.vec, 3, 1, 0, 2);

    // second product: the same two patterns, swapped between the inputs
    const f32x4 lhsB = shuffle_f32x4(v0.vec, v0.vec, 3, 1, 0, 2);
    const f32x4 rhsB = shuffle_f32x4(v1.vec, v1.vec, 3, 0, 2, 1);

    const f32x4 productA = mul_f32x4(lhsA, rhsA);
    const f32x4 productB = mul_f32x4(lhsB, rhsB);
    return vec3(sub_f32x4(productA, productB));
}


//------------------------------------------------------------------------------

/**
    Dot product of v0 and v1 via dot_f32x3.
*/
__forceinline scalar
dot(const vec3& v0, const vec3& v1)
{
    const f32x4& a = v0.vec;
    const f32x4& b = v1.vec;
    return dot_f32x3(a, b);
}


//------------------------------------------------------------------------------

/**
    Barycentric combination: ((v1 - v0) * f + v0) + (v2 - v0) * g.
*/
__forceinline vec3
barycentric(const vec3& v0, const vec3 &v1, const vec3 &v2, scalar f, scalar g)
{
    // edge towards v1, weighted by f
    const f32x4 weightedEdge1 = mul_f32x4(sub_f32x4(v1.vec, v0.vec), splat_f32x4(f));

    // edge towards v2, weighted by g
    const f32x4 weightedEdge2 = mul_f32x4(sub_f32x4(v2.vec, v0.vec), splat_f32x4(g));

    // add the base point first, then the second edge (same order as before)
    const f32x4 partial = add_f32x4(weightedEdge1, v0.vec);
    return vec3(add_f32x4(partial, weightedEdge2));
}


//------------------------------------------------------------------------------

/**
    Catmull-Rom interpolation over the control points v0..v3 at parameter s.
    Each control point is scaled by a cubic polynomial in s and the four
    terms are summed pairwise: (w0*v0 + w1*v1) + (w2*v2 + w3*v3).
*/
__forceinline vec3
catmullrom(const vec3& v0, const vec3& v1, const vec3& v2, const vec3& v3, scalar s)
{
    const scalar s2 = s * s;
    const scalar s3 = s * s2;

    // per-control-point weights, broadcast to all lanes
    const f32x4 w0 = splat_f32x4((-s3 + 2.0f * s2 - s) * 0.5f);
    const f32x4 w1 = splat_f32x4((3.0f * s3 - 5.0f * s2 + 2.0f) * 0.5f);
    const f32x4 w2 = splat_f32x4((-3.0f * s3 + 4.0f * s2 + s) * 0.5f);
    const f32x4 w3 = splat_f32x4((s3 - s2) * 0.5f);

    const f32x4 firstPair = add_f32x4(mul_f32x4(w0, v0.vec), mul_f32x4(w1, v1.vec));
    const f32x4 secondPair = add_f32x4(mul_f32x4(w2, v2.vec), mul_f32x4(w3, v3.vec));
    return vec3(add_f32x4(firstPair, secondPair));
}


//------------------------------------------------------------------------------

/**
    Cubic Hermite interpolation between point v1 (tangent t1) and point v2
    (tangent t2) at parameter s. The four weighted terms are accumulated in
    the order v1, t1, v2, t2.
*/
__forceinline vec3
hermite(const vec3& v1, const vec3& t1, const vec3& v2, const vec3& t2, scalar s)
{
    const scalar s2 = s * s;
    const scalar s3 = s * s2;

    // basis weights for the two points and the two tangents
    const f32x4 pointWeight1 = splat_f32x4(2.0f * s3 - 3.0f * s2 + 1.0f);
    const f32x4 tangentWeight1 = splat_f32x4(s3 - 2.0f * s2 + s);
    const f32x4 pointWeight2 = splat_f32x4(-2.0f * s3 + 3.0f * s2);
    const f32x4 tangentWeight2 = splat_f32x4(s3 - s2);

    f32x4 accum = mul_f32x4(pointWeight1, v1.vec);
    accum = add_f32x4(accum, mul_f32x4(tangentWeight1, t1.vec));
    accum = add_f32x4(accum, mul_f32x4(pointWeight2, v2.vec));
    accum = add_f32x4(accum, mul_f32x4(tangentWeight2, t2.vec));
    return vec3(accum);
}


//------------------------------------------------------------------------------

/**
    Angle between v0 and v1: acos of the dot product scaled by the reciprocal
    square roots of both squared lengths, clamped to [-1, 1] before acos.

    The dot product sums only the x, y and z lanes, matching the two
    squared-length sums. The fourth lane (__w) is not a vec3 component and is
    left uninitialised by the default constructor, so it must not contribute.
*/
__forceinline scalar
angle(const vec3& v0, const vec3& v1)
{
    // squared length of v0: sum of the x, y, z lanes of v0 * v0
    f32x4 l0 = mul_f32x4(v0.vec, v0.vec);
    l0 = add_f32x4(shuffle_f32x4(l0, l0, 0, 0, 0, 0),
           add_f32x4(shuffle_f32x4(l0, l0, 1, 1, 1, 1), shuffle_f32x4(l0, l0, 2, 2, 2, 2)));

    // squared length of v1, same scheme
    f32x4 l1 = mul_f32x4(v1.vec, v1.vec);
    l1 = add_f32x4(shuffle_f32x4(l1, l1, 0, 0, 0, 0),
           add_f32x4(shuffle_f32x4(l1, l1, 1, 1, 1, 1), shuffle_f32x4(l1, l1, 2, 2, 2, 2)));

    // pack both squared lengths into one register, take the reciprocal
    // square root of each, and multiply the two results together
    f32x4 l = shuffle_f32x4(l0, l1, 0, 0, 0, 0);
    l = rsqrt_f32x4(l);
    l = mul_first_f32x4(shuffle_f32x4(l, l, 0, 0, 0, 0), shuffle_f32x4(l, l, 1, 1, 1, 1));

    // dot product over x, y and z only
    f32x4 dot = mul_f32x4(v0.vec, v1.vec);
    dot = add_f32x4(shuffle_f32x4(dot, dot, 0, 0, 0, 0),
            add_f32x4(shuffle_f32x4(dot, dot, 1, 1, 1, 1), shuffle_f32x4(dot, dot, 2, 2, 2, 2)));

    // scale the dot product by 1 / (|v0| * |v1|)
    dot = mul_first_f32x4(dot, l);

    // clamp against _minus1 / _plus1 so the acos argument stays in range
    dot = max_first_f32x4(dot, _minus1);
    dot = min_first_f32x4(dot, _plus1);

    scalar cangle;
    store_f32(dot, &cangle);
    return acos(cangle);
}


//------------------------------------------------------------------------------

/**
    Interpolate between v0 and v1 by s, evaluated as
    fma_f32x4(v1 - v0, splat(s), v0).
*/
__forceinline vec3
lerp(const vec3& v0, const vec3& v1, scalar s)
{
    const f32x4 delta = sub_f32x4(v1.vec, v0.vec);
    const f32x4 weight = splat_f32x4(s);
    return vec3(fma_f32x4(delta, weight, v0.vec));
}


//------------------------------------------------------------------------------

/**
    Component-wise maximum of v0 and v1 via max_f32x4.
*/
__forceinline vec3
maximize(const vec3& v0, const vec3& v1)
{
    const f32x4 larger = max_f32x4(v0.vec, v1.vec);
    return vec3(larger);
}


//------------------------------------------------------------------------------

/**
    Component-wise minimum of v0 and v1 via min_f32x4.
*/
__forceinline vec3
minimize(const vec3& v0, const vec3& v1)
{
    const f32x4 smaller = min_f32x4(v0.vec, v1.vec);
    return vec3(smaller);
}


//------------------------------------------------------------------------------

/**
    Clamp each component of `clamp` between the matching components of `min`
    and `max`: the lower bound is applied first, then the upper bound.
*/
__forceinline vec3
clamp(const vec3& clamp, const vec3& min, const vec3& max)
{
    const f32x4 raisedToMin = max_f32x4(min.vec, clamp.vec);
    const f32x4 loweredToMax = min_f32x4(raisedToMin, max.vec);
    return vec3(loweredToMax);
}


//------------------------------------------------------------------------------

/**
    Return v divided by its length. A vector equal to (0, 0, 0) is returned
    unchanged so the division by zero is never performed.
*/
__forceinline vec3
normalize(const vec3& v)
{
    const bool isZero = (v == vec3(0));
    if (isZero)
    {
        return v;
    }

    const f32x4 lengthSplat = splat_f32x4(sqrt(dot_f32x3(v.vec, v.vec)));
    const f32x4 unit = div_f32x4(v.vec, lengthSplat);
    return vec3(unit);
}


//------------------------------------------------------------------------------

/**
    Return v multiplied by 1 / length(v). A vector equal to (0, 0, 0) is
    returned unchanged. The inverse length is computed with a scalar divide
    and square root, then broadcast; its last lane is reset via
    set_last_f32x4(…, 0) before the multiply.
*/
__forceinline vec3
normalizeapprox(const vec3& v)
{
    const bool isZero = (v == vec3(0));
    if (isZero)
    {
        return v;
    }

    const f32x4 inverseLength = splat_f32x4(1.0f / sqrt(dot_f32x3(v.vec, v.vec)));
    const f32x4 scale = set_last_f32x4(inverseLength, 0);
    return vec3(mul_f32x4(v.vec, scale));
}


//------------------------------------------------------------------------------

/**
    Reflect `incident` about `normal`:
    incident - 2 * dot(incident, normal) * normal.
*/
__forceinline vec3
reflect(const vec3& normal, const vec3& incident)
{
    // dot(incident, normal) over x, y, z, obtained by summing shuffled lanes
    const f32x4 products = mul_f32x4(incident.vec, normal.vec);
    const f32x4 dotSplat = add_f32x4(shuffle_f32x4(products, products, 0, 0, 0, 0),
        add_f32x4(shuffle_f32x4(products, products, 1, 1, 1, 1), shuffle_f32x4(products, products, 2, 2, 2, 2)));

    // double it and scale the normal by the result
    const f32x4 twiceDot = add_f32x4(dotSplat, dotSplat);
    const f32x4 offset = mul_f32x4(twiceDot, normal.vec);

    return vec3(sub_f32x4(incident.vec, offset));
}


//------------------------------------------------------------------------------

/**
    True when at least one of x, y, z fails the test v0 >= v1. The fourth
    lane is ignored.
*/
__forceinline bool
less_any(const vec3& v0, const vec3& v1)
{
    const int geLanes = _mm_movemask_ps(_mm_cmpge_ps(v0.vec, v1.vec)) & 0x7;
    return geLanes != 0x7;
}


//------------------------------------------------------------------------------

/**
    True when none of x, y, z passes the test v0 >= v1. The fourth lane is
    ignored.
*/
__forceinline bool
less_all(const vec3& v0, const vec3& v1)
{
    const int geLanes = _mm_movemask_ps(_mm_cmpge_ps(v0.vec, v1.vec)) & 0x7;
    return geLanes == 0;
}


//------------------------------------------------------------------------------

/**
    True when at least one of x, y, z fails the test v0 > v1. The fourth
    lane is ignored.
*/
__forceinline bool
lessequal_any(const vec3& v0, const vec3& v1)
{
    const int gtLanes = _mm_movemask_ps(_mm_cmpgt_ps(v0.vec, v1.vec)) & 7;
    return gtLanes != 0x7;
}


//------------------------------------------------------------------------------

/**
    True when none of x, y, z passes the test v0 > v1. The fourth lane is
    ignored.
*/
__forceinline bool
lessequal_all(const vec3& v0, const vec3& v1)
{
    const int gtLanes = _mm_movemask_ps(_mm_cmpgt_ps(v0.vec, v1.vec)) & 0x7;
    return gtLanes == 0;
}


//------------------------------------------------------------------------------

/**
    True when at least one of x, y, z passes the test v0 > v1. The fourth
    lane is ignored.
*/
__forceinline bool
greater_any(const vec3& v0, const vec3& v1)
{
    const int gtLanes = _mm_movemask_ps(_mm_cmpgt_ps(v0.vec, v1.vec)) & 0x7;
    return gtLanes != 0;
}


//------------------------------------------------------------------------------

/**
    True when all of x, y, z pass the test v0 > v1. The fourth lane is
    ignored.
*/
__forceinline bool
greater_all(const vec3& v0, const vec3& v1)
{
    const int gtLanes = _mm_movemask_ps(_mm_cmpgt_ps(v0.vec, v1.vec)) & 0x7;
    return gtLanes == 0x7;
}


//------------------------------------------------------------------------------

/**
    True when at least one of x, y, z passes the test v0 >= v1. The fourth
    lane is ignored.
*/
__forceinline bool
greaterequal_any(const vec3& v0, const vec3& v1)
{
    const int geLanes = _mm_movemask_ps(_mm_cmpge_ps(v0.vec, v1.vec)) & 0x7;
    return geLanes != 0;
}


//------------------------------------------------------------------------------

/**
    True when all of x, y, z pass the test v0 >= v1. The fourth lane is
    ignored.
*/
__forceinline bool
greaterequal_all(const vec3& v0, const vec3& v1)
{
    const int geLanes = _mm_movemask_ps(_mm_cmpge_ps(v0.vec, v1.vec)) & 0x7;
    return geLanes == 0x7;
}


//------------------------------------------------------------------------------

/**
    True when at least one of x, y, z compares equal between v0 and v1. The
    fourth lane is ignored.
*/
__forceinline bool
equal_any(const vec3& v0, const vec3& v1)
{
    const int eqLanes = _mm_movemask_ps(_mm_cmpeq_ps(v0.vec, v1.vec)) & 0x7;
    return eqLanes != 0;
}


//------------------------------------------------------------------------------

/**
    True when every one of x, y, z differs between v0 and v1 by at most
    epsilon. The fourth lane is ignored.

    The result requires all three lanes to pass (mask == 0x7), matching the
    vec3-epsilon overload and operator==. The previous `!= 0` test reported
    "near equal" as soon as a single component was within epsilon.
*/
__forceinline bool
nearequal(const vec3& v0, const vec3& v1, float epsilon)
{
    const __m128 eps = _mm_setr_ps(epsilon, epsilon, epsilon, 0);
    const __m128 delta = _mm_sub_ps(v0.vec, v1.vec);

    // |delta| computed as max(0 - delta, delta)
    const __m128 absDelta = _mm_max_ps(_mm_sub_ps(_mm_setzero_ps(), delta), delta);

    const __m128 within = _mm_cmple_ps(absDelta, eps);
    return (_mm_movemask_ps(within) & 0x7) == 0x7;
}


//------------------------------------------------------------------------------

/**
    True when every one of x, y, z differs between v0 and v1 by at most the
    matching component of epsilon. The fourth lane is ignored.
*/
__forceinline bool
nearequal(const vec3& v0, const vec3& v1, const vec3& epsilon)
{
    __m128 delta = _mm_sub_ps(v0.vec, v1.vec);

    // |delta| computed as max(0 - delta, delta)
    __m128 temp = _mm_setzero_ps();
    temp = _mm_sub_ps(temp, delta);
    temp = _mm_max_ps(temp, delta);

    temp = _mm_cmple_ps(temp, epsilon.vec);
    return (_mm_movemask_ps(temp) & 0x7) == 0x7;
}


//------------------------------------------------------------------------------

/**
    Per-component v0 < v1 test returned as a vector: 1.0 in lanes where the
    test holds and 0.0 elsewhere.

    The compare yields an all-ones bit pattern (a NaN) for true lanes and 0
    for false lanes. _mm_min_ps returns its second operand when an input is
    NaN, so true lanes become the 1.0 from _plus1 and false lanes stay 0.
*/
__forceinline vec3
less(const vec3& v0, const vec3& v1)
{
    const __m128 laneMask = _mm_cmplt_ps(v0.vec, v1.vec);
    return vec3(_mm_min_ps(laneMask, _plus1));
}


//------------------------------------------------------------------------------

/**
    Per-component v0 > v1 test returned as a vector: 1.0 in lanes where the
    test holds and 0.0 elsewhere.

    The compare yields an all-ones bit pattern (a NaN) for true lanes and 0
    for false lanes. _mm_min_ps returns its second operand when an input is
    NaN, so true lanes become the 1.0 from _plus1 and false lanes stay 0.
*/
__forceinline vec3
greater(const vec3& v0, const vec3& v1)
{
    const __m128 laneMask = _mm_cmpgt_ps(v0.vec, v1.vec);
    return vec3(_mm_min_ps(laneMask, _plus1));
}


//------------------------------------------------------------------------------

/**
    Per-component v0 == v1 test returned as a vector: 1.0 in lanes where the
    test holds and 0.0 elsewhere.

    The compare yields an all-ones bit pattern (a NaN) for true lanes and 0
    for false lanes. _mm_min_ps returns its second operand when an input is
    NaN, so true lanes become the 1.0 from _plus1 and false lanes stay 0.
*/
__forceinline vec3
equal(const vec3& v0, const vec3& v1)
{
    const __m128 laneMask = _mm_cmpeq_ps(v0.vec, v1.vec);
    return vec3(_mm_min_ps(laneMask, _plus1));
}


//------------------------------------------------------------------------------

/**
    Broadcast component `element` (0 = x, 1 = y, 2 = z) of v to x, y and z
    of the result; the last lane is reset via set_last_f32x4(…, 0).

    `element` is unsigned, so only the upper bound needs asserting. When
    assertions are compiled out, an out-of-range element falls into the
    default case and yields _zero instead of an uninitialised register.
*/
__forceinline vec3
splat(const vec3& v, uint element)
{
    n_assert(element < 3);

    f32x4 res;
    switch (element)
    {
    case 0:
        res = shuffle_f32x4(v.vec, v.vec, 0, 0, 0, 0);
        break;
    case 1:
        res = shuffle_f32x4(v.vec, v.vec, 1, 1, 1, 1);
        break;
    case 2:
        res = shuffle_f32x4(v.vec, v.vec, 2, 2, 2, 2);
        break;
    default:
        // only reachable with asserts disabled; keep the result well-defined
        res = _zero;
        break;
    }
    return set_last_f32x4(res, 0);
}


//------------------------------------------------------------------------------

/**
    Broadcast the x component of v (shuffle index 0); the last lane is reset
    via set_last_f32x4(…, 0).
*/
__forceinline vec3
splat_x(const vec3& v)
{
    const f32x4 broadcast = shuffle_f32x4(v.vec, v.vec, 0, 0, 0, 0);
    return vec3(set_last_f32x4(broadcast, 0));
}


//------------------------------------------------------------------------------

/**
    Broadcast the y component of v (shuffle index 1); the last lane is reset
    via set_last_f32x4(…, 0).
*/
__forceinline vec3
splat_y(const vec3& v)
{
    const f32x4 broadcast = shuffle_f32x4(v.vec, v.vec, 1, 1, 1, 1);
    return vec3(set_last_f32x4(broadcast, 0));
}


//------------------------------------------------------------------------------

/**
    Broadcast the z component of v (shuffle index 2); the last lane is reset
    via set_last_f32x4(…, 0).
*/
__forceinline vec3
splat_z(const vec3& v)
{
    const f32x4 broadcast = shuffle_f32x4(v.vec, v.vec, 2, 2, 2, 2);
    return vec3(set_last_f32x4(broadcast, 0));
}


//------------------------------------------------------------------------------

/**
    Build a vector by picking one lane per output component from v0 or v1.

    For each index i0..i2 the low two bits choose the source lane. An index
    greater than 3 (signed compare) takes that lane from v1, otherwise from
    v0. The fourth control value is fixed at 7.

    The constant 3 is a plain local rather than a function-local static, so
    no guarded static initialisation is emitted into this inlined function.
*/
__forceinline vec3
permute(const vec3& v0, const vec3& v1, unsigned int i0, unsigned int i1, unsigned int i2)
{
    const i32x4 three = _mm_set1_epi32(3);

    NEBULA_ALIGN16 unsigned int elem[4] = { i0, i1, i2, 7 };
    i32x4 vControl = _mm_load_si128(reinterpret_cast<const __m128i*>(&elem[0]));

    // lanes whose index exceeds 3 come from v1; then reduce indices to 0..3
    i32x4 vSelect = _mm_cmpgt_epi32(vControl, three);
    vControl = _mm_and_si128(vControl, three);

    // permute both sources with the same control
    f32x4 shuffled1 = _mm_permutevar_ps(v0.vec, vControl);
    f32x4 shuffled2 = _mm_permutevar_ps(v1.vec, vControl);

    // keep v0 lanes where the select mask is clear, v1 lanes where it is set
    f32x4 masked1 = _mm_andnot_ps(_mm_castsi128_ps(vSelect), shuffled1);
    f32x4 masked2 = _mm_and_ps(_mm_castsi128_ps(vSelect), shuffled2);

    return _mm_or_ps(masked1, masked2);
}


//------------------------------------------------------------------------------

/**
    Index-based select; currently a direct forward to permute() with the
    same arguments.
*/
__forceinline vec3
select(const vec3& v0, const vec3& v1, const uint i0, const uint i1, const uint i2)
{
    //FIXME this should be converted to something similar as XMVectorSelect
    const vec3 picked = permute(v0, v1, i0, i1, i2);
    return picked;
}


//------------------------------------------------------------------------------

/**
    Bitwise select: result bits come from v1 where the matching bit of
    `control` is set and from v0 where it is clear.
*/
__forceinline vec3
select(const vec3& v0, const vec3& v1, const vec3& control)
{
    const f32x4 fromV0 = _mm_andnot_ps(control.vec, v0.vec);
    const f32x4 fromV1 = _mm_and_ps(v1.vec, control.vec);
    return vec3(_mm_or_ps(fromV0, fromV1));
}


//------------------------------------------------------------------------------

/**
    Component-wise round towards negative infinity (_mm_floor_ps).
*/
__forceinline vec3
floor(const vec3& v)
{
    const f32x4 rounded = _mm_floor_ps(v.vec);
    return vec3(rounded);
}


//------------------------------------------------------------------------------

/**
    Component-wise round towards positive infinity (_mm_ceil_ps).
*/
__forceinline vec3
ceiling(const vec3& v)
{
    const f32x4 rounded = _mm_ceil_ps(v.vec);
    return vec3(rounded);
}


} // namespace Math

//------------------------------------------------------------------------------


n_assert
#define n_assert(exp)
Definition debug.h:50

Math
Different curves.
Definition angularpfeedbackloop.h:17

Math::less
__forceinline point less(const point &v0, const point &v1)
Definition point.h:501

Math::_zero
static const f32x4 _zero
Definition vec3.h:32

Math::_plus1
static const f32x4 _plus1
Definition vec3.h:31

Math::cross
__forceinline vec3 cross(const vec3 &v0, const vec3 &v1)
Definition vec3.h:423

Math::maximize
__forceinline point maximize(const point &v0, const point &v1)
Definition point.h:368

Math::_id_w
static const f32x4 _id_w
Definition vec3.h:29

Math::barycentric
__forceinline quat barycentric(const quat &q0, const quat &q1, const quat &q2, scalar f, scalar g)
Definition quat.h:296

Math::equal_any
__forceinline bool equal_any(const point &v0, const point &v1)
Definition point.h:474

Math::greaterequal_any
__forceinline bool greaterequal_any(const point &v0, const point &v1)
Definition point.h:452

Math::ceiling
__forceinline vec3 ceiling(const vec3 &v)
Definition vec3.h:887

Math::splat_z
__forceinline vec3 splat_z(const vec3 &v)
Definition vec3.h:824

Math::hermite
__forceinline vec3 hermite(const vec3 &v1, const vec3 &t1, const vec3 &v2, const vec3 &t2, scalar s)
Definition vec3.h:490

Math::sqrt
__forceinline scalar sqrt(scalar x)
Definition scalar.h:236

Math::equal
__forceinline point equal(const point &v0, const point &v1)
Definition point.h:519

Math::splat_x
__forceinline vec3 splat_x(const vec3 &v)
Definition vec3.h:804

Math::splat
__forceinline vec3 splat(const vec3 &v, uint element)
Definition vec3.h:780

Math::reflect
mat4 reflect(const vec4 &p)
based on this http://www.opengl.org/discussion_boards/showthread.php/169605-reflection-matrix-how-to-...
Definition mat4.cc:22

Math::multiply
__forceinline vec3 multiply(const vec3 &v0, const vec3 &v1)
Definition vec3.h:387

Math::angle
__forceinline scalar angle(const vec3 &v0, const vec3 &v1)
Definition vec3.h:514

Math::divide
__forceinline vec3 divide(const vec3 &v0, const vec3 &v1)
Definition vec3.h:405

Math::reciprocal
__forceinline vec3 reciprocal(const vec3 &v)
Definition vec3.h:369

Math::length
__forceinline scalar length(const quat &q)
Definition quat.h:260

Math::operator/
half operator/(half one, half two)
Definition half.h:132

Math::lengthsq
__forceinline scalar lengthsq(const quat &q)
Definition quat.h:269

Math::dot
__forceinline scalar dot(const plane &p, const vec4 &v1)
Definition plane.h:252

Math::permute
__forceinline vec3 permute(const vec3 &v0, const vec3 &v1, unsigned int i0, unsigned int i1, unsigned int i2)
Definition vec3.h:834

Math::normalize
__forceinline plane normalize(const plane &p)
Definition plane.h:261

Math::greaterequal_all
__forceinline bool greaterequal_all(const point &v0, const point &v1)
Definition point.h:463

Math::greater_any
__forceinline bool greater_any(const point &v0, const point &v1)
Definition point.h:430

Math::lerp
__forceinline float lerp(float x, float y, float l)
Linearly interpolate between 2 values: ret = x + l * (y - x)
Definition scalar.h:616

Math::_id_y
static const f32x4 _id_y
Definition vec3.h:27

Math::clamp
__forceinline float clamp(float val, float minVal, float maxVal)
Float clamping.
Definition scalar.h:506

Math::_id_z
static const f32x4 _id_z
Definition vec3.h:28

Math::operator-
half operator-(half one, half two)
Definition half.h:114

Math::less_any
__forceinline bool less_any(const point &v0, const point &v1)
Definition point.h:386

Math::catmullrom
__forceinline vec3 catmullrom(const vec3 &v0, const vec3 &v1, const vec3 &v2, const vec3 &v3, scalar s)
Definition vec3.h:466

Math::min
__forceinline TYPE min(TYPE a, TYPE b)
Definition scalar.h:399

Math::less_all
__forceinline bool less_all(const point &v0, const point &v1)
Definition point.h:397

Math::lessequal_all
__forceinline bool lessequal_all(const point &v0, const point &v1)
Definition point.h:419

Math::select
__forceinline vec3 select(const vec3 &v0, const vec3 &v1, const uint i0, const uint i1, const uint i2)
Definition vec3.h:857

Math::splat_y
__forceinline vec3 splat_y(const vec3 &v)
Definition vec3.h:814

Math::minimize
__forceinline point minimize(const point &v0, const point &v1)
Definition point.h:377

Math::scalar
float scalar
Definition scalar.h:45

Math::greater
__forceinline point greater(const point &v0, const point &v1)
Definition point.h:510

Math::operator+
half operator+(half one, half two)
Definition half.h:105

Math::_sign
static const i32x4 _sign
Definition vec3.h:33

Math::operator*
half operator*(half one, half two)
Definition half.h:123

Math::max
__forceinline TYPE max(TYPE a, TYPE b)
Definition scalar.h:368

Math::abs
__forceinline scalar abs(scalar a)
Definition scalar.h:451

Math::_mask_xyz
static const f32x4 _mask_xyz
Definition vec3.h:34

Math::multiplyadd
__forceinline vec3 multiplyadd(const vec3 &v0, const vec3 &v1, const vec3 &v2)
Definition vec3.h:396

Math::_minus1
static const f32x4 _minus1
Definition vec3.h:30

Math::acos
__forceinline scalar acos(scalar x)
Definition scalar.h:218

Math::greater_all
__forceinline bool greater_all(const point &v0, const point &v1)
Definition point.h:441

Math::nearequal
__forceinline bool nearequal(const point &v0, const point &v1, float epsilon)
Definition point.h:485

Math::lessequal_any
__forceinline bool lessequal_any(const point &v0, const point &v1)
Definition point.h:408

Math::_id_x
static const f32x4 _id_x
Definition vec3.h:26

Math::floor
__forceinline float floor(float val)
Floating point flooring.
Definition scalar.h:552

Math::normalizeapprox
__forceinline vec3 normalizeapprox(const vec3 &v)
Definition vec3.h:598

Math::reciprocalapprox
__forceinline vec3 reciprocalapprox(const vec3 &v)
Definition vec3.h:378

scalar.h
Nebula's scalar datatype.

simd.h
Maps generic SIMD-like types and intrinsics to either SSE4+AVX or NEON.

Game::Position::vec3
vec3()=default
default constructor, NOTE: does NOT setup components!

Math::float3
Definition scalar.h:67

Math::float3::x
scalar x
Definition scalar.h:70

Math::float3::y
scalar y
Definition scalar.h:70

Math::float3::z
scalar z
Definition scalar.h:70

Math::mat4
A 4x4 single-precision floating-point matrix.
Definition mat4.h:49

Math::vec3
A 3D vector.
Definition vec3.h:37

Math::vec3::loadu
void loadu(const scalar *ptr)
load content from unaligned memory
Definition vec3.h:178

Math::vec3::stream
void stream(scalar *ptr) const
stream content to 16-byte-aligned memory circumventing the write-cache
Definition vec3.h:207

Math::vec3::v
float v[3]
Definition vec3.h:96

Math::vec3::operator==
bool operator==(const vec3 &rhs) const
equality operator
Definition vec3.h:149

Math::vec3::storeu
void storeu(scalar *ptr) const
write content to unaligned memory through the write cache
Definition vec3.h:198

Math::vec3::vec3
vec3()=default
default constructor, NOTE: does NOT setup components!

Math::vec3::load
void load(const scalar *ptr)
load content from 16-byte-aligned memory
Definition vec3.h:168

Math::vec3::operator*=
void operator*=(scalar s)
inplace scalar multiply
Definition vec3.h:293

Math::vec3::operator-=
void operator-=(const vec3 &rhs)
inplace sub
Definition vec3.h:284

Math::vec3::store
void store(scalar *ptr) const
write content to 16-byte-aligned memory through the write cache
Definition vec3.h:188

Math::vec3::x
float x
Definition vec3.h:93

Math::vec3::z
float z
Definition vec3.h:93

Math::vec3::operator/=
void operator/=(const vec3 &rhs)
divide by a vector component-wise
Definition vec3.h:266

Math::vec3::__w
float __w
Definition vec3.h:93

Math::vec3::vec
f32x4 vec
Definition vec3.h:95

Math::vec3::operator+=
void operator+=(const vec3 &rhs)
inplace add
Definition vec3.h:275

Math::vec3::operator[]
scalar & operator[](const int index)
read/write access to indexed component
Definition vec3.h:330

Math::vec3::operator!=
bool operator!=(const vec3 &rhs) const
inequality operator
Definition vec3.h:158

Math::vec3::operator=
void operator=(const f32x4 &rhs)
assign an vmVector4
Definition vec3.h:140

Math::vec3::set
void set(scalar x, scalar y, scalar z)
set content
Definition vec3.h:321

Math::vec3::vec3
vec3(const vec3 &rhs)=default
copy constructor

Math::vec3::y
float y
Definition vec3.h:93

operator==
bool operator==(const TiXmlString &a, const TiXmlString &b)
Definition tinystr.h:272

operator!=
bool operator!=(const TiXmlString &a, const TiXmlString &b)
Definition tinystr.h:282

types.h

NEBULA_ALIGN16
#define NEBULA_ALIGN16
Definition types.h:143

uint
unsigned int uint
Definition types.h:33