mirror of
https://github.com/CTCaer/RetroArch.git
synced 2024-12-27 05:05:51 +00:00
580 lines
12 KiB
C++
580 lines
12 KiB
C++
///////////////////////////////////////////////////////////////////////////////////////////////////
|
|
// OpenGL Mathematics Copyright (c) 2005 - 2014 G-Truc Creation (www.g-truc.net)
|
|
///////////////////////////////////////////////////////////////////////////////////////////////////
|
|
// Created : 2009-05-19
|
|
// Updated : 2009-05-19
|
|
// Licence : This source is under MIT License
|
|
// File : glm/gtx/simd_mat4.hpp
|
|
///////////////////////////////////////////////////////////////////////////////////////////////////
|
|
|
|
namespace glm{
|
|
namespace detail{
|
|
|
|
// Number of fvec4SIMD entries stored in the matrix; always 4.
inline length_t fmat4x4SIMD::length() const
{
    return static_cast<length_t>(4);
}
|
|
|
|
//////////////////////////////////////
|
|
// Accesses
|
|
|
|
// Mutable access to Data[i]. The index is validated by assert only, so the
// upper-bound check disappears when asserts are compiled out.
inline fvec4SIMD & fmat4x4SIMD::operator[](length_t i)
{
    assert(i < this->length());

    fvec4SIMD & Entry = this->Data[i];
    return Entry;
}
|
|
|
|
// Read-only access to Data[i]. The index is validated by assert only, so the
// upper-bound check disappears when asserts are compiled out.
inline fvec4SIMD const & fmat4x4SIMD::operator[](length_t i) const
{
    assert(i < this->length());

    fvec4SIMD const & Entry = this->Data[i];
    return Entry;
}
|
|
|
|
//////////////////////////////////////////////////////////////
|
|
// Constructors
|
|
|
|
// Default constructor. Fills the matrix with the identity (1 on the diagonal,
// 0 elsewhere) unless GLM_SIMD_ENABLE_DEFAULT_INIT is defined, in which case
// Data is left untouched by this body.
// NOTE(review): the macro name reads as if defining it should *enable*
// initialisation, yet the guard is #ifndef — confirm the intended polarity
// before changing it, since callers may rely on the current behaviour.
inline fmat4x4SIMD::fmat4x4SIMD()
{
#ifndef GLM_SIMD_ENABLE_DEFAULT_INIT
    float const One = 1.0f;
    float const Zero = 0.0f;

    this->Data[0] = fvec4SIMD(One, Zero, Zero, Zero);
    this->Data[1] = fvec4SIMD(Zero, One, Zero, Zero);
    this->Data[2] = fvec4SIMD(Zero, Zero, One, Zero);
    this->Data[3] = fvec4SIMD(Zero, Zero, Zero, One);
#endif
}
|
|
|
|
// Builds a matrix with s on the diagonal and 0 everywhere else.
inline fmat4x4SIMD::fmat4x4SIMD(float const & s)
{
    float const Zero = 0.0f;

    this->Data[0] = fvec4SIMD(s, Zero, Zero, Zero);
    this->Data[1] = fvec4SIMD(Zero, s, Zero, Zero);
    this->Data[2] = fvec4SIMD(Zero, Zero, s, Zero);
    this->Data[3] = fvec4SIMD(Zero, Zero, Zero, s);
}
|
|
|
|
// Builds a matrix from sixteen scalars. Each group (xN, yN, zN, wN) becomes
// the fvec4SIMD stored in Data[N].
inline fmat4x4SIMD::fmat4x4SIMD(
    float const & x0, float const & y0, float const & z0, float const & w0,
    float const & x1, float const & y1, float const & z1, float const & w1,
    float const & x2, float const & y2, float const & z2, float const & w2,
    float const & x3, float const & y3, float const & z3, float const & w3)
{
    fvec4SIMD const Entry0(x0, y0, z0, w0);
    fvec4SIMD const Entry1(x1, y1, z1, w1);
    fvec4SIMD const Entry2(x2, y2, z2, w2);
    fvec4SIMD const Entry3(x3, y3, z3, w3);

    this->Data[0] = Entry0;
    this->Data[1] = Entry1;
    this->Data[2] = Entry2;
    this->Data[3] = Entry3;
}
|
|
|
|
// Builds a matrix from four vectors: vN is copied into Data[N].
inline fmat4x4SIMD::fmat4x4SIMD(
    fvec4SIMD const & v0,
    fvec4SIMD const & v1,
    fvec4SIMD const & v2,
    fvec4SIMD const & v3)
{
    fvec4SIMD const * const Sources[4] = { &v0, &v1, &v2, &v3 };

    for (int Index = 0; Index < 4; ++Index)
        this->Data[Index] = *Sources[Index];
}
|
|
|
|
// Converts a mat4: each m[N] is turned into an fvec4SIMD and stored in
// Data[N].
inline fmat4x4SIMD::fmat4x4SIMD(mat4 const & m)
{
    for (int Index = 0; Index < 4; ++Index)
        this->Data[Index] = fvec4SIMD(m[Index]);
}
|
|
|
|
// Builds a matrix from four raw SSE registers: in[N] is assigned to Data[N].
// The caller must supply at least four readable __m128 values.
inline fmat4x4SIMD::fmat4x4SIMD(__m128 const in[4])
{
    for (int Index = 0; Index < 4; ++Index)
        this->Data[Index] = in[Index];
}
|
|
|
|
//////////////////////////////////////////////////////////////
|
|
// mat4 operators
|
|
|
|
// Copy assignment: copies the four entries of m into this matrix and returns
// *this.
inline fmat4x4SIMD& fmat4x4SIMD::operator=(fmat4x4SIMD const & m)
{
    for (int Index = 0; Index < 4; ++Index)
        this->Data[Index] = m[Index];

    return *this;
}
|
|
|
|
// Adds m to this matrix entry by entry (_mm_add_ps on each Data[N]) and
// returns *this.
inline fmat4x4SIMD & fmat4x4SIMD::operator+=(fmat4x4SIMD const & m)
{
    for (int Index = 0; Index < 4; ++Index)
    {
        __m128 const Sum = _mm_add_ps(this->Data[Index].Data, m[Index].Data);
        this->Data[Index].Data = Sum;
    }

    return *this;
}
|
|
|
|
// Subtracts m from this matrix entry by entry (_mm_sub_ps on each Data[N])
// and returns *this.
inline fmat4x4SIMD & fmat4x4SIMD::operator-=(fmat4x4SIMD const & m)
{
    for (int Index = 0; Index < 4; ++Index)
    {
        __m128 const Difference = _mm_sub_ps(this->Data[Index].Data, m[Index].Data);
        this->Data[Index].Data = Difference;
    }

    return *this;
}
|
|
|
|
// Matrix product in place: replaces *this with sse_mul_ps(*this, m), using
// the same operand order as the binary operator*(m1, m2), and returns *this.
//
// The product is accumulated into scratch storage and copied back afterwards.
// Passing this->Data as both an input and the output of sse_mul_ps (as was
// done previously) is only correct if that routine never reads an input
// element after it has started writing the output; sse_mul_ps is defined
// elsewhere and gives no such guarantee here, and `a *= a` would alias all
// three arguments. The other matrix products in this file already write to a
// separate destination.
inline fmat4x4SIMD & fmat4x4SIMD::operator*=
(
    fmat4x4SIMD const & m
)
{
    __m128 Product[4];
    sse_mul_ps(&this->Data[0].Data, &m.Data[0].Data, Product);

    this->Data[0].Data = Product[0];
    this->Data[1].Data = Product[1];
    this->Data[2].Data = Product[2];
    this->Data[3].Data = Product[3];
    return *this;
}
|
|
|
|
// Matrix "division" in place: replaces *this with sse_mul_ps(*this, Inv),
// where Inv is produced from m by sse_inverse_ps, and returns *this.
//
// The product is written to scratch storage and copied back afterwards
// instead of letting sse_mul_ps overwrite this->Data while it is still being
// read as the first input; that routine is defined elsewhere and is not known
// to tolerate an output that aliases an input. This mirrors the binary
// operator/(m1, m2), which also uses separate inverse and result buffers.
inline fmat4x4SIMD & fmat4x4SIMD::operator/=
(
    fmat4x4SIMD const & m
)
{
    __m128 Inv[4];
    __m128 Quotient[4];

    sse_inverse_ps(&m.Data[0].Data, Inv);
    sse_mul_ps(&this->Data[0].Data, Inv, Quotient);

    this->Data[0].Data = Quotient[0];
    this->Data[1].Data = Quotient[1];
    this->Data[2].Data = Quotient[2];
    this->Data[3].Data = Quotient[3];
    return *this;
}
|
|
|
|
// Adds the scalar s to every lane of every entry and returns *this.
inline fmat4x4SIMD & fmat4x4SIMD::operator+=(float const & s)
{
    // Broadcast s into all four lanes once, then reuse it for each entry.
    __m128 const Broadcast = _mm_set_ps1(s);

    for (int Index = 0; Index < 4; ++Index)
        this->Data[Index].Data = _mm_add_ps(this->Data[Index].Data, Broadcast);

    return *this;
}
|
|
|
|
// Subtracts the scalar s from every lane of every entry and returns *this.
inline fmat4x4SIMD & fmat4x4SIMD::operator-=(float const & s)
{
    // Broadcast s into all four lanes once, then reuse it for each entry.
    __m128 const Broadcast = _mm_set_ps1(s);

    for (int Index = 0; Index < 4; ++Index)
        this->Data[Index].Data = _mm_sub_ps(this->Data[Index].Data, Broadcast);

    return *this;
}
|
|
|
|
// Multiplies every lane of every entry by the scalar s and returns *this.
inline fmat4x4SIMD & fmat4x4SIMD::operator*=(float const & s)
{
    // Broadcast s into all four lanes once, then reuse it for each entry.
    __m128 const Broadcast = _mm_set_ps1(s);

    for (int Index = 0; Index < 4; ++Index)
        this->Data[Index].Data = _mm_mul_ps(this->Data[Index].Data, Broadcast);

    return *this;
}
|
|
|
|
// Divides every lane of every entry by the scalar s and returns *this.
// Implemented as one division (`one` / s) followed by four multiplications.
// `one` is defined outside this block; presumably a register holding 1.0f in
// every lane — confirm.
inline fmat4x4SIMD & fmat4x4SIMD::operator/=(float const & s)
{
    __m128 const Reciprocal = _mm_div_ps(one, _mm_set_ps1(s));

    for (int Index = 0; Index < 4; ++Index)
        this->Data[Index].Data = _mm_mul_ps(this->Data[Index].Data, Reciprocal);

    return *this;
}
|
|
|
|
// Prefix increment: adds `one` to each entry with _mm_add_ps and returns
// *this. `one` is defined outside this block; presumably 1.0f in every lane
// — confirm.
inline fmat4x4SIMD & fmat4x4SIMD::operator++()
{
    for (int Index = 0; Index < 4; ++Index)
        this->Data[Index].Data = _mm_add_ps(this->Data[Index].Data, one);

    return *this;
}
|
|
|
|
// Prefix decrement: subtracts `one` from each entry with _mm_sub_ps and
// returns *this. `one` is defined outside this block; presumably 1.0f in
// every lane — confirm.
inline fmat4x4SIMD & fmat4x4SIMD::operator--()
{
    for (int Index = 0; Index < 4; ++Index)
        this->Data[Index].Data = _mm_sub_ps(this->Data[Index].Data, one);

    return *this;
}
|
|
|
|
|
|
//////////////////////////////////////////////////////////////
|
|
// Binary operators
|
|
|
|
// Matrix + scalar: returns a new matrix whose entries are m[N] + s.
inline fmat4x4SIMD operator+(const fmat4x4SIMD &m, float const & s)
{
    fvec4SIMD const Sum0 = m[0] + s;
    fvec4SIMD const Sum1 = m[1] + s;
    fvec4SIMD const Sum2 = m[2] + s;
    fvec4SIMD const Sum3 = m[3] + s;

    return detail::fmat4x4SIMD(Sum0, Sum1, Sum2, Sum3);
}
|
|
|
|
// Scalar + matrix: returns a new matrix whose entries are m[N] + s (the
// operands are applied in that order, exactly as in the matrix + scalar form).
inline fmat4x4SIMD operator+(float const & s, const fmat4x4SIMD &m)
{
    fvec4SIMD const Sum0 = m[0] + s;
    fvec4SIMD const Sum1 = m[1] + s;
    fvec4SIMD const Sum2 = m[2] + s;
    fvec4SIMD const Sum3 = m[3] + s;

    return detail::fmat4x4SIMD(Sum0, Sum1, Sum2, Sum3);
}
|
|
|
|
// Matrix + matrix: returns a new matrix whose entries are m1[N] + m2[N].
inline fmat4x4SIMD operator+(const fmat4x4SIMD &m1, const fmat4x4SIMD &m2)
{
    fvec4SIMD const Sum0 = m1[0] + m2[0];
    fvec4SIMD const Sum1 = m1[1] + m2[1];
    fvec4SIMD const Sum2 = m1[2] + m2[2];
    fvec4SIMD const Sum3 = m1[3] + m2[3];

    return detail::fmat4x4SIMD(Sum0, Sum1, Sum2, Sum3);
}
|
|
|
|
|
|
// Matrix - scalar: returns a new matrix whose entries are m[N] - s.
inline fmat4x4SIMD operator-(const fmat4x4SIMD &m, float const & s)
{
    fvec4SIMD const Diff0 = m[0] - s;
    fvec4SIMD const Diff1 = m[1] - s;
    fvec4SIMD const Diff2 = m[2] - s;
    fvec4SIMD const Diff3 = m[3] - s;

    return detail::fmat4x4SIMD(Diff0, Diff1, Diff2, Diff3);
}
|
|
|
|
// Scalar - matrix: returns a new matrix whose entries are s - m[N].
inline fmat4x4SIMD operator-(float const & s, const fmat4x4SIMD &m)
{
    fvec4SIMD const Diff0 = s - m[0];
    fvec4SIMD const Diff1 = s - m[1];
    fvec4SIMD const Diff2 = s - m[2];
    fvec4SIMD const Diff3 = s - m[3];

    return detail::fmat4x4SIMD(Diff0, Diff1, Diff2, Diff3);
}
|
|
|
|
// Matrix - matrix: returns a new matrix whose entries are m1[N] - m2[N].
inline fmat4x4SIMD operator-(const fmat4x4SIMD &m1, const fmat4x4SIMD &m2)
{
    fvec4SIMD const Diff0 = m1[0] - m2[0];
    fvec4SIMD const Diff1 = m1[1] - m2[1];
    fvec4SIMD const Diff2 = m1[2] - m2[2];
    fvec4SIMD const Diff3 = m1[3] - m2[3];

    return detail::fmat4x4SIMD(Diff0, Diff1, Diff2, Diff3);
}
|
|
|
|
|
|
// Matrix * scalar: returns a new matrix whose entries are m[N] * s.
inline fmat4x4SIMD operator*(const fmat4x4SIMD &m, float const & s)
{
    fvec4SIMD const Scaled0 = m[0] * s;
    fvec4SIMD const Scaled1 = m[1] * s;
    fvec4SIMD const Scaled2 = m[2] * s;
    fvec4SIMD const Scaled3 = m[3] * s;

    return detail::fmat4x4SIMD(Scaled0, Scaled1, Scaled2, Scaled3);
}
|
|
|
|
// Scalar * matrix: returns a new matrix whose entries are m[N] * s (the
// operands are applied in that order, exactly as in the matrix * scalar form).
inline fmat4x4SIMD operator*(float const & s, const fmat4x4SIMD &m)
{
    fvec4SIMD const Scaled0 = m[0] * s;
    fvec4SIMD const Scaled1 = m[1] * s;
    fvec4SIMD const Scaled2 = m[2] * s;
    fvec4SIMD const Scaled3 = m[3] * s;

    return detail::fmat4x4SIMD(Scaled0, Scaled1, Scaled2, Scaled3);
}
|
|
|
|
// Matrix * vector: forwards the matrix's raw register storage and the
// vector's register to the (matrix, vector) overload of sse_mul_ps and
// returns its result as an fvec4SIMD.
inline fvec4SIMD operator*(const fmat4x4SIMD &m, fvec4SIMD const & v)
{
    __m128 const * const MatrixRegs = &m.Data[0].Data;
    return sse_mul_ps(MatrixRegs, v.Data);
}
|
|
|
|
// Vector * matrix: forwards the vector's register and the matrix's raw
// register storage to the (vector, matrix) overload of sse_mul_ps and returns
// its result as an fvec4SIMD.
inline fvec4SIMD operator*(fvec4SIMD const & v, const fmat4x4SIMD &m)
{
    __m128 const * const MatrixRegs = &m.Data[0].Data;
    return sse_mul_ps(v.Data, MatrixRegs);
}
|
|
|
|
// Matrix * matrix: has sse_mul_ps write the product of m1 and m2 into a
// freshly default-constructed matrix, which is then returned.
inline fmat4x4SIMD operator*(const fmat4x4SIMD &m1, const fmat4x4SIMD &m2)
{
    fmat4x4SIMD Product;

    __m128 const * const Left = &m1.Data[0].Data;
    __m128 const * const Right = &m2.Data[0].Data;
    __m128 * const Out = &Product.Data[0].Data;
    sse_mul_ps(Left, Right, Out);

    return Product;
}
|
|
|
|
|
|
|
|
// Matrix / scalar: returns a new matrix whose entries are m[N] / s.
inline fmat4x4SIMD operator/(const fmat4x4SIMD &m, float const & s)
{
    fvec4SIMD const Quot0 = m[0] / s;
    fvec4SIMD const Quot1 = m[1] / s;
    fvec4SIMD const Quot2 = m[2] / s;
    fvec4SIMD const Quot3 = m[3] / s;

    return detail::fmat4x4SIMD(Quot0, Quot1, Quot2, Quot3);
}
|
|
|
|
// Scalar / matrix: returns a new matrix whose entries are s / m[N].
inline fmat4x4SIMD operator/(float const & s, const fmat4x4SIMD &m)
{
    fvec4SIMD const Quot0 = s / m[0];
    fvec4SIMD const Quot1 = s / m[1];
    fvec4SIMD const Quot2 = s / m[2];
    fvec4SIMD const Quot3 = s / m[3];

    return detail::fmat4x4SIMD(Quot0, Quot1, Quot2, Quot3);
}
|
|
|
|
// Returns the result of detail::sse_inverse_ps applied to m. The routine
// writes into a separate, default-constructed matrix, so m is not modified.
inline detail::fmat4x4SIMD inverse(detail::fmat4x4SIMD const & m)
{
    detail::fmat4x4SIMD Inverted;

    __m128 const * const Source = &m[0].Data;
    __m128 * const Target = &Inverted[0].Data;
    detail::sse_inverse_ps(Source, Target);

    return Inverted;
}
|
|
|
|
// Matrix / vector: computes inverse(m) * v.
inline fvec4SIMD operator/(const fmat4x4SIMD & m, fvec4SIMD const & v)
{
    fmat4x4SIMD const Inverted = inverse(m);
    return Inverted * v;
}
|
|
|
|
// Vector / matrix: computes v * inverse(m).
inline fvec4SIMD operator/(fvec4SIMD const & v, const fmat4x4SIMD &m)
{
    fmat4x4SIMD const Inverted = inverse(m);
    return v * Inverted;
}
|
|
|
|
// Matrix / matrix: inverts m2 with sse_inverse_ps, multiplies m1 by that
// inverse with sse_mul_ps, and wraps the four resulting registers in a new
// matrix. Separate scratch arrays hold the inverse and the product.
inline fmat4x4SIMD operator/(const fmat4x4SIMD &m1, const fmat4x4SIMD &m2)
{
    __m128 Quotient[4];
    __m128 InverseOfRhs[4];

    __m128 const * const Lhs = &m1.Data[0].Data;
    __m128 const * const Rhs = &m2.Data[0].Data;

    sse_inverse_ps(Rhs, InverseOfRhs);
    sse_mul_ps(Lhs, InverseOfRhs, Quotient);

    return fmat4x4SIMD(Quotient);
}
|
|
|
|
|
|
//////////////////////////////////////////////////////////////
|
|
// Unary constant operators
|
|
// Unary minus: returns a new matrix whose entries are -m[N].
inline fmat4x4SIMD const operator-(fmat4x4SIMD const & m)
{
    fvec4SIMD const Neg0 = -m[0];
    fvec4SIMD const Neg1 = -m[1];
    fvec4SIMD const Neg2 = -m[2];
    fvec4SIMD const Neg3 = -m[3];

    return detail::fmat4x4SIMD(Neg0, Neg1, Neg2, Neg3);
}
|
|
|
|
// Postfix-form decrement. Returns a new matrix whose entries are
// m[N] - 1.0f. The operand is taken by const reference and is NOT modified,
// and the returned value is the decremented one; this differs from the
// built-in postfix --, so callers should not expect the usual semantics.
inline fmat4x4SIMD const operator--(fmat4x4SIMD const & m, int)
{
    fvec4SIMD const Dec0 = m[0] - 1.0f;
    fvec4SIMD const Dec1 = m[1] - 1.0f;
    fvec4SIMD const Dec2 = m[2] - 1.0f;
    fvec4SIMD const Dec3 = m[3] - 1.0f;

    return detail::fmat4x4SIMD(Dec0, Dec1, Dec2, Dec3);
}
|
|
|
|
// Postfix-form increment. Returns a new matrix whose entries are
// m[N] + 1.0f. The operand is taken by const reference and is NOT modified,
// and the returned value is the incremented one; this differs from the
// built-in postfix ++, so callers should not expect the usual semantics.
inline fmat4x4SIMD const operator++(fmat4x4SIMD const & m, int)
{
    fvec4SIMD const Inc0 = m[0] + 1.0f;
    fvec4SIMD const Inc1 = m[1] + 1.0f;
    fvec4SIMD const Inc2 = m[2] + 1.0f;
    fvec4SIMD const Inc3 = m[3] + 1.0f;

    return detail::fmat4x4SIMD(Inc0, Inc1, Inc2, Inc3);
}
|
|
|
|
}//namespace detail
|
|
|
|
// Converts a SIMD matrix to a plain mat4 by storing each register x.Data[N]
// at the address of Result[N][0].
inline mat4 mat4_cast(detail::fmat4x4SIMD const & x)
{
    // _mm_store_ps needs a 16-byte aligned destination, hence the explicit
    // alignment request on the local.
    GLM_ALIGN(16) mat4 Result;

    for (int Index = 0; Index < 4; ++Index)
        _mm_store_ps(&Result[Index][0], x.Data[Index].Data);

    return Result;
}
|
|
|
|
// Entry-wise product: returns a matrix whose N-th entry is x[N] * y[N]
// (fvec4SIMD multiplication), not the linear-algebra matrix product.
inline detail::fmat4x4SIMD matrixCompMult(
    detail::fmat4x4SIMD const & x,
    detail::fmat4x4SIMD const & y)
{
    detail::fmat4x4SIMD Product;

    for (int Index = 0; Index < 4; ++Index)
        Product[Index] = x[Index] * y[Index];

    return Product;
}
|
|
|
|
// Outer product of c and r: entry N of the result is c multiplied lane-wise
// by lane N of r broadcast to all four lanes.
inline detail::fmat4x4SIMD outerProduct(
    detail::fvec4SIMD const & c,
    detail::fvec4SIMD const & r)
{
    // _MM_SHUFFLE needs compile-time constants, so the four broadcasts are
    // spelled out rather than generated in a loop.
    __m128 const Lane0 = _mm_shuffle_ps(r.Data, r.Data, _MM_SHUFFLE(0, 0, 0, 0));
    __m128 const Lane1 = _mm_shuffle_ps(r.Data, r.Data, _MM_SHUFFLE(1, 1, 1, 1));
    __m128 const Lane2 = _mm_shuffle_ps(r.Data, r.Data, _MM_SHUFFLE(2, 2, 2, 2));
    __m128 const Lane3 = _mm_shuffle_ps(r.Data, r.Data, _MM_SHUFFLE(3, 3, 3, 3));

    // Constructed with the _null tag; every entry is overwritten below.
    detail::fmat4x4SIMD Outer(detail::fmat4x4SIMD::_null);
    Outer[0].Data = _mm_mul_ps(c.Data, Lane0);
    Outer[1].Data = _mm_mul_ps(c.Data, Lane1);
    Outer[2].Data = _mm_mul_ps(c.Data, Lane2);
    Outer[3].Data = _mm_mul_ps(c.Data, Lane3);
    return Outer;
}
|
|
|
|
// Returns the result of detail::sse_transpose_ps applied to m. The routine
// writes into a separate, default-constructed matrix, so m is not modified.
inline detail::fmat4x4SIMD transpose(detail::fmat4x4SIMD const & m)
{
    detail::fmat4x4SIMD Transposed;

    __m128 const * const Source = &m[0].Data;
    __m128 * const Target = &Transposed[0].Data;
    detail::sse_transpose_ps(Source, Target);

    return Transposed;
}
|
|
|
|
// Returns the determinant of m as a float: detail::sse_det_ps produces a
// register and _mm_store_ss writes its lowest lane to the scalar result.
inline float determinant(detail::fmat4x4SIMD const & m)
{
    __m128 const DetRegister = detail::sse_det_ps(&m[0].Data);

    float Scalar;
    _mm_store_ss(&Scalar, DetRegister);
    return Scalar;
}
|
|
|
|
}//namespace glm
|