fix rigid-body inverse SSE2

This commit is contained in:
Recep Aslantas
2016-11-01 00:02:03 +02:00
parent ec6c9ae497
commit 61eb854c56

View File

@@ -52,22 +52,22 @@ glm_mul_sse2(mat4 m1, mat4 m2, mat4 dest) {
CGLM_INLINE
void
glm_inv_tr_sse2(mat4 mat) {
__m128 r0, r1, r2, r3, x0;
__m128 r0, r1, r2, r3, x0, x1;
r0 = _mm_load_ps(mat[0]);
r1 = _mm_load_ps(mat[1]);
r2 = _mm_load_ps(mat[2]);
r3 = _mm_load_ps(mat[3]);
x1 = _mm_set_ps(1.0f, 0.0f, 0.0f, 0.0f);
_MM_TRANSPOSE4_PS(r0, r1, r2, x1);
x0 = _mm_add_ps(_mm_mul_ps(r0, _mm_shuffle1_ps(r3, 0, 0, 0, 0)),
_mm_mul_ps(r1, _mm_shuffle1_ps(r3, 1, 1, 1, 1)));
x0 = _mm_add_ps(x0, _mm_mul_ps(r2, _mm_shuffle1_ps(r3, 2, 2, 2, 2)));
x0 = _mm_xor_ps(x0, _mm_set1_ps(-0.f));
r3 = _mm_set_ps(1.0f, 0.0f, 0.0f, 0.0f);
x0 = _mm_add_ps(x0, r3);
_MM_TRANSPOSE4_PS(r0, r1, r2, r3);
x0 = _mm_add_ps(x0, x1);
_mm_store_ps(mat[0], r0);
_mm_store_ps(mat[1], r1);