improve mat4 mul

This commit is contained in:
Recep Aslantas
2016-09-20 03:13:48 +03:00
parent b42a599310
commit 8a6fe6948a
3 changed files with 77 additions and 72 deletions

View File

@@ -12,23 +12,14 @@
#include <emmintrin.h>
/* float */
#define _mm_madd_ps(L, R0, R1) \
_mm_add_ps(_mm_mul_ps(_mm_set1_ps(*(L)), R0), \
_mm_mul_ps(_mm_set1_ps(*(L + 1)), R1))
#define _mm_msub_ps(M00, M01, M10, M11) \
_mm_sub_ps(_mm_mul_ps(M00, M01), \
_mm_mul_ps(M10, M11))
#define _mm_shuffle1_ps(a, z, y, x, w) \
_mm_shuffle_ps(a, a, _MM_SHUFFLE(z, y, x, w))
#define _mm_shuffle1_ps1(a, x) \
_mm_shuffle_ps(a, a, _MM_SHUFFLE(x, x, x, x))
#define _mm_shuffle2_ps(a, b, z0, y0, x0, w0, z1, y1, x1, w1) \
_mm_shuffle1_ps(_mm_shuffle_ps(a, b, _MM_SHUFFLE(z0, y0, x0, w0)), \
z1, y1, x1, w1);
#define _mm_madd4_ps(L, R0, R1, R2, R3) \
_mm_add_ps(_mm_madd_ps(L, R0, R1), \
_mm_madd_ps(L + 2, R2, R3))
#endif /* cglm_intrin_h */