mirror of
https://github.com/recp/cglm.git
synced 2026-02-17 03:39:05 +00:00
Compare commits
4 Commits
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
01b93b0409 | ||
|
|
9aebdc76b3 | ||
|
|
e9b51fc07a | ||
|
|
abfa355b84 |
1
.gitignore
vendored
1
.gitignore
vendored
@@ -69,4 +69,3 @@ win/cglm_test_*
|
|||||||
win/x64
|
win/x64
|
||||||
win/x85
|
win/x85
|
||||||
win/Debug
|
win/Debug
|
||||||
cglm-test-ios*
|
|
||||||
|
|||||||
9
CREDITS
9
CREDITS
@@ -52,12 +52,3 @@ https://gamedev.stackexchange.com/questions/28395/rotating-vector3-by-a-quaterni
|
|||||||
|
|
||||||
9. Sphere AABB intersect
|
9. Sphere AABB intersect
|
||||||
https://github.com/erich666/GraphicsGems/blob/master/gems/BoxSphere.c
|
https://github.com/erich666/GraphicsGems/blob/master/gems/BoxSphere.c
|
||||||
|
|
||||||
10. Horizontal add
|
|
||||||
https://stackoverflow.com/questions/6996764/fastest-way-to-do-horizontal-float-vector-sum-on-x86
|
|
||||||
|
|
||||||
11. de casteljau implementation and comments
|
|
||||||
https://forums.khronos.org/showthread.php/10264-Animations-in-1-4-1-release-notes-revision-A/page2?highlight=bezier
|
|
||||||
https://forums.khronos.org/showthread.php/10644-Animation-Bezier-interpolation
|
|
||||||
https://forums.khronos.org/showthread.php/10387-2D-Tangents-in-Bezier-Splines?p=34164&viewfull=1#post34164
|
|
||||||
https://forums.khronos.org/showthread.php/10651-Animation-TCB-Spline-Interpolation-in-COLLADA?highlight=bezier
|
|
||||||
|
|||||||
@@ -82,11 +82,7 @@ Currently *cglm* uses default clip space configuration (-1, 1) for camera functi
|
|||||||
- inline or pre-compiled function call
|
- inline or pre-compiled function call
|
||||||
- frustum (extract view frustum planes, corners...)
|
- frustum (extract view frustum planes, corners...)
|
||||||
- bounding box (AABB in Frustum (culling), crop, merge...)
|
- bounding box (AABB in Frustum (culling), crop, merge...)
|
||||||
- bounding sphere
|
|
||||||
- project, unproject
|
- project, unproject
|
||||||
- easing functions
|
|
||||||
- curves
|
|
||||||
- curve interpolation helpers (S*M*C, deCasteljau...)
|
|
||||||
- and other...
|
- and other...
|
||||||
|
|
||||||
<hr />
|
<hr />
|
||||||
|
|||||||
@@ -2,7 +2,7 @@ Pod::Spec.new do |s|
|
|||||||
|
|
||||||
# Description
|
# Description
|
||||||
s.name = "cglm"
|
s.name = "cglm"
|
||||||
s.version = "0.5.1"
|
s.version = "0.4.6"
|
||||||
s.summary = "📽 Optimized OpenGL/Graphics Math (glm) for C"
|
s.summary = "📽 Optimized OpenGL/Graphics Math (glm) for C"
|
||||||
s.description = <<-DESC
|
s.description = <<-DESC
|
||||||
cglm is math library for graphics programming for C. It is similar to original glm but it is written for C instead of C++ (you can use here too). See the documentation or README for all features.
|
cglm is math library for graphics programming for C. It is similar to original glm but it is written for C instead of C++ (you can use here too). See the documentation or README for all features.
|
||||||
|
|||||||
@@ -7,7 +7,7 @@
|
|||||||
#*****************************************************************************
|
#*****************************************************************************
|
||||||
|
|
||||||
AC_PREREQ([2.69])
|
AC_PREREQ([2.69])
|
||||||
AC_INIT([cglm], [0.5.3], [info@recp.me])
|
AC_INIT([cglm], [0.5.2], [info@recp.me])
|
||||||
AM_INIT_AUTOMAKE([-Wall -Werror foreign subdir-objects])
|
AM_INIT_AUTOMAKE([-Wall -Werror foreign subdir-objects])
|
||||||
|
|
||||||
AC_CONFIG_MACRO_DIR([m4])
|
AC_CONFIG_MACRO_DIR([m4])
|
||||||
@@ -29,7 +29,6 @@ LT_INIT
|
|||||||
# Checks for libraries.
|
# Checks for libraries.
|
||||||
AC_CHECK_LIB([m], [floor])
|
AC_CHECK_LIB([m], [floor])
|
||||||
|
|
||||||
m4_ifdef([AM_SILENT_RULES], [AM_SILENT_RULES([yes])])
|
|
||||||
AC_SYS_LARGEFILE
|
AC_SYS_LARGEFILE
|
||||||
|
|
||||||
# Checks for header files.
|
# Checks for header files.
|
||||||
|
|||||||
@@ -46,5 +46,3 @@ Follow the :doc:`build` documentation for this
|
|||||||
io
|
io
|
||||||
call
|
call
|
||||||
sphere
|
sphere
|
||||||
curve
|
|
||||||
bezier
|
|
||||||
|
|||||||
@@ -1,89 +0,0 @@
|
|||||||
.. default-domain:: C
|
|
||||||
|
|
||||||
Bezier
|
|
||||||
================================================================================
|
|
||||||
|
|
||||||
Header: cglm/bezier.h
|
|
||||||
|
|
||||||
Common helpers for cubic bezier and similar curves.
|
|
||||||
|
|
||||||
Table of contents (click to go):
|
|
||||||
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
|
||||||
|
|
||||||
Functions:
|
|
||||||
|
|
||||||
1. :c:func:`glm_bezier`
|
|
||||||
2. :c:func:`glm_hermite`
|
|
||||||
3. :c:func:`glm_decasteljau`
|
|
||||||
|
|
||||||
Functions documentation
|
|
||||||
~~~~~~~~~~~~~~~~~~~~~~~
|
|
||||||
|
|
||||||
.. c:function:: float glm_bezier(float s, float p0, float c0, float c1, float p1)
|
|
||||||
|
|
||||||
| cubic bezier interpolation
|
|
||||||
| formula:
|
|
||||||
|
|
||||||
.. code-block:: text
|
|
||||||
|
|
||||||
B(s) = P0*(1-s)^3 + 3*C0*s*(1-s)^2 + 3*C1*s^2*(1-s) + P1*s^3
|
|
||||||
|
|
||||||
| similar result using matrix:
|
|
||||||
|
|
||||||
.. code-block:: text
|
|
||||||
|
|
||||||
B(s) = glm_smc(s, GLM_BEZIER_MAT, (vec4){p0, c0, c1, p1})
|
|
||||||
|
|
||||||
| glm_eq(glm_smc(...), glm_bezier(...)) should return TRUE
|
|
||||||
|
|
||||||
Parameters:
|
|
||||||
| *[in]* **s** parameter between 0 and 1
|
|
||||||
| *[in]* **p0** begin point
|
|
||||||
| *[in]* **c0** control point 1
|
|
||||||
| *[in]* **c1** control point 2
|
|
||||||
| *[in]* **p1** end point
|
|
||||||
|
|
||||||
Returns:
|
|
||||||
B(s)
|
|
||||||
|
|
||||||
.. c:function:: float glm_hermite(float s, float p0, float t0, float t1, float p1)
|
|
||||||
|
|
||||||
| cubic hermite interpolation
|
|
||||||
| formula:
|
|
||||||
|
|
||||||
.. code-block:: text
|
|
||||||
|
|
||||||
H(s) = P0*(2*s^3 - 3*s^2 + 1) + T0*(s^3 - 2*s^2 + s) + P1*(-2*s^3 + 3*s^2) + T1*(s^3 - s^2)
|
|
||||||
|
|
||||||
| similar result using matrix:
|
|
||||||
|
|
||||||
.. code-block:: text
|
|
||||||
|
|
||||||
H(s) = glm_smc(s, GLM_HERMITE_MAT, (vec4){p0, p1, t0, t1})
|
|
||||||
|
|
||||||
| glm_eq(glm_smc(...), glm_hermite(...)) should return TRUE
|
|
||||||
|
|
||||||
|
|
||||||
Parameters:
|
|
||||||
| *[in]* **s** parameter between 0 and 1
|
|
||||||
| *[in]* **p0** begin point
|
|
||||||
| *[in]* **t0** tangent 1
|
|
||||||
| *[in]* **t1** tangent 2
|
|
||||||
| *[in]* **p1** end point
|
|
||||||
|
|
||||||
Returns:
|
|
||||||
H(s)
|
|
||||||
|
|
||||||
.. c:function:: float glm_decasteljau(float prm, float p0, float c0, float c1, float p1)
|
|
||||||
|
|
||||||
| iterative way to solve cubic equation
|
|
||||||
|
|
||||||
Parameters:
|
|
||||||
| *[in]* **prm** parameter between 0 and 1
|
|
||||||
| *[in]* **p0** begin point
|
|
||||||
| *[in]* **c0** control point 1
|
|
||||||
| *[in]* **c1** control point 2
|
|
||||||
| *[in]* **p1** end point
|
|
||||||
|
|
||||||
Returns:
|
|
||||||
parameter to use in cubic equation
|
|
||||||
@@ -62,9 +62,9 @@ author = u'Recep Aslantas'
|
|||||||
# built documents.
|
# built documents.
|
||||||
#
|
#
|
||||||
# The short X.Y version.
|
# The short X.Y version.
|
||||||
version = u'0.5.3'
|
version = u'0.5.2'
|
||||||
# The full version, including alpha/beta/rc tags.
|
# The full version, including alpha/beta/rc tags.
|
||||||
release = u'0.5.3'
|
release = u'0.5.2'
|
||||||
|
|
||||||
# The language for content autogenerated by Sphinx. Refer to documentation
|
# The language for content autogenerated by Sphinx. Refer to documentation
|
||||||
# for a list of supported languages.
|
# for a list of supported languages.
|
||||||
|
|||||||
@@ -1,41 +0,0 @@
|
|||||||
.. default-domain:: C
|
|
||||||
|
|
||||||
Curve
|
|
||||||
================================================================================
|
|
||||||
|
|
||||||
Header: cglm/curve.h
|
|
||||||
|
|
||||||
Common helpers for common curves. For specific curve see its header/doc
|
|
||||||
e.g bezier
|
|
||||||
|
|
||||||
Table of contents (click to go):
|
|
||||||
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
|
||||||
|
|
||||||
Functions:
|
|
||||||
|
|
||||||
1. :c:func:`glm_smc`
|
|
||||||
|
|
||||||
Functions documentation
|
|
||||||
~~~~~~~~~~~~~~~~~~~~~~~
|
|
||||||
|
|
||||||
.. c:function:: float glm_smc(float s, mat4 m, vec4 c)
|
|
||||||
|
|
||||||
| helper function to calculate **S** * **M** * **C** multiplication for curves
|
|
||||||
|
|
||||||
| this function does not encourage you to use SMC, instead it is a helper if you use SMC.
|
|
||||||
|
|
||||||
| if you want to specify S as vector then use more generic glm_mat4_rmc() func.
|
|
||||||
|
|
||||||
| Example usage:
|
|
||||||
|
|
||||||
.. code-block:: c
|
|
||||||
|
|
||||||
Bs = glm_smc(s, GLM_BEZIER_MAT, (vec4){p0, c0, c1, p1})
|
|
||||||
|
|
||||||
Parameters:
|
|
||||||
| *[in]* **s** parameter between 0 and 1 (this will be [s3, s2, s, 1])
|
|
||||||
| *[in]* **m** basis matrix
|
|
||||||
| *[in]* **c** position/control vector
|
|
||||||
|
|
||||||
Returns:
|
|
||||||
scalar value e.g. Bs
|
|
||||||
@@ -21,7 +21,6 @@ Functions:
|
|||||||
1. :c:func:`glm_mat3_copy`
|
1. :c:func:`glm_mat3_copy`
|
||||||
#. :c:func:`glm_mat3_identity`
|
#. :c:func:`glm_mat3_identity`
|
||||||
#. :c:func:`glm_mat3_identity_array`
|
#. :c:func:`glm_mat3_identity_array`
|
||||||
#. :c:func:`glm_mat3_zero`
|
|
||||||
#. :c:func:`glm_mat3_mul`
|
#. :c:func:`glm_mat3_mul`
|
||||||
#. :c:func:`glm_mat3_transpose_to`
|
#. :c:func:`glm_mat3_transpose_to`
|
||||||
#. :c:func:`glm_mat3_transpose`
|
#. :c:func:`glm_mat3_transpose`
|
||||||
@@ -33,7 +32,6 @@ Functions:
|
|||||||
#. :c:func:`glm_mat3_trace`
|
#. :c:func:`glm_mat3_trace`
|
||||||
#. :c:func:`glm_mat3_swap_col`
|
#. :c:func:`glm_mat3_swap_col`
|
||||||
#. :c:func:`glm_mat3_swap_row`
|
#. :c:func:`glm_mat3_swap_row`
|
||||||
#. :c:func:`glm_mat3_rmc`
|
|
||||||
|
|
||||||
Functions documentation
|
Functions documentation
|
||||||
~~~~~~~~~~~~~~~~~~~~~~~
|
~~~~~~~~~~~~~~~~~~~~~~~
|
||||||
@@ -61,13 +59,6 @@ Functions documentation
|
|||||||
| *[in,out]* **mat** matrix array (must be aligned (16/32) if alignment is not disabled)
|
| *[in,out]* **mat** matrix array (must be aligned (16/32) if alignment is not disabled)
|
||||||
| *[in]* **count** count of matrices
|
| *[in]* **count** count of matrices
|
||||||
|
|
||||||
.. c:function:: void glm_mat3_zero(mat3 mat)
|
|
||||||
|
|
||||||
make given matrix zero
|
|
||||||
|
|
||||||
Parameters:
|
|
||||||
| *[in,out]* **mat** matrix to zero
|
|
||||||
|
|
||||||
.. c:function:: void glm_mat3_mul(mat3 m1, mat3 m2, mat3 dest)
|
.. c:function:: void glm_mat3_mul(mat3 m1, mat3 m2, mat3 dest)
|
||||||
|
|
||||||
multiply m1 and m2 to dest
|
multiply m1 and m2 to dest
|
||||||
@@ -170,20 +161,3 @@ Functions documentation
|
|||||||
| *[in, out]* **mat** matrix
|
| *[in, out]* **mat** matrix
|
||||||
| *[in]* **row1** row1
|
| *[in]* **row1** row1
|
||||||
| *[in]* **row2** row2
|
| *[in]* **row2** row2
|
||||||
|
|
||||||
.. c:function:: float glm_mat3_rmc(vec3 r, mat3 m, vec3 c)
|
|
||||||
|
|
||||||
| **rmc** stands for **Row** * **Matrix** * **Column**
|
|
||||||
|
|
||||||
| helper for R (row vector) * M (matrix) * C (column vector)
|
|
||||||
|
|
||||||
| the result is scalar because R * M = Matrix1x3 (row vector),
|
|
||||||
| then Matrix1x3 * Vec3 (column vector) = Matrix1x1 (Scalar)
|
|
||||||
|
|
||||||
Parameters:
|
|
||||||
| *[in]* **r** row vector or matrix1x3
|
|
||||||
| *[in]* **m** matrix3x3
|
|
||||||
| *[in]* **c** column vector or matrix3x1
|
|
||||||
|
|
||||||
Returns:
|
|
||||||
scalar value e.g. Matrix1x1
|
|
||||||
|
|||||||
@@ -26,7 +26,6 @@ Functions:
|
|||||||
#. :c:func:`glm_mat4_copy`
|
#. :c:func:`glm_mat4_copy`
|
||||||
#. :c:func:`glm_mat4_identity`
|
#. :c:func:`glm_mat4_identity`
|
||||||
#. :c:func:`glm_mat4_identity_array`
|
#. :c:func:`glm_mat4_identity_array`
|
||||||
#. :c:func:`glm_mat4_zero`
|
|
||||||
#. :c:func:`glm_mat4_pick3`
|
#. :c:func:`glm_mat4_pick3`
|
||||||
#. :c:func:`glm_mat4_pick3t`
|
#. :c:func:`glm_mat4_pick3t`
|
||||||
#. :c:func:`glm_mat4_ins3`
|
#. :c:func:`glm_mat4_ins3`
|
||||||
@@ -46,7 +45,6 @@ Functions:
|
|||||||
#. :c:func:`glm_mat4_inv_fast`
|
#. :c:func:`glm_mat4_inv_fast`
|
||||||
#. :c:func:`glm_mat4_swap_col`
|
#. :c:func:`glm_mat4_swap_col`
|
||||||
#. :c:func:`glm_mat4_swap_row`
|
#. :c:func:`glm_mat4_swap_row`
|
||||||
#. :c:func:`glm_mat4_rmc`
|
|
||||||
|
|
||||||
Functions documentation
|
Functions documentation
|
||||||
~~~~~~~~~~~~~~~~~~~~~~~
|
~~~~~~~~~~~~~~~~~~~~~~~
|
||||||
@@ -82,13 +80,6 @@ Functions documentation
|
|||||||
| *[in,out]* **mat** matrix array (must be aligned (16/32) if alignment is not disabled)
|
| *[in,out]* **mat** matrix array (must be aligned (16/32) if alignment is not disabled)
|
||||||
| *[in]* **count** count of matrices
|
| *[in]* **count** count of matrices
|
||||||
|
|
||||||
.. c:function:: void glm_mat4_zero(mat4 mat)
|
|
||||||
|
|
||||||
make given matrix zero
|
|
||||||
|
|
||||||
Parameters:
|
|
||||||
| *[in,out]* **mat** matrix to zero
|
|
||||||
|
|
||||||
.. c:function:: void glm_mat4_pick3(mat4 mat, mat3 dest)
|
.. c:function:: void glm_mat4_pick3(mat4 mat, mat3 dest)
|
||||||
|
|
||||||
copy upper-left of mat4 to mat3
|
copy upper-left of mat4 to mat3
|
||||||
@@ -279,20 +270,3 @@ Functions documentation
|
|||||||
| *[in, out]* **mat** matrix
|
| *[in, out]* **mat** matrix
|
||||||
| *[in]* **row1** row1
|
| *[in]* **row1** row1
|
||||||
| *[in]* **row2** row2
|
| *[in]* **row2** row2
|
||||||
|
|
||||||
.. c:function:: float glm_mat4_rmc(vec4 r, mat4 m, vec4 c)
|
|
||||||
|
|
||||||
| **rmc** stands for **Row** * **Matrix** * **Column**
|
|
||||||
|
|
||||||
| helper for R (row vector) * M (matrix) * C (column vector)
|
|
||||||
|
|
||||||
| the result is scalar because R * M = Matrix1x4 (row vector),
|
|
||||||
| then Matrix1x4 * Vec4 (column vector) = Matrix1x1 (Scalar)
|
|
||||||
|
|
||||||
Parameters:
|
|
||||||
| *[in]* **r** row vector or matrix1x4
|
|
||||||
| *[in]* **m** matrix4x4
|
|
||||||
| *[in]* **c** column vector or matrix4x1
|
|
||||||
|
|
||||||
Returns:
|
|
||||||
scalar value e.g. Matrix1x1
|
|
||||||
|
|||||||
@@ -40,13 +40,3 @@ SSE and SSE2 Shuffle Option
|
|||||||
**_mm_shuffle_ps** generates **shufps** instruction even if registers are same.
|
**_mm_shuffle_ps** generates **shufps** instruction even if registers are same.
|
||||||
You can force it to generate **pshufd** instruction by defining
|
You can force it to generate **pshufd** instruction by defining
|
||||||
**CGLM_USE_INT_DOMAIN** macro. As default it is not defined.
|
**CGLM_USE_INT_DOMAIN** macro. As default it is not defined.
|
||||||
|
|
||||||
SSE3 and SSE4 Dot Product Options
|
|
||||||
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
|
||||||
|
|
||||||
You have two extra options for dot product: **CGLM_SSE4_DOT** and **CGLM_SSE3_DOT**.
|
|
||||||
|
|
||||||
- If **SSE4** is enabled then you can define **CGLM_SSE4_DOT** to force cglm to use **_mm_dp_ps** instruction.
|
|
||||||
- If **SSE3** is enabled then you can define **CGLM_SSE3_DOT** to force cglm to use **_mm_hadd_ps** instructions.
|
|
||||||
|
|
||||||
Otherwise cglm will use its own custom hadd functions, which are optimized too.
|
|
||||||
|
|||||||
@@ -58,7 +58,11 @@ Functions:
|
|||||||
#. :c:func:`glm_vec4_minv`
|
#. :c:func:`glm_vec4_minv`
|
||||||
#. :c:func:`glm_vec4_clamp`
|
#. :c:func:`glm_vec4_clamp`
|
||||||
#. :c:func:`glm_vec4_lerp`
|
#. :c:func:`glm_vec4_lerp`
|
||||||
#. :c:func:`glm_vec4_cubic`
|
#. :c:func:`glm_vec4_isnan`
|
||||||
|
#. :c:func:`glm_vec4_isinf`
|
||||||
|
#. :c:func:`glm_vec4_isvalid`
|
||||||
|
#. :c:func:`glm_vec4_sign`
|
||||||
|
#. :c:func:`glm_vec4_sqrt`
|
||||||
|
|
||||||
Functions documentation
|
Functions documentation
|
||||||
~~~~~~~~~~~~~~~~~~~~~~~
|
~~~~~~~~~~~~~~~~~~~~~~~
|
||||||
@@ -397,11 +401,3 @@ Functions documentation
|
|||||||
| *[in]* **to** to value
|
| *[in]* **to** to value
|
||||||
| *[in]* **t** interpolant (amount) clamped between 0 and 1
|
| *[in]* **t** interpolant (amount) clamped between 0 and 1
|
||||||
| *[out]* **dest** destination
|
| *[out]* **dest** destination
|
||||||
|
|
||||||
.. c:function:: void glm_vec4_cubic(float s, vec4 dest)
|
|
||||||
|
|
||||||
helper to fill vec4 as [S^3, S^2, S, 1]
|
|
||||||
|
|
||||||
Parameters:
|
|
||||||
| *[in]* **s** parameter
|
|
||||||
| *[out]* **dest** destination
|
|
||||||
|
|||||||
@@ -1,152 +0,0 @@
|
|||||||
/*
|
|
||||||
* Copyright (c), Recep Aslantas.
|
|
||||||
*
|
|
||||||
* MIT License (MIT), http://opensource.org/licenses/MIT
|
|
||||||
* Full license can be found in the LICENSE file
|
|
||||||
*/
|
|
||||||
|
|
||||||
#ifndef cglm_bezier_h
|
|
||||||
#define cglm_bezier_h
|
|
||||||
|
|
||||||
#define GLM_BEZIER_MAT_INIT {{-1.0f, 3.0f, -3.0f, 1.0f}, \
|
|
||||||
{ 3.0f, -6.0f, 3.0f, 0.0f}, \
|
|
||||||
{-3.0f, 3.0f, 0.0f, 0.0f}, \
|
|
||||||
{ 1.0f, 0.0f, 0.0f, 0.0f}}
|
|
||||||
#define GLM_HERMITE_MAT_INIT {{ 2.0f, -3.0f, 0.0f, 1.0f}, \
|
|
||||||
{-2.0f, 3.0f, 0.0f, 0.0f}, \
|
|
||||||
{ 1.0f, -2.0f, 1.0f, 0.0f}, \
|
|
||||||
{ 1.0f, -1.0f, 0.0f, 0.0f}}
|
|
||||||
/* for C only */
|
|
||||||
#define GLM_BEZIER_MAT ((mat4)GLM_BEZIER_MAT_INIT)
|
|
||||||
#define GLM_HERMITE_MAT ((mat4)GLM_HERMITE_MAT_INIT)
|
|
||||||
|
|
||||||
#define CGLM_DECASTEL_EPS 1e-9
|
|
||||||
#define CGLM_DECASTEL_MAX 1000
|
|
||||||
#define CGLM_DECASTEL_SMALL 1e-20
|
|
||||||
|
|
||||||
/*!
|
|
||||||
* @brief cubic bezier interpolation
|
|
||||||
*
|
|
||||||
* Formula:
|
|
||||||
* B(s) = P0*(1-s)^3 + 3*C0*s*(1-s)^2 + 3*C1*s^2*(1-s) + P1*s^3
|
|
||||||
*
|
|
||||||
* similar result using matrix:
|
|
||||||
* B(s) = glm_smc(t, GLM_BEZIER_MAT, (vec4){p0, c0, c1, p1})
|
|
||||||
*
|
|
||||||
* glm_eq(glm_smc(...), glm_bezier(...)) should return TRUE
|
|
||||||
*
|
|
||||||
* @param[in] s parameter between 0 and 1
|
|
||||||
* @param[in] p0 begin point
|
|
||||||
* @param[in] c0 control point 1
|
|
||||||
* @param[in] c1 control point 2
|
|
||||||
* @param[in] p1 end point
|
|
||||||
*
|
|
||||||
* @return B(s)
|
|
||||||
*/
|
|
||||||
CGLM_INLINE
|
|
||||||
float
|
|
||||||
glm_bezier(float s, float p0, float c0, float c1, float p1) {
|
|
||||||
float x, xx, ss, xs3, a;
|
|
||||||
|
|
||||||
x = 1.0f - s;
|
|
||||||
xx = x * x;
|
|
||||||
ss = s * s;
|
|
||||||
xs3 = (s - ss) * 3.0f;
|
|
||||||
a = p0 * xx + c0 * xs3;
|
|
||||||
|
|
||||||
return a + s * (c1 * xs3 + p1 * ss - a);
|
|
||||||
}
|
|
||||||
|
|
||||||
/*!
|
|
||||||
* @brief cubic hermite interpolation
|
|
||||||
*
|
|
||||||
* Formula:
|
|
||||||
* H(s) = P0*(2*s^3 - 3*s^2 + 1) + T0*(s^3 - 2*s^2 + s)
|
|
||||||
* + P1*(-2*s^3 + 3*s^2) + T1*(s^3 - s^2)
|
|
||||||
*
|
|
||||||
* similar result using matrix:
|
|
||||||
* H(s) = glm_smc(t, GLM_HERMITE_MAT, (vec4){p0, p1, c0, c1})
|
|
||||||
*
|
|
||||||
* glm_eq(glm_smc(...), glm_hermite(...)) should return TRUE
|
|
||||||
*
|
|
||||||
* @param[in] s parameter between 0 and 1
|
|
||||||
* @param[in] p0 begin point
|
|
||||||
* @param[in] t0 tangent 1
|
|
||||||
* @param[in] t1 tangent 2
|
|
||||||
* @param[in] p1 end point
|
|
||||||
*
|
|
||||||
* @return H(s)
|
|
||||||
*/
|
|
||||||
CGLM_INLINE
|
|
||||||
float
|
|
||||||
glm_hermite(float s, float p0, float t0, float t1, float p1) {
|
|
||||||
float ss, d, a, b, c, e, f;
|
|
||||||
|
|
||||||
ss = s * s;
|
|
||||||
a = ss + ss;
|
|
||||||
c = a + ss;
|
|
||||||
b = a * s;
|
|
||||||
d = s * ss;
|
|
||||||
f = d - ss;
|
|
||||||
e = b - c;
|
|
||||||
|
|
||||||
return p0 * (e + 1.0f) + t0 * (f - ss + s) + t1 * f - p1 * e;
|
|
||||||
}
|
|
||||||
|
|
||||||
/*!
|
|
||||||
* @brief iterative way to solve cubic equation
|
|
||||||
*
|
|
||||||
* @param[in] prm parameter between 0 and 1
|
|
||||||
* @param[in] p0 begin point
|
|
||||||
* @param[in] c0 control point 1
|
|
||||||
* @param[in] c1 control point 2
|
|
||||||
* @param[in] p1 end point
|
|
||||||
*
|
|
||||||
* @return parameter to use in cubic equation
|
|
||||||
*/
|
|
||||||
CGLM_INLINE
|
|
||||||
float
|
|
||||||
glm_decasteljau(float prm, float p0, float c0, float c1, float p1) {
|
|
||||||
float u, v, a, b, c, d, e, f;
|
|
||||||
int i;
|
|
||||||
|
|
||||||
if (prm - p0 < CGLM_DECASTEL_SMALL)
|
|
||||||
return 0.0f;
|
|
||||||
|
|
||||||
if (p1 - prm < CGLM_DECASTEL_SMALL)
|
|
||||||
return 1.0f;
|
|
||||||
|
|
||||||
u = 0.0f;
|
|
||||||
v = 1.0f;
|
|
||||||
|
|
||||||
for (i = 0; i < CGLM_DECASTEL_MAX; i++) {
|
|
||||||
/* de Casteljau Subdivision */
|
|
||||||
a = (p0 + c0) * 0.5f;
|
|
||||||
b = (c0 + c1) * 0.5f;
|
|
||||||
c = (c1 + p1) * 0.5f;
|
|
||||||
d = (a + b) * 0.5f;
|
|
||||||
e = (b + c) * 0.5f;
|
|
||||||
f = (d + e) * 0.5f; /* this one is on the curve! */
|
|
||||||
|
|
||||||
/* The curve point is close enough to our wanted t */
|
|
||||||
if (fabsf(f - prm) < CGLM_DECASTEL_EPS)
|
|
||||||
return glm_clamp_zo((u + v) * 0.5f);
|
|
||||||
|
|
||||||
/* dichotomy */
|
|
||||||
if (f < prm) {
|
|
||||||
p0 = f;
|
|
||||||
c0 = e;
|
|
||||||
c1 = c;
|
|
||||||
u = (u + v) * 0.5f;
|
|
||||||
} else {
|
|
||||||
c0 = a;
|
|
||||||
c1 = d;
|
|
||||||
p1 = f;
|
|
||||||
v = (u + v) * 0.5f;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
return glm_clamp_zo((u + v) * 0.5f);
|
|
||||||
}
|
|
||||||
|
|
||||||
#endif /* cglm_bezier_h */
|
|
||||||
@@ -27,8 +27,6 @@ extern "C" {
|
|||||||
#include "call/project.h"
|
#include "call/project.h"
|
||||||
#include "call/sphere.h"
|
#include "call/sphere.h"
|
||||||
#include "call/ease.h"
|
#include "call/ease.h"
|
||||||
#include "call/curve.h"
|
|
||||||
#include "call/bezier.h"
|
|
||||||
|
|
||||||
#ifdef __cplusplus
|
#ifdef __cplusplus
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -1,31 +0,0 @@
|
|||||||
/*
|
|
||||||
* Copyright (c), Recep Aslantas.
|
|
||||||
*
|
|
||||||
* MIT License (MIT), http://opensource.org/licenses/MIT
|
|
||||||
* Full license can be found in the LICENSE file
|
|
||||||
*/
|
|
||||||
|
|
||||||
#ifndef cglmc_bezier_h
|
|
||||||
#define cglmc_bezier_h
|
|
||||||
#ifdef __cplusplus
|
|
||||||
extern "C" {
|
|
||||||
#endif
|
|
||||||
|
|
||||||
#include "../cglm.h"
|
|
||||||
|
|
||||||
CGLM_EXPORT
|
|
||||||
float
|
|
||||||
glmc_bezier(float s, float p0, float c0, float c1, float p1);
|
|
||||||
|
|
||||||
CGLM_EXPORT
|
|
||||||
float
|
|
||||||
glmc_hermite(float s, float p0, float t0, float t1, float p1);
|
|
||||||
|
|
||||||
CGLM_EXPORT
|
|
||||||
float
|
|
||||||
glmc_decasteljau(float prm, float p0, float c0, float c1, float p1);
|
|
||||||
|
|
||||||
#ifdef __cplusplus
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
#endif /* cglmc_bezier_h */
|
|
||||||
@@ -1,23 +0,0 @@
|
|||||||
/*
|
|
||||||
* Copyright (c), Recep Aslantas.
|
|
||||||
*
|
|
||||||
* MIT License (MIT), http://opensource.org/licenses/MIT
|
|
||||||
* Full license can be found in the LICENSE file
|
|
||||||
*/
|
|
||||||
|
|
||||||
#ifndef cglmc_curve_h
|
|
||||||
#define cglmc_curve_h
|
|
||||||
#ifdef __cplusplus
|
|
||||||
extern "C" {
|
|
||||||
#endif
|
|
||||||
|
|
||||||
#include "../cglm.h"
|
|
||||||
|
|
||||||
CGLM_EXPORT
|
|
||||||
float
|
|
||||||
glmc_smc(float s, mat4 m, vec4 c);
|
|
||||||
|
|
||||||
#ifdef __cplusplus
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
#endif /* cglmc_curve_h */
|
|
||||||
@@ -137,7 +137,4 @@ CGLM_EXPORT
|
|||||||
float
|
float
|
||||||
glmc_ease_bounce_inout(float t);
|
glmc_ease_bounce_inout(float t);
|
||||||
|
|
||||||
#ifdef __cplusplus
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
#endif /* cglmc_ease_h */
|
#endif /* cglmc_ease_h */
|
||||||
|
|||||||
@@ -72,10 +72,6 @@ CGLM_EXPORT
|
|||||||
void
|
void
|
||||||
glmc_mat3_swap_row(mat3 mat, int row1, int row2);
|
glmc_mat3_swap_row(mat3 mat, int row1, int row2);
|
||||||
|
|
||||||
CGLM_EXPORT
|
|
||||||
float
|
|
||||||
glmc_mat3_rmc(vec3 r, mat3 m, vec3 c);
|
|
||||||
|
|
||||||
#ifdef __cplusplus
|
#ifdef __cplusplus
|
||||||
}
|
}
|
||||||
#endif
|
#endif
|
||||||
|
|||||||
@@ -113,10 +113,6 @@ CGLM_EXPORT
|
|||||||
void
|
void
|
||||||
glmc_mat4_swap_row(mat4 mat, int row1, int row2);
|
glmc_mat4_swap_row(mat4 mat, int row1, int row2);
|
||||||
|
|
||||||
CGLM_EXPORT
|
|
||||||
float
|
|
||||||
glmc_mat4_rmc(vec4 r, mat4 m, vec4 c);
|
|
||||||
|
|
||||||
#ifdef __cplusplus
|
#ifdef __cplusplus
|
||||||
}
|
}
|
||||||
#endif
|
#endif
|
||||||
|
|||||||
@@ -33,7 +33,4 @@ CGLM_EXPORT
|
|||||||
bool
|
bool
|
||||||
glmc_sphere_point(vec4 s, vec3 point);
|
glmc_sphere_point(vec4 s, vec3 point);
|
||||||
|
|
||||||
#ifdef __cplusplus
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
#endif /* cglmc_sphere_h */
|
#endif /* cglmc_sphere_h */
|
||||||
|
|||||||
@@ -153,10 +153,6 @@ CGLM_EXPORT
|
|||||||
void
|
void
|
||||||
glmc_vec4_lerp(vec4 from, vec4 to, float t, vec4 dest);
|
glmc_vec4_lerp(vec4 from, vec4 to, float t, vec4 dest);
|
||||||
|
|
||||||
CGLM_EXPORT
|
|
||||||
void
|
|
||||||
glmc_vec4_cubic(float s, vec4 dest);
|
|
||||||
|
|
||||||
/* ext */
|
/* ext */
|
||||||
|
|
||||||
CGLM_EXPORT
|
CGLM_EXPORT
|
||||||
|
|||||||
@@ -84,7 +84,7 @@ glm_frustum(float left,
|
|||||||
mat4 dest) {
|
mat4 dest) {
|
||||||
float rl, tb, fn, nv;
|
float rl, tb, fn, nv;
|
||||||
|
|
||||||
glm_mat4_zero(dest);
|
glm__memzero(float, dest, sizeof(mat4));
|
||||||
|
|
||||||
rl = 1.0f / (right - left);
|
rl = 1.0f / (right - left);
|
||||||
tb = 1.0f / (top - bottom);
|
tb = 1.0f / (top - bottom);
|
||||||
@@ -122,7 +122,7 @@ glm_ortho(float left,
|
|||||||
mat4 dest) {
|
mat4 dest) {
|
||||||
float rl, tb, fn;
|
float rl, tb, fn;
|
||||||
|
|
||||||
glm_mat4_zero(dest);
|
glm__memzero(float, dest, sizeof(mat4));
|
||||||
|
|
||||||
rl = 1.0f / (right - left);
|
rl = 1.0f / (right - left);
|
||||||
tb = 1.0f / (top - bottom);
|
tb = 1.0f / (top - bottom);
|
||||||
@@ -259,7 +259,7 @@ glm_perspective(float fovy,
|
|||||||
mat4 dest) {
|
mat4 dest) {
|
||||||
float f, fn;
|
float f, fn;
|
||||||
|
|
||||||
glm_mat4_zero(dest);
|
glm__memzero(float, dest, sizeof(mat4));
|
||||||
|
|
||||||
f = 1.0f / tanf(fovy * 0.5f);
|
f = 1.0f / tanf(fovy * 0.5f);
|
||||||
fn = 1.0f / (nearVal - farVal);
|
fn = 1.0f / (nearVal - farVal);
|
||||||
|
|||||||
@@ -26,7 +26,5 @@
|
|||||||
#include "project.h"
|
#include "project.h"
|
||||||
#include "sphere.h"
|
#include "sphere.h"
|
||||||
#include "ease.h"
|
#include "ease.h"
|
||||||
#include "curve.h"
|
|
||||||
#include "bezier.h"
|
|
||||||
|
|
||||||
#endif /* cglm_h */
|
#endif /* cglm_h */
|
||||||
|
|||||||
@@ -26,6 +26,34 @@
|
|||||||
# define CGLM_INLINE static inline __attribute((always_inline))
|
# define CGLM_INLINE static inline __attribute((always_inline))
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
#define glm__memcpy(type, dest, src, size) \
|
||||||
|
do { \
|
||||||
|
type *srci; \
|
||||||
|
type *srci_end; \
|
||||||
|
type *desti; \
|
||||||
|
\
|
||||||
|
srci = (type *)src; \
|
||||||
|
srci_end = (type *)((char *)srci + size); \
|
||||||
|
desti = (type *)dest; \
|
||||||
|
\
|
||||||
|
while (srci != srci_end) \
|
||||||
|
*desti++ = *srci++; \
|
||||||
|
} while (0)
|
||||||
|
|
||||||
|
#define glm__memset(type, dest, size, val) \
|
||||||
|
do { \
|
||||||
|
type *desti; \
|
||||||
|
type *desti_end; \
|
||||||
|
\
|
||||||
|
desti = (type *)dest; \
|
||||||
|
desti_end = (type *)((char *)desti + size); \
|
||||||
|
\
|
||||||
|
while (desti != desti_end) \
|
||||||
|
*desti++ = val; \
|
||||||
|
} while (0)
|
||||||
|
|
||||||
|
#define glm__memzero(type, dest, size) glm__memset(type, dest, size, 0)
|
||||||
|
|
||||||
#include "types.h"
|
#include "types.h"
|
||||||
#include "simd/intrin.h"
|
#include "simd/intrin.h"
|
||||||
|
|
||||||
|
|||||||
@@ -1,40 +0,0 @@
|
|||||||
/*
|
|
||||||
* Copyright (c), Recep Aslantas.
|
|
||||||
*
|
|
||||||
* MIT License (MIT), http://opensource.org/licenses/MIT
|
|
||||||
* Full license can be found in the LICENSE file
|
|
||||||
*/
|
|
||||||
|
|
||||||
#ifndef cglm_curve_h
|
|
||||||
#define cglm_curve_h
|
|
||||||
|
|
||||||
#include "common.h"
|
|
||||||
#include "vec4.h"
|
|
||||||
#include "mat4.h"
|
|
||||||
|
|
||||||
/*!
|
|
||||||
* @brief helper function to calculate S*M*C multiplication for curves
|
|
||||||
*
|
|
||||||
* This function does not encourage you to use SMC,
|
|
||||||
* instead it is a helper if you use SMC.
|
|
||||||
*
|
|
||||||
* if you want to specify S as vector then use more generic glm_mat4_rmc() func.
|
|
||||||
*
|
|
||||||
* Example usage:
|
|
||||||
* B(s) = glm_smc(s, GLM_BEZIER_MAT, (vec4){p0, c0, c1, p1})
|
|
||||||
*
|
|
||||||
* @param[in] s parameter between 0 and 1 (this will be [s3, s2, s, 1])
|
|
||||||
* @param[in] m basis matrix
|
|
||||||
* @param[in] c position/control vector
|
|
||||||
*
|
|
||||||
* @return B(s)
|
|
||||||
*/
|
|
||||||
CGLM_INLINE
|
|
||||||
float
|
|
||||||
glm_smc(float s, mat4 m, vec4 c) {
|
|
||||||
vec4 vs;
|
|
||||||
glm_vec4_cubic(s, vs);
|
|
||||||
return glm_mat4_rmc(vs, m, c);
|
|
||||||
}
|
|
||||||
|
|
||||||
#endif /* cglm_curve_h */
|
|
||||||
@@ -17,19 +17,16 @@
|
|||||||
CGLM_INLINE void glm_mat3_copy(mat3 mat, mat3 dest);
|
CGLM_INLINE void glm_mat3_copy(mat3 mat, mat3 dest);
|
||||||
CGLM_INLINE void glm_mat3_identity(mat3 mat);
|
CGLM_INLINE void glm_mat3_identity(mat3 mat);
|
||||||
CGLM_INLINE void glm_mat3_identity_array(mat3 * restrict mat, size_t count);
|
CGLM_INLINE void glm_mat3_identity_array(mat3 * restrict mat, size_t count);
|
||||||
CGLM_INLINE void glm_mat3_zero(mat3 mat);
|
|
||||||
CGLM_INLINE void glm_mat3_mul(mat3 m1, mat3 m2, mat3 dest);
|
CGLM_INLINE void glm_mat3_mul(mat3 m1, mat3 m2, mat3 dest);
|
||||||
CGLM_INLINE void glm_mat3_transpose_to(mat3 m, mat3 dest);
|
CGLM_INLINE void glm_mat3_transpose_to(mat3 m, mat3 dest);
|
||||||
CGLM_INLINE void glm_mat3_transpose(mat3 m);
|
CGLM_INLINE void glm_mat3_transpose(mat3 m);
|
||||||
CGLM_INLINE void glm_mat3_mulv(mat3 m, vec3 v, vec3 dest);
|
CGLM_INLINE void glm_mat3_mulv(mat3 m, vec3 v, vec3 dest);
|
||||||
CGLM_INLINE float glm_mat3_trace(mat3 m);
|
CGLM_INLINE float glm_mat3_trace(mat3 m);
|
||||||
CGLM_INLINE void glm_mat3_quat(mat3 m, versor dest);
|
|
||||||
CGLM_INLINE void glm_mat3_scale(mat3 m, float s);
|
CGLM_INLINE void glm_mat3_scale(mat3 m, float s);
|
||||||
CGLM_INLINE float glm_mat3_det(mat3 mat);
|
CGLM_INLINE float glm_mat3_det(mat3 mat);
|
||||||
CGLM_INLINE void glm_mat3_inv(mat3 mat, mat3 dest);
|
CGLM_INLINE void glm_mat3_inv(mat3 mat, mat3 dest);
|
||||||
CGLM_INLINE void glm_mat3_swap_col(mat3 mat, int col1, int col2);
|
CGLM_INLINE void glm_mat3_swap_col(mat3 mat, int col1, int col2);
|
||||||
CGLM_INLINE void glm_mat3_swap_row(mat3 mat, int row1, int row2);
|
CGLM_INLINE void glm_mat3_swap_row(mat3 mat, int row1, int row2);
|
||||||
CGLM_INLINE float glm_mat3_rmc(vec3 r, mat3 m, vec3 c);
|
|
||||||
*/
|
*/
|
||||||
|
|
||||||
#ifndef cglm_mat3_h
|
#ifndef cglm_mat3_h
|
||||||
@@ -66,17 +63,7 @@
|
|||||||
CGLM_INLINE
|
CGLM_INLINE
|
||||||
void
|
void
|
||||||
glm_mat3_copy(mat3 mat, mat3 dest) {
|
glm_mat3_copy(mat3 mat, mat3 dest) {
|
||||||
dest[0][0] = mat[0][0];
|
glm__memcpy(float, dest, mat, sizeof(mat3));
|
||||||
dest[0][1] = mat[0][1];
|
|
||||||
dest[0][2] = mat[0][2];
|
|
||||||
|
|
||||||
dest[1][0] = mat[1][0];
|
|
||||||
dest[1][1] = mat[1][1];
|
|
||||||
dest[1][2] = mat[1][2];
|
|
||||||
|
|
||||||
dest[2][0] = mat[2][0];
|
|
||||||
dest[2][1] = mat[2][1];
|
|
||||||
dest[2][2] = mat[2][2];
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/*!
|
/*!
|
||||||
@@ -119,18 +106,6 @@ glm_mat3_identity_array(mat3 * __restrict mat, size_t count) {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
/*!
|
|
||||||
* @brief make given matrix zero.
|
|
||||||
*
|
|
||||||
* @param[in, out] mat matrix
|
|
||||||
*/
|
|
||||||
CGLM_INLINE
|
|
||||||
void
|
|
||||||
glm_mat3_zero(mat3 mat) {
|
|
||||||
CGLM_ALIGN_MAT mat3 t = GLM_MAT3_ZERO_INIT;
|
|
||||||
glm_mat3_copy(t, mat);
|
|
||||||
}
|
|
||||||
|
|
||||||
/*!
|
/*!
|
||||||
* @brief multiply m1 and m2 to dest
|
* @brief multiply m1 and m2 to dest
|
||||||
*
|
*
|
||||||
@@ -397,26 +372,4 @@ glm_mat3_swap_row(mat3 mat, int row1, int row2) {
|
|||||||
mat[2][row2] = tmp[2];
|
mat[2][row2] = tmp[2];
|
||||||
}
|
}
|
||||||
|
|
||||||
/*!
|
|
||||||
* @brief helper for R (row vector) * M (matrix) * C (column vector)
|
|
||||||
*
|
|
||||||
* rmc stands for Row * Matrix * Column
|
|
||||||
*
|
|
||||||
* the result is scalar because R * M = Matrix1x3 (row vector),
|
|
||||||
* then Matrix1x3 * Vec3 (column vector) = Matrix1x1 (Scalar)
|
|
||||||
*
|
|
||||||
* @param[in] r row vector or matrix1x3
|
|
||||||
* @param[in] m matrix3x3
|
|
||||||
* @param[in] c column vector or matrix3x1
|
|
||||||
*
|
|
||||||
* @return scalar value e.g. Matrix1x1
|
|
||||||
*/
|
|
||||||
CGLM_INLINE
|
|
||||||
float
|
|
||||||
glm_mat3_rmc(vec3 r, mat3 m, vec3 c) {
|
|
||||||
vec3 tmp;
|
|
||||||
glm_mat3_mulv(m, c, tmp);
|
|
||||||
return glm_vec3_dot(r, tmp);
|
|
||||||
}
|
|
||||||
|
|
||||||
#endif /* cglm_mat3_h */
|
#endif /* cglm_mat3_h */
|
||||||
|
|||||||
@@ -22,7 +22,6 @@
|
|||||||
CGLM_INLINE void glm_mat4_copy(mat4 mat, mat4 dest);
|
CGLM_INLINE void glm_mat4_copy(mat4 mat, mat4 dest);
|
||||||
CGLM_INLINE void glm_mat4_identity(mat4 mat);
|
CGLM_INLINE void glm_mat4_identity(mat4 mat);
|
||||||
CGLM_INLINE void glm_mat4_identity_array(mat4 * restrict mat, size_t count);
|
CGLM_INLINE void glm_mat4_identity_array(mat4 * restrict mat, size_t count);
|
||||||
CGLM_INLINE void glm_mat4_zero(mat4 mat);
|
|
||||||
CGLM_INLINE void glm_mat4_pick3(mat4 mat, mat3 dest);
|
CGLM_INLINE void glm_mat4_pick3(mat4 mat, mat3 dest);
|
||||||
CGLM_INLINE void glm_mat4_pick3t(mat4 mat, mat3 dest);
|
CGLM_INLINE void glm_mat4_pick3t(mat4 mat, mat3 dest);
|
||||||
CGLM_INLINE void glm_mat4_ins3(mat3 mat, mat4 dest);
|
CGLM_INLINE void glm_mat4_ins3(mat3 mat, mat4 dest);
|
||||||
@@ -32,7 +31,6 @@
|
|||||||
CGLM_INLINE void glm_mat4_mulv3(mat4 m, vec3 v, vec3 dest);
|
CGLM_INLINE void glm_mat4_mulv3(mat4 m, vec3 v, vec3 dest);
|
||||||
CGLM_INLINE float glm_mat4_trace(mat4 m);
|
CGLM_INLINE float glm_mat4_trace(mat4 m);
|
||||||
CGLM_INLINE float glm_mat4_trace3(mat4 m);
|
CGLM_INLINE float glm_mat4_trace3(mat4 m);
|
||||||
CGLM_INLINE void glm_mat4_quat(mat4 m, versor dest) ;
|
|
||||||
CGLM_INLINE void glm_mat4_transpose_to(mat4 m, mat4 dest);
|
CGLM_INLINE void glm_mat4_transpose_to(mat4 m, mat4 dest);
|
||||||
CGLM_INLINE void glm_mat4_transpose(mat4 m);
|
CGLM_INLINE void glm_mat4_transpose(mat4 m);
|
||||||
CGLM_INLINE void glm_mat4_scale_p(mat4 m, float s);
|
CGLM_INLINE void glm_mat4_scale_p(mat4 m, float s);
|
||||||
@@ -42,7 +40,6 @@
|
|||||||
CGLM_INLINE void glm_mat4_inv_fast(mat4 mat, mat4 dest);
|
CGLM_INLINE void glm_mat4_inv_fast(mat4 mat, mat4 dest);
|
||||||
CGLM_INLINE void glm_mat4_swap_col(mat4 mat, int col1, int col2);
|
CGLM_INLINE void glm_mat4_swap_col(mat4 mat, int col1, int col2);
|
||||||
CGLM_INLINE void glm_mat4_swap_row(mat4 mat, int row1, int row2);
|
CGLM_INLINE void glm_mat4_swap_row(mat4 mat, int row1, int row2);
|
||||||
CGLM_INLINE float glm_mat4_rmc(vec4 r, mat4 m, vec4 c);
|
|
||||||
*/
|
*/
|
||||||
|
|
||||||
#ifndef cglm_mat_h
|
#ifndef cglm_mat_h
|
||||||
@@ -101,15 +98,7 @@
|
|||||||
CGLM_INLINE
|
CGLM_INLINE
|
||||||
void
|
void
|
||||||
glm_mat4_ucopy(mat4 mat, mat4 dest) {
|
glm_mat4_ucopy(mat4 mat, mat4 dest) {
|
||||||
dest[0][0] = mat[0][0]; dest[1][0] = mat[1][0];
|
glm__memcpy(float, dest, mat, sizeof(mat4));
|
||||||
dest[0][1] = mat[0][1]; dest[1][1] = mat[1][1];
|
|
||||||
dest[0][2] = mat[0][2]; dest[1][2] = mat[1][2];
|
|
||||||
dest[0][3] = mat[0][3]; dest[1][3] = mat[1][3];
|
|
||||||
|
|
||||||
dest[2][0] = mat[2][0]; dest[3][0] = mat[3][0];
|
|
||||||
dest[2][1] = mat[2][1]; dest[3][1] = mat[3][1];
|
|
||||||
dest[2][2] = mat[2][2]; dest[3][2] = mat[3][2];
|
|
||||||
dest[2][3] = mat[2][3]; dest[3][3] = mat[3][3];
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/*!
|
/*!
|
||||||
@@ -129,11 +118,6 @@ glm_mat4_copy(mat4 mat, mat4 dest) {
|
|||||||
glmm_store(dest[1], glmm_load(mat[1]));
|
glmm_store(dest[1], glmm_load(mat[1]));
|
||||||
glmm_store(dest[2], glmm_load(mat[2]));
|
glmm_store(dest[2], glmm_load(mat[2]));
|
||||||
glmm_store(dest[3], glmm_load(mat[3]));
|
glmm_store(dest[3], glmm_load(mat[3]));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(dest[0], vld1q_f32(mat[0]));
|
|
||||||
vst1q_f32(dest[1], vld1q_f32(mat[1]));
|
|
||||||
vst1q_f32(dest[2], vld1q_f32(mat[2]));
|
|
||||||
vst1q_f32(dest[3], vld1q_f32(mat[3]));
|
|
||||||
#else
|
#else
|
||||||
glm_mat4_ucopy(mat, dest);
|
glm_mat4_ucopy(mat, dest);
|
||||||
#endif
|
#endif
|
||||||
@@ -179,18 +163,6 @@ glm_mat4_identity_array(mat4 * __restrict mat, size_t count) {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
/*!
|
|
||||||
* @brief make given matrix zero.
|
|
||||||
*
|
|
||||||
* @param[in, out] mat matrix
|
|
||||||
*/
|
|
||||||
CGLM_INLINE
|
|
||||||
void
|
|
||||||
glm_mat4_zero(mat4 mat) {
|
|
||||||
CGLM_ALIGN_MAT mat4 t = GLM_MAT4_ZERO_INIT;
|
|
||||||
glm_mat4_copy(t, mat);
|
|
||||||
}
|
|
||||||
|
|
||||||
/*!
|
/*!
|
||||||
* @brief copy upper-left of mat4 to mat3
|
* @brief copy upper-left of mat4 to mat3
|
||||||
*
|
*
|
||||||
@@ -280,7 +252,7 @@ glm_mat4_mul(mat4 m1, mat4 m2, mat4 dest) {
|
|||||||
glm_mat4_mul_avx(m1, m2, dest);
|
glm_mat4_mul_avx(m1, m2, dest);
|
||||||
#elif defined( __SSE__ ) || defined( __SSE2__ )
|
#elif defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
glm_mat4_mul_sse2(m1, m2, dest);
|
glm_mat4_mul_sse2(m1, m2, dest);
|
||||||
#elif defined(CGLM_NEON_FP)
|
#elif defined( __ARM_NEON_FP )
|
||||||
glm_mat4_mul_neon(m1, m2, dest);
|
glm_mat4_mul_neon(m1, m2, dest);
|
||||||
#else
|
#else
|
||||||
float a00 = m1[0][0], a01 = m1[0][1], a02 = m1[0][2], a03 = m1[0][3],
|
float a00 = m1[0][0], a01 = m1[0][1], a02 = m1[0][2], a03 = m1[0][3],
|
||||||
@@ -497,8 +469,10 @@ glm_mat4_transpose(mat4 m) {
|
|||||||
glm_mat4_transp_sse2(m, m);
|
glm_mat4_transp_sse2(m, m);
|
||||||
#else
|
#else
|
||||||
mat4 d;
|
mat4 d;
|
||||||
|
|
||||||
glm_mat4_transpose_to(m, d);
|
glm_mat4_transpose_to(m, d);
|
||||||
glm_mat4_ucopy(d, m);
|
|
||||||
|
glm__memcpy(float, m, d, sizeof(mat4));
|
||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -530,15 +504,10 @@ glm_mat4_scale_p(mat4 m, float s) {
|
|||||||
CGLM_INLINE
|
CGLM_INLINE
|
||||||
void
|
void
|
||||||
glm_mat4_scale(mat4 m, float s) {
|
glm_mat4_scale(mat4 m, float s) {
|
||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
#ifdef __AVX__
|
||||||
|
glm_mat4_scale_avx(m, s);
|
||||||
|
#elif defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
glm_mat4_scale_sse2(m, s);
|
glm_mat4_scale_sse2(m, s);
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
float32x4_t v0;
|
|
||||||
v0 = vdupq_n_f32(s);
|
|
||||||
vst1q_f32(m[0], vmulq_f32(vld1q_f32(m[0]), v0));
|
|
||||||
vst1q_f32(m[1], vmulq_f32(vld1q_f32(m[1]), v0));
|
|
||||||
vst1q_f32(m[2], vmulq_f32(vld1q_f32(m[2]), v0));
|
|
||||||
vst1q_f32(m[3], vmulq_f32(vld1q_f32(m[3]), v0));
|
|
||||||
#else
|
#else
|
||||||
glm_mat4_scale_p(m, s);
|
glm_mat4_scale_p(m, s);
|
||||||
#endif
|
#endif
|
||||||
@@ -587,7 +556,9 @@ glm_mat4_det(mat4 mat) {
|
|||||||
CGLM_INLINE
|
CGLM_INLINE
|
||||||
void
|
void
|
||||||
glm_mat4_inv(mat4 mat, mat4 dest) {
|
glm_mat4_inv(mat4 mat, mat4 dest) {
|
||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
#ifdef __AVX__
|
||||||
|
glm_mat4_inv_avx(mat, dest);
|
||||||
|
#elif defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
glm_mat4_inv_sse2(mat, dest);
|
glm_mat4_inv_sse2(mat, dest);
|
||||||
#else
|
#else
|
||||||
float t[6];
|
float t[6];
|
||||||
@@ -648,7 +619,9 @@ glm_mat4_inv(mat4 mat, mat4 dest) {
|
|||||||
CGLM_INLINE
|
CGLM_INLINE
|
||||||
void
|
void
|
||||||
glm_mat4_inv_fast(mat4 mat, mat4 dest) {
|
glm_mat4_inv_fast(mat4 mat, mat4 dest) {
|
||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
#ifdef __AVX__
|
||||||
|
glm_mat4_inv_fast_avx(mat, dest);
|
||||||
|
#elif defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
glm_mat4_inv_fast_sse2(mat, dest);
|
glm_mat4_inv_fast_sse2(mat, dest);
|
||||||
#else
|
#else
|
||||||
glm_mat4_inv(mat, dest);
|
glm_mat4_inv(mat, dest);
|
||||||
@@ -698,26 +671,4 @@ glm_mat4_swap_row(mat4 mat, int row1, int row2) {
|
|||||||
mat[3][row2] = tmp[3];
|
mat[3][row2] = tmp[3];
|
||||||
}
|
}
|
||||||
|
|
||||||
/*!
|
|
||||||
* @brief helper for R (row vector) * M (matrix) * C (column vector)
|
|
||||||
*
|
|
||||||
* rmc stands for Row * Matrix * Column
|
|
||||||
*
|
|
||||||
* the result is scalar because R * M = Matrix1x4 (row vector),
|
|
||||||
* then Matrix1x4 * Vec4 (column vector) = Matrix1x1 (Scalar)
|
|
||||||
*
|
|
||||||
* @param[in] r row vector or matrix1x4
|
|
||||||
* @param[in] m matrix4x4
|
|
||||||
* @param[in] c column vector or matrix4x1
|
|
||||||
*
|
|
||||||
* @return scalar value e.g. B(s)
|
|
||||||
*/
|
|
||||||
CGLM_INLINE
|
|
||||||
float
|
|
||||||
glm_mat4_rmc(vec4 r, mat4 m, vec4 c) {
|
|
||||||
vec4 tmp;
|
|
||||||
glm_mat4_mulv(m, c, tmp);
|
|
||||||
return glm_vec4_dot(r, tmp);
|
|
||||||
}
|
|
||||||
|
|
||||||
#endif /* cglm_mat_h */
|
#endif /* cglm_mat_h */
|
||||||
|
|||||||
@@ -218,7 +218,7 @@ glm_quat_normalize_to(versor q, versor dest) {
|
|||||||
float dot;
|
float dot;
|
||||||
|
|
||||||
x0 = glmm_load(q);
|
x0 = glmm_load(q);
|
||||||
xdot = glmm_vdot(x0, x0);
|
xdot = glmm_dot(x0, x0);
|
||||||
dot = _mm_cvtss_f32(xdot);
|
dot = _mm_cvtss_f32(xdot);
|
||||||
|
|
||||||
if (dot <= 0.0f) {
|
if (dot <= 0.0f) {
|
||||||
|
|||||||
@@ -1,41 +0,0 @@
|
|||||||
/*
|
|
||||||
* Copyright (c), Recep Aslantas.
|
|
||||||
*
|
|
||||||
* MIT License (MIT), http://opensource.org/licenses/MIT
|
|
||||||
* Full license can be found in the LICENSE file
|
|
||||||
*/
|
|
||||||
|
|
||||||
#ifndef cglm_simd_arm_h
|
|
||||||
#define cglm_simd_arm_h
|
|
||||||
#include "intrin.h"
|
|
||||||
#ifdef CGLM_SIMD_ARM
|
|
||||||
|
|
||||||
#define glmm_load(p) vld1q_f32(p)
|
|
||||||
#define glmm_store(p, a) vst1q_f32(p, a)
|
|
||||||
|
|
||||||
static inline
|
|
||||||
float
|
|
||||||
glmm_hadd(float32x4_t v) {
|
|
||||||
#if defined(__aarch64__)
|
|
||||||
return vaddvq_f32(v);
|
|
||||||
#else
|
|
||||||
v = vaddq_f32(v, vrev64q_f32(v));
|
|
||||||
v = vaddq_f32(v, vcombine_f32(vget_high_f32(v), vget_low_f32(v)));
|
|
||||||
return vgetq_lane_f32(v, 0);
|
|
||||||
#endif
|
|
||||||
}
|
|
||||||
|
|
||||||
static inline
|
|
||||||
float
|
|
||||||
glmm_dot(float32x4_t a, float32x4_t b) {
|
|
||||||
return glmm_hadd(vmulq_f32(a, b));
|
|
||||||
}
|
|
||||||
|
|
||||||
static inline
|
|
||||||
float
|
|
||||||
glmm_norm(float32x4_t a) {
|
|
||||||
return sqrtf(glmm_dot(a, a));
|
|
||||||
}
|
|
||||||
|
|
||||||
#endif
|
|
||||||
#endif /* cglm_simd_arm_h */
|
|
||||||
@@ -14,12 +14,23 @@
|
|||||||
|
|
||||||
#include <immintrin.h>
|
#include <immintrin.h>
|
||||||
|
|
||||||
|
CGLM_INLINE
|
||||||
|
void
|
||||||
|
glm_mat4_scale_avx(mat4 m, float s) {
|
||||||
|
__m256 y0;
|
||||||
|
y0 = _mm256_set1_ps(s);
|
||||||
|
|
||||||
|
glmm_store256(m[0], _mm256_mul_ps(y0, glmm_load256(m[0])));
|
||||||
|
glmm_store256(m[2], _mm256_mul_ps(y0, glmm_load256(m[2])));
|
||||||
|
}
|
||||||
|
|
||||||
CGLM_INLINE
|
CGLM_INLINE
|
||||||
void
|
void
|
||||||
glm_mat4_mul_avx(mat4 m1, mat4 m2, mat4 dest) {
|
glm_mat4_mul_avx(mat4 m1, mat4 m2, mat4 dest) {
|
||||||
/* D = R * L (Column-Major) */
|
/* D = R * L (Column-Major) */
|
||||||
|
|
||||||
__m256 y0, y1, y2, y3, y4, y5, y6, y7, y8, y9;
|
__m256 y0, y1, y2, y3, y4, y5, y6, y7, y8, y9;
|
||||||
|
__m256i yi0, yi1, yi2, yi3;
|
||||||
|
|
||||||
y0 = glmm_load256(m2[0]); /* h g f e d c b a */
|
y0 = glmm_load256(m2[0]); /* h g f e d c b a */
|
||||||
y1 = glmm_load256(m2[2]); /* p o n m l k j i */
|
y1 = glmm_load256(m2[2]); /* p o n m l k j i */
|
||||||
@@ -31,14 +42,19 @@ glm_mat4_mul_avx(mat4 m1, mat4 m2, mat4 dest) {
|
|||||||
y4 = _mm256_permute2f128_ps(y2, y2, 0x03); /* d c b a h g f e */
|
y4 = _mm256_permute2f128_ps(y2, y2, 0x03); /* d c b a h g f e */
|
||||||
y5 = _mm256_permute2f128_ps(y3, y3, 0x03); /* l k j i p o n m */
|
y5 = _mm256_permute2f128_ps(y3, y3, 0x03); /* l k j i p o n m */
|
||||||
|
|
||||||
|
yi0 = _mm256_set_epi32(1, 1, 1, 1, 0, 0, 0, 0);
|
||||||
|
yi1 = _mm256_set_epi32(3, 3, 3, 3, 2, 2, 2, 2);
|
||||||
|
yi2 = _mm256_set_epi32(0, 0, 0, 0, 1, 1, 1, 1);
|
||||||
|
yi3 = _mm256_set_epi32(2, 2, 2, 2, 3, 3, 3, 3);
|
||||||
|
|
||||||
/* f f f f a a a a */
|
/* f f f f a a a a */
|
||||||
/* h h h h c c c c */
|
/* h h h h c c c c */
|
||||||
/* e e e e b b b b */
|
/* e e e e b b b b */
|
||||||
/* g g g g d d d d */
|
/* g g g g d d d d */
|
||||||
y6 = _mm256_permutevar_ps(y0, _mm256_set_epi32(1, 1, 1, 1, 0, 0, 0, 0));
|
y6 = _mm256_permutevar_ps(y0, yi0);
|
||||||
y7 = _mm256_permutevar_ps(y0, _mm256_set_epi32(3, 3, 3, 3, 2, 2, 2, 2));
|
y7 = _mm256_permutevar_ps(y0, yi1);
|
||||||
y8 = _mm256_permutevar_ps(y0, _mm256_set_epi32(0, 0, 0, 0, 1, 1, 1, 1));
|
y8 = _mm256_permutevar_ps(y0, yi2);
|
||||||
y9 = _mm256_permutevar_ps(y0, _mm256_set_epi32(2, 2, 2, 2, 3, 3, 3, 3));
|
y9 = _mm256_permutevar_ps(y0, yi3);
|
||||||
|
|
||||||
glmm_store256(dest[0],
|
glmm_store256(dest[0],
|
||||||
_mm256_add_ps(_mm256_add_ps(_mm256_mul_ps(y2, y6),
|
_mm256_add_ps(_mm256_add_ps(_mm256_mul_ps(y2, y6),
|
||||||
@@ -50,10 +66,10 @@ glm_mat4_mul_avx(mat4 m1, mat4 m2, mat4 dest) {
|
|||||||
/* p p p p k k k k */
|
/* p p p p k k k k */
|
||||||
/* m m m m j j j j */
|
/* m m m m j j j j */
|
||||||
/* o o o o l l l l */
|
/* o o o o l l l l */
|
||||||
y6 = _mm256_permutevar_ps(y1, _mm256_set_epi32(1, 1, 1, 1, 0, 0, 0, 0));
|
y6 = _mm256_permutevar_ps(y1, yi0);
|
||||||
y7 = _mm256_permutevar_ps(y1, _mm256_set_epi32(3, 3, 3, 3, 2, 2, 2, 2));
|
y7 = _mm256_permutevar_ps(y1, yi1);
|
||||||
y8 = _mm256_permutevar_ps(y1, _mm256_set_epi32(0, 0, 0, 0, 1, 1, 1, 1));
|
y8 = _mm256_permutevar_ps(y1, yi2);
|
||||||
y9 = _mm256_permutevar_ps(y1, _mm256_set_epi32(2, 2, 2, 2, 3, 3, 3, 3));
|
y9 = _mm256_permutevar_ps(y1, yi3);
|
||||||
|
|
||||||
glmm_store256(dest[2],
|
glmm_store256(dest[2],
|
||||||
_mm256_add_ps(_mm256_add_ps(_mm256_mul_ps(y2, y6),
|
_mm256_add_ps(_mm256_add_ps(_mm256_mul_ps(y2, y6),
|
||||||
@@ -62,5 +78,365 @@ glm_mat4_mul_avx(mat4 m1, mat4 m2, mat4 dest) {
|
|||||||
_mm256_mul_ps(y5, y9))));
|
_mm256_mul_ps(y5, y9))));
|
||||||
}
|
}
|
||||||
|
|
||||||
|
CGLM_INLINE
|
||||||
|
void
|
||||||
|
glm_mat4_inv_avx(mat4 mat, mat4 dest) {
|
||||||
|
__m256 y0, y1, y2, y3, y4, y5, y6, y7, y8, y9, y10, y11, y12, y13;
|
||||||
|
__m256 yt0, yt1, yt2;
|
||||||
|
__m256 t0, t1, t2;
|
||||||
|
__m256 r1, r2;
|
||||||
|
__m256 flpsign;
|
||||||
|
__m256i yi1, yi2, yi3;
|
||||||
|
|
||||||
|
y0 = glmm_load256(mat[0]); /* h g f e d c b a */
|
||||||
|
y1 = glmm_load256(mat[2]); /* p o n m l k j i */
|
||||||
|
|
||||||
|
y2 = _mm256_permute2f128_ps(y1, y1, 0x00); /* l k j i l k j i */
|
||||||
|
y3 = _mm256_permute2f128_ps(y1, y1, 0x11); /* p o n m p o n m */
|
||||||
|
y4 = _mm256_permute2f128_ps(y0, y0, 0x03); /* d c b a h g f e */
|
||||||
|
y13 = _mm256_permute2f128_ps(y4, y4, 0x00); /* h g f e h g f e */
|
||||||
|
|
||||||
|
yi1 = _mm256_set_epi32(0, 0, 0, 0, 0, 1, 1, 2);
|
||||||
|
yi2 = _mm256_set_epi32(1, 1, 1, 2, 3, 2, 3, 3);
|
||||||
|
flpsign = _mm256_set_ps(0.f, -0.f, 0.f, -0.f, -0.f, 0.f, -0.f, 0.f);
|
||||||
|
|
||||||
|
/* i i i i i j j k */
|
||||||
|
/* n n n o p o p p */
|
||||||
|
/* m m m m m n n o */
|
||||||
|
/* j j j k l k l l */
|
||||||
|
/* e e e e e f f g */
|
||||||
|
/* f f f g h g h h */
|
||||||
|
y5 = _mm256_permutevar_ps(y2, yi1);
|
||||||
|
y6 = _mm256_permutevar_ps(y3, yi2);
|
||||||
|
y7 = _mm256_permutevar_ps(y3, yi1);
|
||||||
|
y8 = _mm256_permutevar_ps(y2, yi2);
|
||||||
|
y2 = _mm256_permutevar_ps(y13, yi1);
|
||||||
|
y3 = _mm256_permutevar_ps(y13, yi2);
|
||||||
|
|
||||||
|
yi1 = _mm256_set_epi32(2, 1, 0, 0, 2, 1, 0, 0);
|
||||||
|
yi2 = _mm256_set_epi32(2, 1, 1, 0, 2, 1, 1, 0);
|
||||||
|
yi3 = _mm256_set_epi32(3, 3, 2, 0, 3, 3, 2, 0);
|
||||||
|
|
||||||
|
/*
|
||||||
|
t0[0] = k * p - o * l; t1[0] = g * p - o * h; t2[0] = g * l - k * h;
|
||||||
|
t0[1] = j * p - n * l; t1[1] = f * p - n * h; t2[1] = f * l - j * h;
|
||||||
|
t0[2] = j * o - n * k; t1[2] = f * o - n * g; t2[2] = f * k - j * g;
|
||||||
|
t0[3] = i * p - m * l; t1[3] = e * p - m * h; t2[3] = e * l - i * h;
|
||||||
|
t0[4] = i * o - m * k; t1[4] = e * o - m * g; t2[4] = e * k - i * g;
|
||||||
|
t0[5] = i * n - m * j; t1[5] = e * n - m * f; t2[5] = e * j - i * f;
|
||||||
|
*/
|
||||||
|
yt0 = _mm256_sub_ps(_mm256_mul_ps(y5, y6), _mm256_mul_ps(y7, y8));
|
||||||
|
yt1 = _mm256_sub_ps(_mm256_mul_ps(y2, y6), _mm256_mul_ps(y7, y3));
|
||||||
|
yt2 = _mm256_sub_ps(_mm256_mul_ps(y2, y8), _mm256_mul_ps(y5, y3));
|
||||||
|
|
||||||
|
/* t3 t2 t1 t0 t3 t2 t1 t0 */
|
||||||
|
/* t5 t5 t5 t4 t5 t5 t5 t4 */
|
||||||
|
y9 = _mm256_permute2f128_ps(yt0, yt0, 0x00);
|
||||||
|
y10 = _mm256_permute2f128_ps(yt0, yt0, 0x11);
|
||||||
|
//
|
||||||
|
/* t2 t1 t0 t0 t2 t1 t0 t0 */
|
||||||
|
t0 = _mm256_permutevar_ps(y9, yi1);
|
||||||
|
|
||||||
|
/* t4 t3 t3 t1 t4 t3 t3 t1 */
|
||||||
|
y11 = _mm256_shuffle_ps(y9, y10, 0x4D);
|
||||||
|
y12 = _mm256_permutevar_ps(y11, yi2);
|
||||||
|
t1 = _mm256_permute2f128_ps(y12, y9, 0x00);
|
||||||
|
|
||||||
|
/* t5 t5 t4 t2 t5 t5 t4 t2 */
|
||||||
|
y11 = _mm256_shuffle_ps(y9, y10, 0x4A);
|
||||||
|
y12 = _mm256_permutevar_ps(y11, yi3);
|
||||||
|
t2 = _mm256_permute2f128_ps(y12, y12, 0x00);
|
||||||
|
|
||||||
|
/* a a a b e e e f */
|
||||||
|
/* b b c c f f g g */
|
||||||
|
/* c d d d g h h h */
|
||||||
|
y9 = _mm256_permute_ps(y4, 0x01);
|
||||||
|
y10 = _mm256_permute_ps(y4, 0x5A);
|
||||||
|
y11 = _mm256_permute_ps(y4, 0xBF);
|
||||||
|
|
||||||
|
/*
|
||||||
|
dest[0][0] = f * t[0] - g * t[1] + h * t[2];
|
||||||
|
dest[1][0] =-(e * t[0] - g * t[3] + h * t[4]);
|
||||||
|
dest[2][0] = e * t[1] - f * t[3] + h * t[5];
|
||||||
|
dest[3][0] =-(e * t[2] - f * t[4] + g * t[5]);
|
||||||
|
|
||||||
|
dest[0][1] =-(b * t[0] - c * t[1] + d * t[2]);
|
||||||
|
dest[1][1] = a * t[0] - c * t[3] + d * t[4];
|
||||||
|
dest[2][1] =-(a * t[1] - b * t[3] + d * t[5]);
|
||||||
|
dest[3][1] = a * t[2] - b * t[4] + c * t[5];
|
||||||
|
*/
|
||||||
|
r1 = _mm256_xor_ps(_mm256_add_ps(_mm256_sub_ps(_mm256_mul_ps(y9, t0),
|
||||||
|
_mm256_mul_ps(y10, t1)),
|
||||||
|
_mm256_mul_ps(y11, t2)),
|
||||||
|
flpsign);
|
||||||
|
|
||||||
|
/* d c b a d c b a */
|
||||||
|
y2 = _mm256_permute2f128_ps(y0, y0, 0x0);
|
||||||
|
|
||||||
|
/* a a a b a a a b */
|
||||||
|
/* b b c c b b c c */
|
||||||
|
/* c d d d c d d d */
|
||||||
|
y3 = _mm256_permutevar_ps(y2, _mm256_set_epi32(0, 0, 0, 1, 0, 0, 0, 1));
|
||||||
|
y4 = _mm256_permutevar_ps(y2, _mm256_set_epi32(1, 1, 2, 2, 1, 1, 2, 2));
|
||||||
|
y5 = _mm256_permutevar_ps(y2, _mm256_set_epi32(2, 3, 3, 3, 2, 3, 3, 3));
|
||||||
|
|
||||||
|
/* t2[3] t2[2] t2[1] t2[0] t1[3] t1[2] t1[1] t1[0] */
|
||||||
|
/* t2[5] t2[5] t2[5] t2[4] t1[5] t1[5] t1[5] t1[4] */
|
||||||
|
y6 = _mm256_permute2f128_ps(yt1, yt2, 0x20);
|
||||||
|
y7 = _mm256_permute2f128_ps(yt1, yt2, 0x31);
|
||||||
|
|
||||||
|
/* t2[2] t2[1] t2[0] t2[0] t1[2] t1[1] t1[0] t1[0] */
|
||||||
|
t0 = _mm256_permutevar_ps(y6, yi1);
|
||||||
|
|
||||||
|
/* t1[4] t1[3] t1[3] t1[1] t1[4] t1[3] t1[3] t1[1] */
|
||||||
|
|
||||||
|
/* t1[4] t1[3] t1[3] t1[1] t1[4] t1[3] t1[3] t1[1] */
|
||||||
|
y11 = _mm256_shuffle_ps(y6, y7, 0x4D);
|
||||||
|
t1 = _mm256_permutevar_ps(y11, yi2);
|
||||||
|
|
||||||
|
|
||||||
|
/* t2[5] t2[5] t2[4] t2[2] t1[5] t1[5] t1[4] t1[2] */
|
||||||
|
y11 = _mm256_shuffle_ps(y6, y7, 0x4A);
|
||||||
|
t2 = _mm256_permutevar_ps(y11, yi3);
|
||||||
|
|
||||||
|
/*
|
||||||
|
dest[0][2] = b * t1[0] - c * t1[1] + d * t1[2];
|
||||||
|
dest[1][2] =-(a * t1[0] - c * t1[3] + d * t1[4]);
|
||||||
|
dest[2][2] = a * t1[1] - b * t1[3] + d * t1[5];
|
||||||
|
dest[3][2] =-(a * t1[2] - b * t1[4] + c * t1[5]);
|
||||||
|
|
||||||
|
dest[0][3] =-(b * t2[0] - c * t2[1] + d * t2[2]);
|
||||||
|
dest[1][3] = a * t2[0] - c * t2[3] + d * t2[4];
|
||||||
|
dest[2][3] =-(a * t2[1] - b * t2[3] + d * t2[5]);
|
||||||
|
dest[3][3] = a * t2[2] - b * t2[4] + c * t2[5];
|
||||||
|
*/
|
||||||
|
r2 = _mm256_xor_ps(_mm256_add_ps(_mm256_sub_ps(_mm256_mul_ps(y3, t0),
|
||||||
|
_mm256_mul_ps(y4, t1)),
|
||||||
|
_mm256_mul_ps(y5, t2)),
|
||||||
|
flpsign);
|
||||||
|
|
||||||
|
/* determinant */
|
||||||
|
|
||||||
|
y4 = _mm256_mul_ps(y0, r1);
|
||||||
|
y4 = _mm256_permute2f128_ps(y4, y4, 0x30);
|
||||||
|
y4 = _mm256_dp_ps(y0, r1, 0xff);
|
||||||
|
|
||||||
|
y5 = _mm256_div_ps(_mm256_set1_ps(1.0f), y4);
|
||||||
|
r1 = _mm256_mul_ps(r1, y5);
|
||||||
|
r2 = _mm256_mul_ps(r2, y5);
|
||||||
|
|
||||||
|
/* transpose */
|
||||||
|
|
||||||
|
/* d c b a h g f e */
|
||||||
|
/* l k j i p o n m */
|
||||||
|
y0 = _mm256_permute2f128_ps(r1, r1, 0x03);
|
||||||
|
y1 = _mm256_permute2f128_ps(r2, r2, 0x03);
|
||||||
|
|
||||||
|
/* b a f e f e b a */
|
||||||
|
/* j i n m n m j i */
|
||||||
|
/* i m a e m i e a */
|
||||||
|
/* j n b f n j f b */
|
||||||
|
/* n j f b m i e a */
|
||||||
|
y2 = _mm256_shuffle_ps(r1, y0, 0x44);
|
||||||
|
y3 = _mm256_shuffle_ps(r2, y1, 0x44);
|
||||||
|
y4 = _mm256_shuffle_ps(y2, y3, 0x88);
|
||||||
|
y5 = _mm256_shuffle_ps(y2, y3, 0xDD);
|
||||||
|
y6 = _mm256_permute2f128_ps(y4, y5, 0x20);
|
||||||
|
|
||||||
|
/* d c h g h g d c */
|
||||||
|
/* l k p o p o l k */
|
||||||
|
/* k o c g o k g c */
|
||||||
|
/* l p d h p l h d */
|
||||||
|
/* p l h d o k g c */
|
||||||
|
y2 = _mm256_shuffle_ps(r1, y0, 0xEE);
|
||||||
|
y3 = _mm256_shuffle_ps(r2, y1, 0xEE);
|
||||||
|
y4 = _mm256_shuffle_ps(y2, y3, 0x88);
|
||||||
|
y5 = _mm256_shuffle_ps(y2, y3, 0xDD);
|
||||||
|
y7 = _mm256_permute2f128_ps(y4, y5, 0x20);
|
||||||
|
|
||||||
|
glmm_store256(dest[0], y6);
|
||||||
|
glmm_store256(dest[2], y7);
|
||||||
|
}
|
||||||
|
|
||||||
|
CGLM_INLINE
|
||||||
|
void
|
||||||
|
glm_mat4_inv_fast_avx(mat4 mat, mat4 dest) {
|
||||||
|
__m256 y0, y1, y2, y3, y4, y5, y6, y7, y8, y9, y10, y11, y12, y13;
|
||||||
|
__m256 yt0, yt1, yt2;
|
||||||
|
__m256 t0, t1, t2;
|
||||||
|
__m256 r1, r2;
|
||||||
|
__m256 flpsign;
|
||||||
|
__m256i yi1, yi2, yi3;
|
||||||
|
|
||||||
|
y0 = glmm_load256(mat[0]); /* h g f e d c b a */
|
||||||
|
y1 = glmm_load256(mat[2]); /* p o n m l k j i */
|
||||||
|
|
||||||
|
y2 = _mm256_permute2f128_ps(y1, y1, 0x00); /* l k j i l k j i */
|
||||||
|
y3 = _mm256_permute2f128_ps(y1, y1, 0x11); /* p o n m p o n m */
|
||||||
|
y4 = _mm256_permute2f128_ps(y0, y0, 0x03); /* d c b a h g f e */
|
||||||
|
y13 = _mm256_permute2f128_ps(y4, y4, 0x00); /* h g f e h g f e */
|
||||||
|
|
||||||
|
yi1 = _mm256_set_epi32(0, 0, 0, 0, 0, 1, 1, 2);
|
||||||
|
yi2 = _mm256_set_epi32(1, 1, 1, 2, 3, 2, 3, 3);
|
||||||
|
flpsign = _mm256_set_ps(0.f, -0.f, 0.f, -0.f, -0.f, 0.f, -0.f, 0.f);
|
||||||
|
|
||||||
|
/* i i i i i j j k */
|
||||||
|
/* n n n o p o p p */
|
||||||
|
/* m m m m m n n o */
|
||||||
|
/* j j j k l k l l */
|
||||||
|
/* e e e e e f f g */
|
||||||
|
/* f f f g h g h h */
|
||||||
|
y5 = _mm256_permutevar_ps(y2, yi1);
|
||||||
|
y6 = _mm256_permutevar_ps(y3, yi2);
|
||||||
|
y7 = _mm256_permutevar_ps(y3, yi1);
|
||||||
|
y8 = _mm256_permutevar_ps(y2, yi2);
|
||||||
|
y2 = _mm256_permutevar_ps(y13, yi1);
|
||||||
|
y3 = _mm256_permutevar_ps(y13, yi2);
|
||||||
|
|
||||||
|
yi1 = _mm256_set_epi32(2, 1, 0, 0, 2, 1, 0, 0);
|
||||||
|
yi2 = _mm256_set_epi32(2, 1, 1, 0, 2, 1, 1, 0);
|
||||||
|
yi3 = _mm256_set_epi32(3, 3, 2, 0, 3, 3, 2, 0);
|
||||||
|
|
||||||
|
/*
|
||||||
|
t0[0] = k * p - o * l; t1[0] = g * p - o * h; t2[0] = g * l - k * h;
|
||||||
|
t0[1] = j * p - n * l; t1[1] = f * p - n * h; t2[1] = f * l - j * h;
|
||||||
|
t0[2] = j * o - n * k; t1[2] = f * o - n * g; t2[2] = f * k - j * g;
|
||||||
|
t0[3] = i * p - m * l; t1[3] = e * p - m * h; t2[3] = e * l - i * h;
|
||||||
|
t0[4] = i * o - m * k; t1[4] = e * o - m * g; t2[4] = e * k - i * g;
|
||||||
|
t0[5] = i * n - m * j; t1[5] = e * n - m * f; t2[5] = e * j - i * f;
|
||||||
|
*/
|
||||||
|
yt0 = _mm256_sub_ps(_mm256_mul_ps(y5, y6), _mm256_mul_ps(y7, y8));
|
||||||
|
yt1 = _mm256_sub_ps(_mm256_mul_ps(y2, y6), _mm256_mul_ps(y7, y3));
|
||||||
|
yt2 = _mm256_sub_ps(_mm256_mul_ps(y2, y8), _mm256_mul_ps(y5, y3));
|
||||||
|
|
||||||
|
/* t3 t2 t1 t0 t3 t2 t1 t0 */
|
||||||
|
/* t5 t5 t5 t4 t5 t5 t5 t4 */
|
||||||
|
y9 = _mm256_permute2f128_ps(yt0, yt0, 0x00);
|
||||||
|
y10 = _mm256_permute2f128_ps(yt0, yt0, 0x11);
|
||||||
|
|
||||||
|
/* t2 t1 t0 t0 t2 t1 t0 t0 */
|
||||||
|
t0 = _mm256_permutevar_ps(y9, yi1);
|
||||||
|
|
||||||
|
/* t4 t3 t3 t1 t4 t3 t3 t1 */
|
||||||
|
y11 = _mm256_shuffle_ps(y9, y10, 0x4D);
|
||||||
|
y12 = _mm256_permutevar_ps(y11, yi2);
|
||||||
|
t1 = _mm256_permute2f128_ps(y12, y9, 0x00);
|
||||||
|
|
||||||
|
/* t5 t5 t4 t2 t5 t5 t4 t2 */
|
||||||
|
y11 = _mm256_shuffle_ps(y9, y10, 0x4A);
|
||||||
|
y12 = _mm256_permutevar_ps(y11, yi3);
|
||||||
|
t2 = _mm256_permute2f128_ps(y12, y12, 0x00);
|
||||||
|
|
||||||
|
/* a a a b e e e f */
|
||||||
|
/* b b c c f f g g */
|
||||||
|
/* c d d d g h h h */
|
||||||
|
y9 = _mm256_permute_ps(y4, 0x01);
|
||||||
|
y10 = _mm256_permute_ps(y4, 0x5A);
|
||||||
|
y11 = _mm256_permute_ps(y4, 0xBF);
|
||||||
|
|
||||||
|
/*
|
||||||
|
dest[0][0] = f * t[0] - g * t[1] + h * t[2];
|
||||||
|
dest[1][0] =-(e * t[0] - g * t[3] + h * t[4]);
|
||||||
|
dest[2][0] = e * t[1] - f * t[3] + h * t[5];
|
||||||
|
dest[3][0] =-(e * t[2] - f * t[4] + g * t[5]);
|
||||||
|
|
||||||
|
dest[0][1] =-(b * t[0] - c * t[1] + d * t[2]);
|
||||||
|
dest[1][1] = a * t[0] - c * t[3] + d * t[4];
|
||||||
|
dest[2][1] =-(a * t[1] - b * t[3] + d * t[5]);
|
||||||
|
dest[3][1] = a * t[2] - b * t[4] + c * t[5];
|
||||||
|
*/
|
||||||
|
r1 = _mm256_xor_ps(_mm256_add_ps(_mm256_sub_ps(_mm256_mul_ps(y9, t0),
|
||||||
|
_mm256_mul_ps(y10, t1)),
|
||||||
|
_mm256_mul_ps(y11, t2)),
|
||||||
|
flpsign);
|
||||||
|
|
||||||
|
/* d c b a d c b a */
|
||||||
|
y2 = _mm256_permute2f128_ps(y0, y0, 0x0);
|
||||||
|
|
||||||
|
/* a a a b a a a b */
|
||||||
|
/* b b c c b b c c */
|
||||||
|
/* c d d d c d d d */
|
||||||
|
y3 = _mm256_permutevar_ps(y2, _mm256_set_epi32(0, 0, 0, 1, 0, 0, 0, 1));
|
||||||
|
y4 = _mm256_permutevar_ps(y2, _mm256_set_epi32(1, 1, 2, 2, 1, 1, 2, 2));
|
||||||
|
y5 = _mm256_permutevar_ps(y2, _mm256_set_epi32(2, 3, 3, 3, 2, 3, 3, 3));
|
||||||
|
|
||||||
|
/* t2[3] t2[2] t2[1] t2[0] t1[3] t1[2] t1[1] t1[0] */
|
||||||
|
/* t2[5] t2[5] t2[5] t2[4] t1[5] t1[5] t1[5] t1[4] */
|
||||||
|
y6 = _mm256_permute2f128_ps(yt1, yt2, 0x20);
|
||||||
|
y7 = _mm256_permute2f128_ps(yt1, yt2, 0x31);
|
||||||
|
|
||||||
|
/* t2[2] t2[1] t2[0] t2[0] t1[2] t1[1] t1[0] t1[0] */
|
||||||
|
t0 = _mm256_permutevar_ps(y6, yi1);
|
||||||
|
|
||||||
|
/* t1[4] t1[3] t1[3] t1[1] t1[4] t1[3] t1[3] t1[1] */
|
||||||
|
|
||||||
|
/* t1[4] t1[3] t1[3] t1[1] t1[4] t1[3] t1[3] t1[1] */
|
||||||
|
y11 = _mm256_shuffle_ps(y6, y7, 0x4D);
|
||||||
|
t1 = _mm256_permutevar_ps(y11, yi2);
|
||||||
|
|
||||||
|
|
||||||
|
/* t2[5] t2[5] t2[4] t2[2] t1[5] t1[5] t1[4] t1[2] */
|
||||||
|
y11 = _mm256_shuffle_ps(y6, y7, 0x4A);
|
||||||
|
t2 = _mm256_permutevar_ps(y11, yi3);
|
||||||
|
|
||||||
|
/*
|
||||||
|
dest[0][2] = b * t1[0] - c * t1[1] + d * t1[2];
|
||||||
|
dest[1][2] =-(a * t1[0] - c * t1[3] + d * t1[4]);
|
||||||
|
dest[2][2] = a * t1[1] - b * t1[3] + d * t1[5];
|
||||||
|
dest[3][2] =-(a * t1[2] - b * t1[4] + c * t1[5]);
|
||||||
|
|
||||||
|
dest[0][3] =-(b * t2[0] - c * t2[1] + d * t2[2]);
|
||||||
|
dest[1][3] = a * t2[0] - c * t2[3] + d * t2[4];
|
||||||
|
dest[2][3] =-(a * t2[1] - b * t2[3] + d * t2[5]);
|
||||||
|
dest[3][3] = a * t2[2] - b * t2[4] + c * t2[5];
|
||||||
|
*/
|
||||||
|
r2 = _mm256_xor_ps(_mm256_add_ps(_mm256_sub_ps(_mm256_mul_ps(y3, t0),
|
||||||
|
_mm256_mul_ps(y4, t1)),
|
||||||
|
_mm256_mul_ps(y5, t2)),
|
||||||
|
flpsign);
|
||||||
|
|
||||||
|
/* determinant */
|
||||||
|
|
||||||
|
y4 = _mm256_mul_ps(y0, r1);
|
||||||
|
y4 = _mm256_permute2f128_ps(y4, y4, 0x30);
|
||||||
|
y4 = _mm256_dp_ps(y0, r1, 0xff);
|
||||||
|
|
||||||
|
y5 = _mm256_rcp_ps(y4);
|
||||||
|
r1 = _mm256_mul_ps(r1, y5);
|
||||||
|
r2 = _mm256_mul_ps(r2, y5);
|
||||||
|
|
||||||
|
/* transpose */
|
||||||
|
|
||||||
|
/* d c b a h g f e */
|
||||||
|
/* l k j i p o n m */
|
||||||
|
y0 = _mm256_permute2f128_ps(r1, r1, 0x03);
|
||||||
|
y1 = _mm256_permute2f128_ps(r2, r2, 0x03);
|
||||||
|
|
||||||
|
/* b a f e f e b a */
|
||||||
|
/* j i n m n m j i */
|
||||||
|
/* i m a e m i e a */
|
||||||
|
/* j n b f n j f b */
|
||||||
|
/* n j f b m i e a */
|
||||||
|
y2 = _mm256_shuffle_ps(r1, y0, 0x44);
|
||||||
|
y3 = _mm256_shuffle_ps(r2, y1, 0x44);
|
||||||
|
y4 = _mm256_shuffle_ps(y2, y3, 0x88);
|
||||||
|
y5 = _mm256_shuffle_ps(y2, y3, 0xDD);
|
||||||
|
y6 = _mm256_permute2f128_ps(y4, y5, 0x20);
|
||||||
|
|
||||||
|
/* d c h g h g d c */
|
||||||
|
/* l k p o p o l k */
|
||||||
|
/* k o c g o k g c */
|
||||||
|
/* l p d h p l h d */
|
||||||
|
/* p l h d o k g c */
|
||||||
|
y2 = _mm256_shuffle_ps(r1, y0, 0xEE);
|
||||||
|
y3 = _mm256_shuffle_ps(r2, y1, 0xEE);
|
||||||
|
y4 = _mm256_shuffle_ps(y2, y3, 0x88);
|
||||||
|
y5 = _mm256_shuffle_ps(y2, y3, 0xDD);
|
||||||
|
y7 = _mm256_permute2f128_ps(y4, y5, 0x20);
|
||||||
|
|
||||||
|
glmm_store256(dest[0], y6);
|
||||||
|
glmm_store256(dest[2], y7);
|
||||||
|
}
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
#endif /* cglm_mat_simd_avx_h */
|
#endif /* cglm_mat_simd_avx_h */
|
||||||
|
|||||||
@@ -27,64 +27,90 @@
|
|||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
# include <xmmintrin.h>
|
# include <xmmintrin.h>
|
||||||
# include <emmintrin.h>
|
# include <emmintrin.h>
|
||||||
|
|
||||||
|
/* OPTIONAL: You may save some instructions but latency (not sure) */
|
||||||
|
#ifdef CGLM_USE_INT_DOMAIN
|
||||||
|
# define glmm_shuff1(xmm, z, y, x, w) \
|
||||||
|
_mm_castsi128_ps(_mm_shuffle_epi32(_mm_castps_si128(xmm), \
|
||||||
|
_MM_SHUFFLE(z, y, x, w)))
|
||||||
|
#else
|
||||||
|
# define glmm_shuff1(xmm, z, y, x, w) \
|
||||||
|
_mm_shuffle_ps(xmm, xmm, _MM_SHUFFLE(z, y, x, w))
|
||||||
|
#endif
|
||||||
|
|
||||||
|
#define glmm_shuff1x(xmm, x) glmm_shuff1(xmm, x, x, x, x)
|
||||||
|
#define glmm_shuff2(a, b, z0, y0, x0, w0, z1, y1, x1, w1) \
|
||||||
|
glmm_shuff1(_mm_shuffle_ps(a, b, _MM_SHUFFLE(z0, y0, x0, w0)), \
|
||||||
|
z1, y1, x1, w1)
|
||||||
|
|
||||||
|
static inline
|
||||||
|
__m128
|
||||||
|
glmm_dot(__m128 a, __m128 b) {
|
||||||
|
__m128 x0;
|
||||||
|
x0 = _mm_mul_ps(a, b);
|
||||||
|
x0 = _mm_add_ps(x0, glmm_shuff1(x0, 1, 0, 3, 2));
|
||||||
|
return _mm_add_ps(x0, glmm_shuff1(x0, 0, 1, 0, 1));
|
||||||
|
}
|
||||||
|
|
||||||
|
static inline
|
||||||
|
__m128
|
||||||
|
glmm_norm(__m128 a) {
|
||||||
|
return _mm_sqrt_ps(glmm_dot(a, a));
|
||||||
|
}
|
||||||
|
|
||||||
|
static inline
|
||||||
|
__m128
|
||||||
|
glmm_load3(float v[3]) {
|
||||||
|
__m128i xy;
|
||||||
|
__m128 z;
|
||||||
|
|
||||||
|
xy = _mm_loadl_epi64((const __m128i *)v);
|
||||||
|
z = _mm_load_ss(&v[2]);
|
||||||
|
|
||||||
|
return _mm_movelh_ps(_mm_castsi128_ps(xy), z);
|
||||||
|
}
|
||||||
|
|
||||||
|
static inline
|
||||||
|
void
|
||||||
|
glmm_store3(__m128 vx, float v[3]) {
|
||||||
|
_mm_storel_pi((__m64 *)&v[0], vx);
|
||||||
|
_mm_store_ss(&v[2], glmm_shuff1(vx, 2, 2, 2, 2));
|
||||||
|
}
|
||||||
|
|
||||||
|
#ifdef CGLM_ALL_UNALIGNED
|
||||||
|
# define glmm_load(p) _mm_loadu_ps(p)
|
||||||
|
# define glmm_store(p, a) _mm_storeu_ps(p, a)
|
||||||
|
#else
|
||||||
|
# define glmm_load(p) _mm_load_ps(p)
|
||||||
|
# define glmm_store(p, a) _mm_store_ps(p, a)
|
||||||
|
#endif
|
||||||
|
|
||||||
|
#endif
|
||||||
|
|
||||||
|
/* x86, x64 */
|
||||||
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
# define CGLM_SSE_FP 1
|
# define CGLM_SSE_FP 1
|
||||||
# ifndef CGLM_SIMD_x86
|
|
||||||
# define CGLM_SIMD_x86
|
|
||||||
# endif
|
|
||||||
#endif
|
|
||||||
|
|
||||||
#if defined(__SSE3__)
|
|
||||||
# include <x86intrin.h>
|
|
||||||
# ifndef CGLM_SIMD_x86
|
|
||||||
# define CGLM_SIMD_x86
|
|
||||||
# endif
|
|
||||||
#endif
|
|
||||||
|
|
||||||
#if defined(__SSE4_1__)
|
|
||||||
# include <smmintrin.h>
|
|
||||||
# ifndef CGLM_SIMD_x86
|
|
||||||
# define CGLM_SIMD_x86
|
|
||||||
# endif
|
|
||||||
#endif
|
|
||||||
|
|
||||||
#if defined(__SSE4_2__)
|
|
||||||
# include <nmmintrin.h>
|
|
||||||
# ifndef CGLM_SIMD_x86
|
|
||||||
# define CGLM_SIMD_x86
|
|
||||||
# endif
|
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
#ifdef __AVX__
|
#ifdef __AVX__
|
||||||
# include <immintrin.h>
|
|
||||||
# define CGLM_AVX_FP 1
|
# define CGLM_AVX_FP 1
|
||||||
# ifndef CGLM_SIMD_x86
|
|
||||||
# define CGLM_SIMD_x86
|
#ifdef CGLM_ALL_UNALIGNED
|
||||||
# endif
|
# define glmm_load256(p) _mm256_loadu_ps(p)
|
||||||
|
# define glmm_store256(p, a) _mm256_storeu_ps(p, a)
|
||||||
|
#else
|
||||||
|
# define glmm_load256(p) _mm256_load_ps(p)
|
||||||
|
# define glmm_store256(p, a) _mm256_store_ps(p, a)
|
||||||
|
#endif
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
/* ARM Neon */
|
/* ARM Neon */
|
||||||
#if defined(__ARM_NEON)
|
#if defined(__ARM_NEON) && defined(__ARM_NEON_FP)
|
||||||
# include <arm_neon.h>
|
# include <arm_neon.h>
|
||||||
# if defined(__ARM_NEON_FP)
|
|
||||||
# define CGLM_NEON_FP 1
|
# define CGLM_NEON_FP 1
|
||||||
# ifndef CGLM_SIMD_ARM
|
#else
|
||||||
# define CGLM_SIMD_ARM
|
# undef CGLM_NEON_FP
|
||||||
# endif
|
|
||||||
# endif
|
|
||||||
#endif
|
|
||||||
|
|
||||||
#if defined(CGLM_SIMD_x86) || defined(CGLM_NEON_FP)
|
|
||||||
# ifndef CGLM_SIMD
|
|
||||||
# define CGLM_SIMD
|
|
||||||
# endif
|
|
||||||
#endif
|
|
||||||
|
|
||||||
#if defined(CGLM_SIMD_x86)
|
|
||||||
# include "x86.h"
|
|
||||||
#endif
|
|
||||||
|
|
||||||
#if defined(CGLM_SIMD_ARM)
|
|
||||||
# include "arm.h"
|
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
#endif /* cglm_intrin_h */
|
#endif /* cglm_intrin_h */
|
||||||
|
|||||||
@@ -1,136 +0,0 @@
|
|||||||
/*
|
|
||||||
* Copyright (c), Recep Aslantas.
|
|
||||||
*
|
|
||||||
* MIT License (MIT), http://opensource.org/licenses/MIT
|
|
||||||
* Full license can be found in the LICENSE file
|
|
||||||
*/
|
|
||||||
|
|
||||||
#ifndef cglm_simd_x86_h
|
|
||||||
#define cglm_simd_x86_h
|
|
||||||
#include "intrin.h"
|
|
||||||
#ifdef CGLM_SIMD_x86
|
|
||||||
|
|
||||||
#ifdef CGLM_ALL_UNALIGNED
|
|
||||||
# define glmm_load(p) _mm_loadu_ps(p)
|
|
||||||
# define glmm_store(p, a) _mm_storeu_ps(p, a)
|
|
||||||
#else
|
|
||||||
# define glmm_load(p) _mm_load_ps(p)
|
|
||||||
# define glmm_store(p, a) _mm_store_ps(p, a)
|
|
||||||
#endif
|
|
||||||
|
|
||||||
#ifdef CGLM_USE_INT_DOMAIN
|
|
||||||
# define glmm_shuff1(xmm, z, y, x, w) \
|
|
||||||
_mm_castsi128_ps(_mm_shuffle_epi32(_mm_castps_si128(xmm), \
|
|
||||||
_MM_SHUFFLE(z, y, x, w)))
|
|
||||||
#else
|
|
||||||
# define glmm_shuff1(xmm, z, y, x, w) \
|
|
||||||
_mm_shuffle_ps(xmm, xmm, _MM_SHUFFLE(z, y, x, w))
|
|
||||||
#endif
|
|
||||||
|
|
||||||
#define glmm_shuff1x(xmm, x) glmm_shuff1(xmm, x, x, x, x)
|
|
||||||
#define glmm_shuff2(a, b, z0, y0, x0, w0, z1, y1, x1, w1) \
|
|
||||||
glmm_shuff1(_mm_shuffle_ps(a, b, _MM_SHUFFLE(z0, y0, x0, w0)), \
|
|
||||||
z1, y1, x1, w1)
|
|
||||||
|
|
||||||
#ifdef __AVX__
|
|
||||||
# ifdef CGLM_ALL_UNALIGNED
|
|
||||||
# define glmm_load256(p) _mm256_loadu_ps(p)
|
|
||||||
# define glmm_store256(p, a) _mm256_storeu_ps(p, a)
|
|
||||||
# else
|
|
||||||
# define glmm_load256(p) _mm256_load_ps(p)
|
|
||||||
# define glmm_store256(p, a) _mm256_store_ps(p, a)
|
|
||||||
# endif
|
|
||||||
#endif
|
|
||||||
|
|
||||||
static inline
|
|
||||||
__m128
|
|
||||||
glmm_vhadds(__m128 v) {
|
|
||||||
#if defined(__SSE3__)
|
|
||||||
__m128 shuf, sums;
|
|
||||||
shuf = _mm_movehdup_ps(v);
|
|
||||||
sums = _mm_add_ps(v, shuf);
|
|
||||||
shuf = _mm_movehl_ps(shuf, sums);
|
|
||||||
sums = _mm_add_ss(sums, shuf);
|
|
||||||
return sums;
|
|
||||||
#else
|
|
||||||
__m128 shuf, sums;
|
|
||||||
shuf = glmm_shuff1(v, 2, 3, 0, 1);
|
|
||||||
sums = _mm_add_ps(v, shuf);
|
|
||||||
shuf = _mm_movehl_ps(shuf, sums);
|
|
||||||
sums = _mm_add_ss(sums, shuf);
|
|
||||||
return sums;
|
|
||||||
#endif
|
|
||||||
}
|
|
||||||
|
|
||||||
static inline
|
|
||||||
float
|
|
||||||
glmm_hadd(__m128 v) {
|
|
||||||
return _mm_cvtss_f32(glmm_vhadds(v));
|
|
||||||
}
|
|
||||||
|
|
||||||
static inline
|
|
||||||
__m128
|
|
||||||
glmm_vdots(__m128 a, __m128 b) {
|
|
||||||
#if (defined(__SSE4_1__) || defined(__SSE4_2__)) && defined(CGLM_SSE4_DOT)
|
|
||||||
return _mm_dp_ps(a, b, 0xFF);
|
|
||||||
#elif defined(__SSE3__) && defined(CGLM_SSE3_DOT)
|
|
||||||
__m128 x0, x1;
|
|
||||||
x0 = _mm_mul_ps(a, b);
|
|
||||||
x1 = _mm_hadd_ps(x0, x0);
|
|
||||||
return _mm_hadd_ps(x1, x1);
|
|
||||||
#else
|
|
||||||
return glmm_vhadds(_mm_mul_ps(a, b));
|
|
||||||
#endif
|
|
||||||
}
|
|
||||||
|
|
||||||
static inline
|
|
||||||
__m128
|
|
||||||
glmm_vdot(__m128 a, __m128 b) {
|
|
||||||
#if (defined(__SSE4_1__) || defined(__SSE4_2__)) && defined(CGLM_SSE4_DOT)
|
|
||||||
return _mm_dp_ps(a, b, 0xFF);
|
|
||||||
#elif defined(__SSE3__) && defined(CGLM_SSE3_DOT)
|
|
||||||
__m128 x0, x1;
|
|
||||||
x0 = _mm_mul_ps(a, b);
|
|
||||||
x1 = _mm_hadd_ps(x0, x0);
|
|
||||||
return _mm_hadd_ps(x1, x1);
|
|
||||||
#else
|
|
||||||
__m128 x0;
|
|
||||||
x0 = _mm_mul_ps(a, b);
|
|
||||||
x0 = _mm_add_ps(x0, glmm_shuff1(x0, 1, 0, 3, 2));
|
|
||||||
return _mm_add_ps(x0, glmm_shuff1(x0, 0, 1, 0, 1));
|
|
||||||
#endif
|
|
||||||
}
|
|
||||||
|
|
||||||
static inline
|
|
||||||
float
|
|
||||||
glmm_dot(__m128 a, __m128 b) {
|
|
||||||
return _mm_cvtss_f32(glmm_vdots(a, b));
|
|
||||||
}
|
|
||||||
|
|
||||||
static inline
|
|
||||||
float
|
|
||||||
glmm_norm(__m128 a) {
|
|
||||||
return _mm_cvtss_f32(_mm_sqrt_ss(glmm_vhadds(_mm_mul_ps(a, a))));
|
|
||||||
}
|
|
||||||
|
|
||||||
static inline
|
|
||||||
__m128
|
|
||||||
glmm_load3(float v[3]) {
|
|
||||||
__m128i xy;
|
|
||||||
__m128 z;
|
|
||||||
|
|
||||||
xy = _mm_loadl_epi64((const __m128i *)v);
|
|
||||||
z = _mm_load_ss(&v[2]);
|
|
||||||
|
|
||||||
return _mm_movelh_ps(_mm_castsi128_ps(xy), z);
|
|
||||||
}
|
|
||||||
|
|
||||||
static inline
|
|
||||||
void
|
|
||||||
glmm_store3(__m128 vx, float v[3]) {
|
|
||||||
_mm_storel_pi((__m64 *)&v[0], vx);
|
|
||||||
_mm_store_ss(&v[2], glmm_shuff1(vx, 2, 2, 2, 2));
|
|
||||||
}
|
|
||||||
|
|
||||||
#endif
|
|
||||||
#endif /* cglm_simd_x86_h */
|
|
||||||
@@ -122,8 +122,6 @@ void
|
|||||||
glm_vec4_copy(vec4 v, vec4 dest) {
|
glm_vec4_copy(vec4 v, vec4 dest) {
|
||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
glmm_store(dest, glmm_load(v));
|
glmm_store(dest, glmm_load(v));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(dest, vld1q_f32(v));
|
|
||||||
#else
|
#else
|
||||||
dest[0] = v[0];
|
dest[0] = v[0];
|
||||||
dest[1] = v[1];
|
dest[1] = v[1];
|
||||||
@@ -159,8 +157,6 @@ void
|
|||||||
glm_vec4_zero(vec4 v) {
|
glm_vec4_zero(vec4 v) {
|
||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
glmm_store(v, _mm_setzero_ps());
|
glmm_store(v, _mm_setzero_ps());
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(v, vdupq_n_f32(0.0f));
|
|
||||||
#else
|
#else
|
||||||
v[0] = 0.0f;
|
v[0] = 0.0f;
|
||||||
v[1] = 0.0f;
|
v[1] = 0.0f;
|
||||||
@@ -179,8 +175,6 @@ void
|
|||||||
glm_vec4_one(vec4 v) {
|
glm_vec4_one(vec4 v) {
|
||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
glmm_store(v, _mm_set1_ps(1.0f));
|
glmm_store(v, _mm_set1_ps(1.0f));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(v, vdupq_n_f32(1.0f));
|
|
||||||
#else
|
#else
|
||||||
v[0] = 1.0f;
|
v[0] = 1.0f;
|
||||||
v[1] = 1.0f;
|
v[1] = 1.0f;
|
||||||
@@ -200,8 +194,11 @@ glm_vec4_one(vec4 v) {
|
|||||||
CGLM_INLINE
|
CGLM_INLINE
|
||||||
float
|
float
|
||||||
glm_vec4_dot(vec4 a, vec4 b) {
|
glm_vec4_dot(vec4 a, vec4 b) {
|
||||||
#if defined(CGLM_SIMD)
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
return glmm_dot(glmm_load(a), glmm_load(b));
|
__m128 x0;
|
||||||
|
x0 = _mm_mul_ps(glmm_load(a), glmm_load(b));
|
||||||
|
x0 = _mm_add_ps(x0, glmm_shuff1(x0, 1, 0, 3, 2));
|
||||||
|
return _mm_cvtss_f32(_mm_add_ss(x0, glmm_shuff1(x0, 0, 1, 0, 1)));
|
||||||
#else
|
#else
|
||||||
return a[0] * b[0] + a[1] * b[1] + a[2] * b[2] + a[3] * b[3];
|
return a[0] * b[0] + a[1] * b[1] + a[2] * b[2] + a[3] * b[3];
|
||||||
#endif
|
#endif
|
||||||
@@ -221,7 +218,15 @@ glm_vec4_dot(vec4 a, vec4 b) {
|
|||||||
CGLM_INLINE
|
CGLM_INLINE
|
||||||
float
|
float
|
||||||
glm_vec4_norm2(vec4 v) {
|
glm_vec4_norm2(vec4 v) {
|
||||||
return glm_vec4_dot(v, v);
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
|
__m128 x0;
|
||||||
|
x0 = glmm_load(v);
|
||||||
|
x0 = _mm_mul_ps(x0, x0);
|
||||||
|
x0 = _mm_add_ps(x0, glmm_shuff1(x0, 1, 0, 3, 2));
|
||||||
|
return _mm_cvtss_f32(_mm_add_ss(x0, glmm_shuff1(x0, 0, 1, 0, 1)));
|
||||||
|
#else
|
||||||
|
return v[0] * v[0] + v[1] * v[1] + v[2] * v[2] + v[3] * v[3];
|
||||||
|
#endif
|
||||||
}
|
}
|
||||||
|
|
||||||
/*!
|
/*!
|
||||||
@@ -234,10 +239,12 @@ glm_vec4_norm2(vec4 v) {
|
|||||||
CGLM_INLINE
|
CGLM_INLINE
|
||||||
float
|
float
|
||||||
glm_vec4_norm(vec4 v) {
|
glm_vec4_norm(vec4 v) {
|
||||||
#if defined(CGLM_SIMD)
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
return glmm_norm(glmm_load(v));
|
__m128 x0;
|
||||||
|
x0 = glmm_load(v);
|
||||||
|
return _mm_cvtss_f32(_mm_sqrt_ss(glmm_dot(x0, x0)));
|
||||||
#else
|
#else
|
||||||
return sqrtf(glm_vec4_dot(v, v));
|
return sqrtf(glm_vec4_norm2(v));
|
||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -253,8 +260,6 @@ void
|
|||||||
glm_vec4_add(vec4 a, vec4 b, vec4 dest) {
|
glm_vec4_add(vec4 a, vec4 b, vec4 dest) {
|
||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
glmm_store(dest, _mm_add_ps(glmm_load(a), glmm_load(b)));
|
glmm_store(dest, _mm_add_ps(glmm_load(a), glmm_load(b)));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(dest, vaddq_f32(vld1q_f32(a), vld1q_f32(b)));
|
|
||||||
#else
|
#else
|
||||||
dest[0] = a[0] + b[0];
|
dest[0] = a[0] + b[0];
|
||||||
dest[1] = a[1] + b[1];
|
dest[1] = a[1] + b[1];
|
||||||
@@ -275,8 +280,6 @@ void
|
|||||||
glm_vec4_adds(vec4 v, float s, vec4 dest) {
|
glm_vec4_adds(vec4 v, float s, vec4 dest) {
|
||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
glmm_store(dest, _mm_add_ps(glmm_load(v), _mm_set1_ps(s)));
|
glmm_store(dest, _mm_add_ps(glmm_load(v), _mm_set1_ps(s)));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(dest, vaddq_f32(vld1q_f32(v), vdupq_n_f32(s)));
|
|
||||||
#else
|
#else
|
||||||
dest[0] = v[0] + s;
|
dest[0] = v[0] + s;
|
||||||
dest[1] = v[1] + s;
|
dest[1] = v[1] + s;
|
||||||
@@ -297,8 +300,6 @@ void
|
|||||||
glm_vec4_sub(vec4 a, vec4 b, vec4 dest) {
|
glm_vec4_sub(vec4 a, vec4 b, vec4 dest) {
|
||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
glmm_store(dest, _mm_sub_ps(glmm_load(a), glmm_load(b)));
|
glmm_store(dest, _mm_sub_ps(glmm_load(a), glmm_load(b)));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(dest, vsubq_f32(vld1q_f32(a), vld1q_f32(b)));
|
|
||||||
#else
|
#else
|
||||||
dest[0] = a[0] - b[0];
|
dest[0] = a[0] - b[0];
|
||||||
dest[1] = a[1] - b[1];
|
dest[1] = a[1] - b[1];
|
||||||
@@ -319,8 +320,6 @@ void
|
|||||||
glm_vec4_subs(vec4 v, float s, vec4 dest) {
|
glm_vec4_subs(vec4 v, float s, vec4 dest) {
|
||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
glmm_store(dest, _mm_sub_ps(glmm_load(v), _mm_set1_ps(s)));
|
glmm_store(dest, _mm_sub_ps(glmm_load(v), _mm_set1_ps(s)));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(dest, vsubq_f32(vld1q_f32(v), vdupq_n_f32(s)));
|
|
||||||
#else
|
#else
|
||||||
dest[0] = v[0] - s;
|
dest[0] = v[0] - s;
|
||||||
dest[1] = v[1] - s;
|
dest[1] = v[1] - s;
|
||||||
@@ -341,8 +340,6 @@ void
|
|||||||
glm_vec4_mul(vec4 a, vec4 b, vec4 dest) {
|
glm_vec4_mul(vec4 a, vec4 b, vec4 dest) {
|
||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
glmm_store(dest, _mm_mul_ps(glmm_load(a), glmm_load(b)));
|
glmm_store(dest, _mm_mul_ps(glmm_load(a), glmm_load(b)));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(dest, vmulq_f32(vld1q_f32(a), vld1q_f32(b)));
|
|
||||||
#else
|
#else
|
||||||
dest[0] = a[0] * b[0];
|
dest[0] = a[0] * b[0];
|
||||||
dest[1] = a[1] * b[1];
|
dest[1] = a[1] * b[1];
|
||||||
@@ -363,8 +360,6 @@ void
|
|||||||
glm_vec4_scale(vec4 v, float s, vec4 dest) {
|
glm_vec4_scale(vec4 v, float s, vec4 dest) {
|
||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
glmm_store(dest, _mm_mul_ps(glmm_load(v), _mm_set1_ps(s)));
|
glmm_store(dest, _mm_mul_ps(glmm_load(v), _mm_set1_ps(s)));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(dest, vmulq_f32(vld1q_f32(v), vdupq_n_f32(s)));
|
|
||||||
#else
|
#else
|
||||||
dest[0] = v[0] * s;
|
dest[0] = v[0] * s;
|
||||||
dest[1] = v[1] * s;
|
dest[1] = v[1] * s;
|
||||||
@@ -447,10 +442,6 @@ glm_vec4_addadd(vec4 a, vec4 b, vec4 dest) {
|
|||||||
glmm_store(dest, _mm_add_ps(glmm_load(dest),
|
glmm_store(dest, _mm_add_ps(glmm_load(dest),
|
||||||
_mm_add_ps(glmm_load(a),
|
_mm_add_ps(glmm_load(a),
|
||||||
glmm_load(b))));
|
glmm_load(b))));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(dest, vaddq_f32(vld1q_f32(dest),
|
|
||||||
vaddq_f32(vld1q_f32(a),
|
|
||||||
vld1q_f32(b))));
|
|
||||||
#else
|
#else
|
||||||
dest[0] += a[0] + b[0];
|
dest[0] += a[0] + b[0];
|
||||||
dest[1] += a[1] + b[1];
|
dest[1] += a[1] + b[1];
|
||||||
@@ -475,10 +466,6 @@ glm_vec4_subadd(vec4 a, vec4 b, vec4 dest) {
|
|||||||
glmm_store(dest, _mm_add_ps(glmm_load(dest),
|
glmm_store(dest, _mm_add_ps(glmm_load(dest),
|
||||||
_mm_sub_ps(glmm_load(a),
|
_mm_sub_ps(glmm_load(a),
|
||||||
glmm_load(b))));
|
glmm_load(b))));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(dest, vaddq_f32(vld1q_f32(dest),
|
|
||||||
vsubq_f32(vld1q_f32(a),
|
|
||||||
vld1q_f32(b))));
|
|
||||||
#else
|
#else
|
||||||
dest[0] += a[0] - b[0];
|
dest[0] += a[0] - b[0];
|
||||||
dest[1] += a[1] - b[1];
|
dest[1] += a[1] - b[1];
|
||||||
@@ -503,10 +490,6 @@ glm_vec4_muladd(vec4 a, vec4 b, vec4 dest) {
|
|||||||
glmm_store(dest, _mm_add_ps(glmm_load(dest),
|
glmm_store(dest, _mm_add_ps(glmm_load(dest),
|
||||||
_mm_mul_ps(glmm_load(a),
|
_mm_mul_ps(glmm_load(a),
|
||||||
glmm_load(b))));
|
glmm_load(b))));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(dest, vaddq_f32(vld1q_f32(dest),
|
|
||||||
vmulq_f32(vld1q_f32(a),
|
|
||||||
vld1q_f32(b))));
|
|
||||||
#else
|
#else
|
||||||
dest[0] += a[0] * b[0];
|
dest[0] += a[0] * b[0];
|
||||||
dest[1] += a[1] * b[1];
|
dest[1] += a[1] * b[1];
|
||||||
@@ -531,10 +514,6 @@ glm_vec4_muladds(vec4 a, float s, vec4 dest) {
|
|||||||
glmm_store(dest, _mm_add_ps(glmm_load(dest),
|
glmm_store(dest, _mm_add_ps(glmm_load(dest),
|
||||||
_mm_mul_ps(glmm_load(a),
|
_mm_mul_ps(glmm_load(a),
|
||||||
_mm_set1_ps(s))));
|
_mm_set1_ps(s))));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(dest, vaddq_f32(vld1q_f32(dest),
|
|
||||||
vsubq_f32(vld1q_f32(a),
|
|
||||||
vdupq_n_f32(s))));
|
|
||||||
#else
|
#else
|
||||||
dest[0] += a[0] * s;
|
dest[0] += a[0] * s;
|
||||||
dest[1] += a[1] * s;
|
dest[1] += a[1] * s;
|
||||||
@@ -559,10 +538,6 @@ glm_vec4_maxadd(vec4 a, vec4 b, vec4 dest) {
|
|||||||
glmm_store(dest, _mm_add_ps(glmm_load(dest),
|
glmm_store(dest, _mm_add_ps(glmm_load(dest),
|
||||||
_mm_max_ps(glmm_load(a),
|
_mm_max_ps(glmm_load(a),
|
||||||
glmm_load(b))));
|
glmm_load(b))));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(dest, vaddq_f32(vld1q_f32(dest),
|
|
||||||
vmaxq_f32(vld1q_f32(a),
|
|
||||||
vld1q_f32(b))));
|
|
||||||
#else
|
#else
|
||||||
dest[0] += glm_max(a[0], b[0]);
|
dest[0] += glm_max(a[0], b[0]);
|
||||||
dest[1] += glm_max(a[1], b[1]);
|
dest[1] += glm_max(a[1], b[1]);
|
||||||
@@ -587,10 +562,6 @@ glm_vec4_minadd(vec4 a, vec4 b, vec4 dest) {
|
|||||||
glmm_store(dest, _mm_add_ps(glmm_load(dest),
|
glmm_store(dest, _mm_add_ps(glmm_load(dest),
|
||||||
_mm_min_ps(glmm_load(a),
|
_mm_min_ps(glmm_load(a),
|
||||||
glmm_load(b))));
|
glmm_load(b))));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(dest, vaddq_f32(vld1q_f32(dest),
|
|
||||||
vminq_f32(vld1q_f32(a),
|
|
||||||
vld1q_f32(b))));
|
|
||||||
#else
|
#else
|
||||||
dest[0] += glm_min(a[0], b[0]);
|
dest[0] += glm_min(a[0], b[0]);
|
||||||
dest[1] += glm_min(a[1], b[1]);
|
dest[1] += glm_min(a[1], b[1]);
|
||||||
@@ -610,8 +581,6 @@ void
|
|||||||
glm_vec4_negate_to(vec4 v, vec4 dest) {
|
glm_vec4_negate_to(vec4 v, vec4 dest) {
|
||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
glmm_store(dest, _mm_xor_ps(glmm_load(v), _mm_set1_ps(-0.0f)));
|
glmm_store(dest, _mm_xor_ps(glmm_load(v), _mm_set1_ps(-0.0f)));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(dest, veorq_s32(vld1q_f32(v), vdupq_n_f32(-0.0f)));
|
|
||||||
#else
|
#else
|
||||||
dest[0] = -v[0];
|
dest[0] = -v[0];
|
||||||
dest[1] = -v[1];
|
dest[1] = -v[1];
|
||||||
@@ -645,7 +614,7 @@ glm_vec4_normalize_to(vec4 v, vec4 dest) {
|
|||||||
float dot;
|
float dot;
|
||||||
|
|
||||||
x0 = glmm_load(v);
|
x0 = glmm_load(v);
|
||||||
xdot = glmm_vdot(x0, x0);
|
xdot = glmm_dot(x0, x0);
|
||||||
dot = _mm_cvtss_f32(xdot);
|
dot = _mm_cvtss_f32(xdot);
|
||||||
|
|
||||||
if (dot == 0.0f) {
|
if (dot == 0.0f) {
|
||||||
@@ -689,25 +658,10 @@ glm_vec4_normalize(vec4 v) {
|
|||||||
CGLM_INLINE
|
CGLM_INLINE
|
||||||
float
|
float
|
||||||
glm_vec4_distance(vec4 a, vec4 b) {
|
glm_vec4_distance(vec4 a, vec4 b) {
|
||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
|
||||||
__m128 x0;
|
|
||||||
x0 = _mm_sub_ps(glmm_load(b), glmm_load(a));
|
|
||||||
x0 = _mm_mul_ps(x0, x0);
|
|
||||||
x0 = _mm_add_ps(x0, glmm_shuff1(x0, 1, 0, 3, 2));
|
|
||||||
return _mm_cvtss_f32(_mm_sqrt_ss(_mm_add_ss(x0,
|
|
||||||
glmm_shuff1(x0, 0, 1, 0, 1))));
|
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
float32x4_t v0;
|
|
||||||
float32_t r;
|
|
||||||
v0 = vsubq_f32(vld1q_f32(a), vld1q_f32(b));
|
|
||||||
r = vaddvq_f32(vmulq_f32(v0, v0));
|
|
||||||
return sqrtf(r);
|
|
||||||
#else
|
|
||||||
return sqrtf(glm_pow2(b[0] - a[0])
|
return sqrtf(glm_pow2(b[0] - a[0])
|
||||||
+ glm_pow2(b[1] - a[1])
|
+ glm_pow2(b[1] - a[1])
|
||||||
+ glm_pow2(b[2] - a[2])
|
+ glm_pow2(b[2] - a[2])
|
||||||
+ glm_pow2(b[3] - a[3]));
|
+ glm_pow2(b[3] - a[3]));
|
||||||
#endif
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/*!
|
/*!
|
||||||
@@ -722,8 +676,6 @@ void
|
|||||||
glm_vec4_maxv(vec4 a, vec4 b, vec4 dest) {
|
glm_vec4_maxv(vec4 a, vec4 b, vec4 dest) {
|
||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
glmm_store(dest, _mm_max_ps(glmm_load(a), glmm_load(b)));
|
glmm_store(dest, _mm_max_ps(glmm_load(a), glmm_load(b)));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(dest, vmaxq_f32(vld1q_f32(a), vld1q_f32(b)));
|
|
||||||
#else
|
#else
|
||||||
dest[0] = glm_max(a[0], b[0]);
|
dest[0] = glm_max(a[0], b[0]);
|
||||||
dest[1] = glm_max(a[1], b[1]);
|
dest[1] = glm_max(a[1], b[1]);
|
||||||
@@ -744,8 +696,6 @@ void
|
|||||||
glm_vec4_minv(vec4 a, vec4 b, vec4 dest) {
|
glm_vec4_minv(vec4 a, vec4 b, vec4 dest) {
|
||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
glmm_store(dest, _mm_min_ps(glmm_load(a), glmm_load(b)));
|
glmm_store(dest, _mm_min_ps(glmm_load(a), glmm_load(b)));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(dest, vminq_f32(vld1q_f32(a), vld1q_f32(b)));
|
|
||||||
#else
|
#else
|
||||||
dest[0] = glm_min(a[0], b[0]);
|
dest[0] = glm_min(a[0], b[0]);
|
||||||
dest[1] = glm_min(a[1], b[1]);
|
dest[1] = glm_min(a[1], b[1]);
|
||||||
@@ -767,9 +717,6 @@ glm_vec4_clamp(vec4 v, float minVal, float maxVal) {
|
|||||||
#if defined( __SSE__ ) || defined( __SSE2__ )
|
#if defined( __SSE__ ) || defined( __SSE2__ )
|
||||||
glmm_store(v, _mm_min_ps(_mm_max_ps(glmm_load(v), _mm_set1_ps(minVal)),
|
glmm_store(v, _mm_min_ps(_mm_max_ps(glmm_load(v), _mm_set1_ps(minVal)),
|
||||||
_mm_set1_ps(maxVal)));
|
_mm_set1_ps(maxVal)));
|
||||||
#elif defined(CGLM_NEON_FP)
|
|
||||||
vst1q_f32(v, vminq_f32(vmaxq_f32(vld1q_f32(v), vdupq_n_f32(minVal)),
|
|
||||||
vdupq_n_f32(maxVal)));
|
|
||||||
#else
|
#else
|
||||||
v[0] = glm_clamp(v[0], minVal, maxVal);
|
v[0] = glm_clamp(v[0], minVal, maxVal);
|
||||||
v[1] = glm_clamp(v[1], minVal, maxVal);
|
v[1] = glm_clamp(v[1], minVal, maxVal);
|
||||||
@@ -800,23 +747,4 @@ glm_vec4_lerp(vec4 from, vec4 to, float t, vec4 dest) {
|
|||||||
glm_vec4_add(from, v, dest);
|
glm_vec4_add(from, v, dest);
|
||||||
}
|
}
|
||||||
|
|
||||||
/*!
|
|
||||||
* @brief helper to fill vec4 as [S^3, S^2, S, 1]
|
|
||||||
*
|
|
||||||
* @param[in] s parameter
|
|
||||||
* @param[out] dest destination
|
|
||||||
*/
|
|
||||||
CGLM_INLINE
|
|
||||||
void
|
|
||||||
glm_vec4_cubic(float s, vec4 dest) {
|
|
||||||
float ss;
|
|
||||||
|
|
||||||
ss = s * s;
|
|
||||||
|
|
||||||
dest[0] = ss * s;
|
|
||||||
dest[1] = ss;
|
|
||||||
dest[2] = s;
|
|
||||||
dest[3] = 1.0f;
|
|
||||||
}
|
|
||||||
|
|
||||||
#endif /* cglm_vec4_h */
|
#endif /* cglm_vec4_h */
|
||||||
|
|||||||
@@ -10,6 +10,6 @@
|
|||||||
|
|
||||||
#define CGLM_VERSION_MAJOR 0
|
#define CGLM_VERSION_MAJOR 0
|
||||||
#define CGLM_VERSION_MINOR 5
|
#define CGLM_VERSION_MINOR 5
|
||||||
#define CGLM_VERSION_PATCH 3
|
#define CGLM_VERSION_PATCH 2
|
||||||
|
|
||||||
#endif /* cglm_version_h */
|
#endif /* cglm_version_h */
|
||||||
|
|||||||
19
makefile.am
19
makefile.am
@@ -57,9 +57,7 @@ cglm_HEADERS = include/cglm/version.h \
|
|||||||
include/cglm/color.h \
|
include/cglm/color.h \
|
||||||
include/cglm/project.h \
|
include/cglm/project.h \
|
||||||
include/cglm/sphere.h \
|
include/cglm/sphere.h \
|
||||||
include/cglm/ease.h \
|
include/cglm/ease.h
|
||||||
include/cglm/curve.h \
|
|
||||||
include/cglm/bezier.h
|
|
||||||
|
|
||||||
cglm_calldir=$(includedir)/cglm/call
|
cglm_calldir=$(includedir)/cglm/call
|
||||||
cglm_call_HEADERS = include/cglm/call/mat4.h \
|
cglm_call_HEADERS = include/cglm/call/mat4.h \
|
||||||
@@ -76,14 +74,10 @@ cglm_call_HEADERS = include/cglm/call/mat4.h \
|
|||||||
include/cglm/call/box.h \
|
include/cglm/call/box.h \
|
||||||
include/cglm/call/project.h \
|
include/cglm/call/project.h \
|
||||||
include/cglm/call/sphere.h \
|
include/cglm/call/sphere.h \
|
||||||
include/cglm/call/ease.h \
|
include/cglm/call/ease.h
|
||||||
include/cglm/call/curve.h \
|
|
||||||
include/cglm/call/bezier.h
|
|
||||||
|
|
||||||
cglm_simddir=$(includedir)/cglm/simd
|
cglm_simddir=$(includedir)/cglm/simd
|
||||||
cglm_simd_HEADERS = include/cglm/simd/intrin.h \
|
cglm_simd_HEADERS = include/cglm/simd/intrin.h
|
||||||
include/cglm/simd/x86.h \
|
|
||||||
include/cglm/simd/arm.h
|
|
||||||
|
|
||||||
cglm_simd_sse2dir=$(includedir)/cglm/simd/sse2
|
cglm_simd_sse2dir=$(includedir)/cglm/simd/sse2
|
||||||
cglm_simd_sse2_HEADERS = include/cglm/simd/sse2/affine.h \
|
cglm_simd_sse2_HEADERS = include/cglm/simd/sse2/affine.h \
|
||||||
@@ -113,9 +107,7 @@ libcglm_la_SOURCES=\
|
|||||||
src/box.c \
|
src/box.c \
|
||||||
src/project.c \
|
src/project.c \
|
||||||
src/sphere.c \
|
src/sphere.c \
|
||||||
src/ease.c \
|
src/ease.c
|
||||||
src/curve.c \
|
|
||||||
src/bezier.c
|
|
||||||
|
|
||||||
test_tests_SOURCES=\
|
test_tests_SOURCES=\
|
||||||
test/src/test_common.c \
|
test/src/test_common.c \
|
||||||
@@ -129,8 +121,7 @@ test_tests_SOURCES=\
|
|||||||
test/src/test_vec4.c \
|
test/src/test_vec4.c \
|
||||||
test/src/test_vec3.c \
|
test/src/test_vec3.c \
|
||||||
test/src/test_mat3.c \
|
test/src/test_mat3.c \
|
||||||
test/src/test_affine.c \
|
test/src/test_affine.c
|
||||||
test/src/test_bezier.c
|
|
||||||
|
|
||||||
all-local:
|
all-local:
|
||||||
sh ./post-build.sh
|
sh ./post-build.sh
|
||||||
|
|||||||
27
src/bezier.c
27
src/bezier.c
@@ -1,27 +0,0 @@
|
|||||||
/*
|
|
||||||
* Copyright (c), Recep Aslantas.
|
|
||||||
*
|
|
||||||
* MIT License (MIT), http://opensource.org/licenses/MIT
|
|
||||||
* Full license can be found in the LICENSE file
|
|
||||||
*/
|
|
||||||
|
|
||||||
#include "../include/cglm/cglm.h"
|
|
||||||
#include "../include/cglm/call.h"
|
|
||||||
|
|
||||||
CGLM_EXPORT
|
|
||||||
float
|
|
||||||
glmc_bezier(float s, float p0, float c0, float c1, float p1) {
|
|
||||||
return glm_bezier(s, p0, c0, c1, p1);
|
|
||||||
}
|
|
||||||
|
|
||||||
CGLM_EXPORT
|
|
||||||
float
|
|
||||||
glmc_hermite(float s, float p0, float t0, float t1, float p1) {
|
|
||||||
return glm_hermite(s, p0, t0, t1, p1);
|
|
||||||
}
|
|
||||||
|
|
||||||
CGLM_EXPORT
|
|
||||||
float
|
|
||||||
glmc_decasteljau(float prm, float p0, float c0, float c1, float p1) {
|
|
||||||
return glm_decasteljau(prm, p0, c0, c1, p1);
|
|
||||||
}
|
|
||||||
15
src/curve.c
15
src/curve.c
@@ -1,15 +0,0 @@
|
|||||||
/*
|
|
||||||
* Copyright (c), Recep Aslantas.
|
|
||||||
*
|
|
||||||
* MIT License (MIT), http://opensource.org/licenses/MIT
|
|
||||||
* Full license can be found in the LICENSE file
|
|
||||||
*/
|
|
||||||
|
|
||||||
#include "../include/cglm/cglm.h"
|
|
||||||
#include "../include/cglm/call.h"
|
|
||||||
|
|
||||||
CGLM_EXPORT
|
|
||||||
float
|
|
||||||
glmc_smc(float s, mat4 m, vec4 c) {
|
|
||||||
return glm_smc(s, m, c);
|
|
||||||
}
|
|
||||||
@@ -91,9 +91,3 @@ void
|
|||||||
glmc_mat3_swap_row(mat3 mat, int row1, int row2) {
|
glmc_mat3_swap_row(mat3 mat, int row1, int row2) {
|
||||||
glm_mat3_swap_row(mat, row1, row2);
|
glm_mat3_swap_row(mat, row1, row2);
|
||||||
}
|
}
|
||||||
|
|
||||||
CGLM_EXPORT
|
|
||||||
float
|
|
||||||
glmc_mat3_rmc(vec3 r, mat3 m, vec3 c) {
|
|
||||||
return glm_mat3_rmc(r, m, c);
|
|
||||||
}
|
|
||||||
|
|||||||
@@ -151,9 +151,3 @@ void
|
|||||||
glmc_mat4_swap_row(mat4 mat, int row1, int row2) {
|
glmc_mat4_swap_row(mat4 mat, int row1, int row2) {
|
||||||
glm_mat4_swap_row(mat, row1, row2);
|
glm_mat4_swap_row(mat, row1, row2);
|
||||||
}
|
}
|
||||||
|
|
||||||
CGLM_EXPORT
|
|
||||||
float
|
|
||||||
glmc_mat4_rmc(vec4 r, mat4 m, vec4 c) {
|
|
||||||
return glm_mat4_rmc(r, m, c);
|
|
||||||
}
|
|
||||||
|
|||||||
@@ -206,12 +206,6 @@ glmc_vec4_lerp(vec4 from, vec4 to, float t, vec4 dest) {
|
|||||||
glm_vec4_lerp(from, to, t, dest);
|
glm_vec4_lerp(from, to, t, dest);
|
||||||
}
|
}
|
||||||
|
|
||||||
CGLM_EXPORT
|
|
||||||
void
|
|
||||||
glmc_vec4_cubic(float s, vec4 dest) {
|
|
||||||
glm_vec4_cubic(s, dest);
|
|
||||||
}
|
|
||||||
|
|
||||||
/* ext */
|
/* ext */
|
||||||
|
|
||||||
CGLM_EXPORT
|
CGLM_EXPORT
|
||||||
|
|||||||
@@ -1,65 +0,0 @@
|
|||||||
/*
|
|
||||||
* Copyright (c), Recep Aslantas.
|
|
||||||
*
|
|
||||||
* MIT License (MIT), http://opensource.org/licenses/MIT
|
|
||||||
* Full license can be found in the LICENSE file
|
|
||||||
*/
|
|
||||||
|
|
||||||
#include "test_common.h"
|
|
||||||
|
|
||||||
CGLM_INLINE
|
|
||||||
float
|
|
||||||
test_bezier_plain(float s, float p0, float c0, float c1, float p1) {
|
|
||||||
float x, xx, xxx, ss, sss;
|
|
||||||
|
|
||||||
x = 1.0f - s;
|
|
||||||
xx = x * x;
|
|
||||||
xxx = xx * x;
|
|
||||||
ss = s * s;
|
|
||||||
sss = ss * s;
|
|
||||||
|
|
||||||
return p0 * xxx + 3.0f * (c0 * s * xx + c1 * ss * x) + p1 * sss;
|
|
||||||
}
|
|
||||||
|
|
||||||
CGLM_INLINE
|
|
||||||
float
|
|
||||||
test_hermite_plain(float s, float p0, float t0, float t1, float p1) {
|
|
||||||
float ss, sss;
|
|
||||||
|
|
||||||
ss = s * s;
|
|
||||||
sss = ss * s;
|
|
||||||
|
|
||||||
return p0 * (2.0f * sss - 3.0f * ss + 1.0f)
|
|
||||||
+ t0 * (sss - 2.0f * ss + s)
|
|
||||||
+ p1 * (-2.0f * sss + 3.0f * ss)
|
|
||||||
+ t1 * (sss - ss);
|
|
||||||
}
|
|
||||||
|
|
||||||
void
|
|
||||||
test_bezier(void **state) {
|
|
||||||
float s, p0, p1, c0, c1, smc, Bs, Bs_plain;
|
|
||||||
|
|
||||||
s = test_rand();
|
|
||||||
p0 = test_rand();
|
|
||||||
p1 = test_rand();
|
|
||||||
c0 = test_rand();
|
|
||||||
c1 = test_rand();
|
|
||||||
|
|
||||||
/* test cubic bezier */
|
|
||||||
smc = glm_smc(s, GLM_BEZIER_MAT, (vec4){p0, c0, c1, p1});
|
|
||||||
Bs = glm_bezier(s, p0, c0, c1, p1);
|
|
||||||
Bs_plain = test_bezier_plain(s, p0, c0, c1, p1);
|
|
||||||
|
|
||||||
assert_true(glm_eq(Bs, Bs_plain));
|
|
||||||
assert_true(glm_eq(smc, Bs_plain));
|
|
||||||
assert_true(glm_eq(Bs, smc));
|
|
||||||
|
|
||||||
/* test cubic hermite */
|
|
||||||
smc = glm_smc(s, GLM_HERMITE_MAT, (vec4){p0, p1, c0, c1});
|
|
||||||
Bs = glm_hermite(s, p0, c0, c1, p1);
|
|
||||||
Bs_plain = test_hermite_plain(s, p0, c0, c1, p1);
|
|
||||||
|
|
||||||
assert_true(glm_eq(Bs, Bs_plain));
|
|
||||||
assert_true(glm_eq(smc, Bs_plain));
|
|
||||||
assert_true(glm_eq(Bs, smc));
|
|
||||||
}
|
|
||||||
@@ -58,7 +58,7 @@ test_rand_vec4(vec4 dest) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
float
|
float
|
||||||
test_rand(void) {
|
test_rand_angle(void) {
|
||||||
srand((unsigned int)time(NULL));
|
srand((unsigned int)time(NULL));
|
||||||
return drand48();
|
return drand48();
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -59,7 +59,7 @@ void
|
|||||||
test_rand_vec4(vec4 dest) ;
|
test_rand_vec4(vec4 dest) ;
|
||||||
|
|
||||||
float
|
float
|
||||||
test_rand(void);
|
test_rand_angle(void);
|
||||||
|
|
||||||
void
|
void
|
||||||
test_rand_quat(versor q);
|
test_rand_quat(versor q);
|
||||||
|
|||||||
@@ -38,10 +38,7 @@ main(int argc, const char * argv[]) {
|
|||||||
cmocka_unit_test(test_vec3),
|
cmocka_unit_test(test_vec3),
|
||||||
|
|
||||||
/* affine */
|
/* affine */
|
||||||
cmocka_unit_test(test_affine),
|
cmocka_unit_test(test_affine)
|
||||||
|
|
||||||
/* bezier */
|
|
||||||
cmocka_unit_test(test_bezier)
|
|
||||||
};
|
};
|
||||||
|
|
||||||
return cmocka_run_group_tests(tests, NULL, NULL);
|
return cmocka_run_group_tests(tests, NULL, NULL);
|
||||||
|
|||||||
@@ -40,7 +40,4 @@ test_vec3(void **state);
|
|||||||
void
|
void
|
||||||
test_affine(void **state);
|
test_affine(void **state);
|
||||||
|
|
||||||
void
|
|
||||||
test_bezier(void **state);
|
|
||||||
|
|
||||||
#endif /* test_tests_h */
|
#endif /* test_tests_h */
|
||||||
|
|||||||
@@ -20,10 +20,8 @@
|
|||||||
</ItemGroup>
|
</ItemGroup>
|
||||||
<ItemGroup>
|
<ItemGroup>
|
||||||
<ClCompile Include="..\src\affine.c" />
|
<ClCompile Include="..\src\affine.c" />
|
||||||
<ClCompile Include="..\src\bezier.c" />
|
|
||||||
<ClCompile Include="..\src\box.c" />
|
<ClCompile Include="..\src\box.c" />
|
||||||
<ClCompile Include="..\src\cam.c" />
|
<ClCompile Include="..\src\cam.c" />
|
||||||
<ClCompile Include="..\src\curve.c" />
|
|
||||||
<ClCompile Include="..\src\dllmain.c" />
|
<ClCompile Include="..\src\dllmain.c" />
|
||||||
<ClCompile Include="..\src\ease.c" />
|
<ClCompile Include="..\src\ease.c" />
|
||||||
<ClCompile Include="..\src\euler.c" />
|
<ClCompile Include="..\src\euler.c" />
|
||||||
@@ -41,14 +39,11 @@
|
|||||||
<ItemGroup>
|
<ItemGroup>
|
||||||
<ClInclude Include="..\include\cglm\affine-mat.h" />
|
<ClInclude Include="..\include\cglm\affine-mat.h" />
|
||||||
<ClInclude Include="..\include\cglm\affine.h" />
|
<ClInclude Include="..\include\cglm\affine.h" />
|
||||||
<ClInclude Include="..\include\cglm\bezier.h" />
|
|
||||||
<ClInclude Include="..\include\cglm\box.h" />
|
<ClInclude Include="..\include\cglm\box.h" />
|
||||||
<ClInclude Include="..\include\cglm\call.h" />
|
<ClInclude Include="..\include\cglm\call.h" />
|
||||||
<ClInclude Include="..\include\cglm\call\affine.h" />
|
<ClInclude Include="..\include\cglm\call\affine.h" />
|
||||||
<ClInclude Include="..\include\cglm\call\bezier.h" />
|
|
||||||
<ClInclude Include="..\include\cglm\call\box.h" />
|
<ClInclude Include="..\include\cglm\call\box.h" />
|
||||||
<ClInclude Include="..\include\cglm\call\cam.h" />
|
<ClInclude Include="..\include\cglm\call\cam.h" />
|
||||||
<ClInclude Include="..\include\cglm\call\curve.h" />
|
|
||||||
<ClInclude Include="..\include\cglm\call\ease.h" />
|
<ClInclude Include="..\include\cglm\call\ease.h" />
|
||||||
<ClInclude Include="..\include\cglm\call\euler.h" />
|
<ClInclude Include="..\include\cglm\call\euler.h" />
|
||||||
<ClInclude Include="..\include\cglm\call\frustum.h" />
|
<ClInclude Include="..\include\cglm\call\frustum.h" />
|
||||||
@@ -65,7 +60,6 @@
|
|||||||
<ClInclude Include="..\include\cglm\cglm.h" />
|
<ClInclude Include="..\include\cglm\cglm.h" />
|
||||||
<ClInclude Include="..\include\cglm\color.h" />
|
<ClInclude Include="..\include\cglm\color.h" />
|
||||||
<ClInclude Include="..\include\cglm\common.h" />
|
<ClInclude Include="..\include\cglm\common.h" />
|
||||||
<ClInclude Include="..\include\cglm\curve.h" />
|
|
||||||
<ClInclude Include="..\include\cglm\ease.h" />
|
<ClInclude Include="..\include\cglm\ease.h" />
|
||||||
<ClInclude Include="..\include\cglm\euler.h" />
|
<ClInclude Include="..\include\cglm\euler.h" />
|
||||||
<ClInclude Include="..\include\cglm\frustum.h" />
|
<ClInclude Include="..\include\cglm\frustum.h" />
|
||||||
@@ -75,7 +69,6 @@
|
|||||||
<ClInclude Include="..\include\cglm\plane.h" />
|
<ClInclude Include="..\include\cglm\plane.h" />
|
||||||
<ClInclude Include="..\include\cglm\project.h" />
|
<ClInclude Include="..\include\cglm\project.h" />
|
||||||
<ClInclude Include="..\include\cglm\quat.h" />
|
<ClInclude Include="..\include\cglm\quat.h" />
|
||||||
<ClInclude Include="..\include\cglm\simd\arm.h" />
|
|
||||||
<ClInclude Include="..\include\cglm\simd\avx\affine.h" />
|
<ClInclude Include="..\include\cglm\simd\avx\affine.h" />
|
||||||
<ClInclude Include="..\include\cglm\simd\avx\mat4.h" />
|
<ClInclude Include="..\include\cglm\simd\avx\mat4.h" />
|
||||||
<ClInclude Include="..\include\cglm\simd\intrin.h" />
|
<ClInclude Include="..\include\cglm\simd\intrin.h" />
|
||||||
@@ -84,7 +77,6 @@
|
|||||||
<ClInclude Include="..\include\cglm\simd\sse2\mat3.h" />
|
<ClInclude Include="..\include\cglm\simd\sse2\mat3.h" />
|
||||||
<ClInclude Include="..\include\cglm\simd\sse2\mat4.h" />
|
<ClInclude Include="..\include\cglm\simd\sse2\mat4.h" />
|
||||||
<ClInclude Include="..\include\cglm\simd\sse2\quat.h" />
|
<ClInclude Include="..\include\cglm\simd\sse2\quat.h" />
|
||||||
<ClInclude Include="..\include\cglm\simd\x86.h" />
|
|
||||||
<ClInclude Include="..\include\cglm\sphere.h" />
|
<ClInclude Include="..\include\cglm\sphere.h" />
|
||||||
<ClInclude Include="..\include\cglm\types.h" />
|
<ClInclude Include="..\include\cglm\types.h" />
|
||||||
<ClInclude Include="..\include\cglm\util.h" />
|
<ClInclude Include="..\include\cglm\util.h" />
|
||||||
|
|||||||
@@ -84,12 +84,6 @@
|
|||||||
<ClCompile Include="..\src\ease.c">
|
<ClCompile Include="..\src\ease.c">
|
||||||
<Filter>src</Filter>
|
<Filter>src</Filter>
|
||||||
</ClCompile>
|
</ClCompile>
|
||||||
<ClCompile Include="..\src\curve.c">
|
|
||||||
<Filter>src</Filter>
|
|
||||||
</ClCompile>
|
|
||||||
<ClCompile Include="..\src\bezier.c">
|
|
||||||
<Filter>src</Filter>
|
|
||||||
</ClCompile>
|
|
||||||
</ItemGroup>
|
</ItemGroup>
|
||||||
<ItemGroup>
|
<ItemGroup>
|
||||||
<ClInclude Include="..\src\config.h">
|
<ClInclude Include="..\src\config.h">
|
||||||
@@ -239,23 +233,5 @@
|
|||||||
<ClInclude Include="..\include\cglm\ease.h">
|
<ClInclude Include="..\include\cglm\ease.h">
|
||||||
<Filter>include\cglm</Filter>
|
<Filter>include\cglm</Filter>
|
||||||
</ClInclude>
|
</ClInclude>
|
||||||
<ClInclude Include="..\include\cglm\simd\arm.h">
|
|
||||||
<Filter>include\cglm\simd</Filter>
|
|
||||||
</ClInclude>
|
|
||||||
<ClInclude Include="..\include\cglm\simd\x86.h">
|
|
||||||
<Filter>include\cglm\simd</Filter>
|
|
||||||
</ClInclude>
|
|
||||||
<ClInclude Include="..\include\cglm\call\curve.h">
|
|
||||||
<Filter>include\cglm\call</Filter>
|
|
||||||
</ClInclude>
|
|
||||||
<ClInclude Include="..\include\cglm\curve.h">
|
|
||||||
<Filter>include\cglm</Filter>
|
|
||||||
</ClInclude>
|
|
||||||
<ClInclude Include="..\include\cglm\bezier.h">
|
|
||||||
<Filter>include\cglm</Filter>
|
|
||||||
</ClInclude>
|
|
||||||
<ClInclude Include="..\include\cglm\call\bezier.h">
|
|
||||||
<Filter>include\cglm\call</Filter>
|
|
||||||
</ClInclude>
|
|
||||||
</ItemGroup>
|
</ItemGroup>
|
||||||
</Project>
|
</Project>
|
||||||
Reference in New Issue
Block a user