| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245 | /******************************************************************************    Copyright (C) 2013 by Hugh Bailey <[email protected]>    This program is free software: you can redistribute it and/or modify    it under the terms of the GNU General Public License as published by    the Free Software Foundation, either version 2 of the License, or    (at your option) any later version.    This program is distributed in the hope that it will be useful,    but WITHOUT ANY WARRANTY; without even the implied warranty of    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the    GNU General Public License for more details.    You should have received a copy of the GNU General Public License    along with this program.  If not, see <http://www.gnu.org/licenses/>.******************************************************************************/#pragma once#include "math-defs.h"#include <xmmintrin.h>#ifdef __cplusplusextern "C" {#endifstruct vec3;struct matrix4;struct vec4 {	union {		struct {			float x, y, z, w;		};		float ptr[4];		__m128 m;	};};static inline void vec4_zero(struct vec4 *v){	v->m = _mm_setzero_ps();}static inline void vec4_set(struct vec4 *dst, float x, float y, float z,			    float w){	dst->m = _mm_set_ps(w, z, y, x);}static inline void vec4_copy(struct vec4 *dst, const struct vec4 *v){	dst->m = v->m;}EXPORT void vec4_from_vec3(struct vec4 *dst, const struct vec3 *v);static inline void vec4_add(struct vec4 *dst, const struct vec4 *v1,			    const struct vec4 *v2){	dst->m = _mm_add_ps(v1->m, v2->m);}static inline void vec4_sub(struct vec4 *dst, const struct vec4 *v1,			    const struct vec4 *v2){	dst->m = _mm_sub_ps(v1->m, v2->m);}static inline void vec4_mul(struct vec4 *dst, const struct vec4 *v1,			    const struct vec4 *v2){	dst->m = _mm_mul_ps(v1->m, v2->m);}static inline void vec4_div(struct vec4 *dst, const struct vec4 *v1,			    const struct vec4 *v2){	dst->m = _mm_div_ps(v1->m, v2->m);}static inline void vec4_addf(struct vec4 *dst, const struct vec4 *v, float f){	dst->m = _mm_add_ps(v->m, _mm_set1_ps(f));}static inline void vec4_subf(struct vec4 *dst, const struct vec4 *v, float f){	dst->m = _mm_sub_ps(v->m, _mm_set1_ps(f));}static inline void vec4_mulf(struct vec4 *dst, const struct vec4 *v, float f){	dst->m = _mm_mul_ps(v->m, _mm_set1_ps(f));}static inline void vec4_divf(struct vec4 *dst, const struct vec4 *v, float f){	dst->m = _mm_div_ps(v->m, _mm_set1_ps(f));}static inline float vec4_dot(const struct vec4 *v1, const struct vec4 *v2){	struct vec4 add;	__m128 mul = _mm_mul_ps(v1->m, v2->m);	add.m = _mm_add_ps(_mm_movehl_ps(mul, mul), mul);	add.m = _mm_add_ps(_mm_shuffle_ps(add.m, add.m, 0x55), add.m);	return add.x;}static inline void vec4_neg(struct vec4 *dst, const struct vec4 *v){	dst->x = -v->x;	dst->y = -v->y;	dst->z = -v->z;	dst->w = -v->w;}static inline float vec4_len(const struct vec4 *v){	float dot_val = vec4_dot(v, v);	return (dot_val > 0.0f) ? sqrtf(dot_val) : 0.0f;}static inline float vec4_dist(const struct vec4 *v1, const struct vec4 *v2){	struct vec4 temp;	float dot_val;	vec4_sub(&temp, v1, v2);	dot_val = vec4_dot(&temp, &temp);	return (dot_val > 0.0f) ? sqrtf(dot_val) : 0.0f;}static inline void vec4_norm(struct vec4 *dst, const struct vec4 *v){	float dot_val = vec4_dot(v, v);	dst->m = (dot_val > 0.0f)			 ? _mm_mul_ps(v->m, _mm_set1_ps(1.0f / sqrtf(dot_val)))			 : _mm_setzero_ps();}static inline int vec4_close(const struct vec4 *v1, const struct vec4 *v2,			     float epsilon){	struct vec4 test;	vec4_sub(&test, v1, v2);	return test.x < epsilon && test.y < epsilon && test.z < epsilon &&	       test.w < epsilon;}static inline void vec4_min(struct vec4 *dst, const struct vec4 *v1,			    const struct vec4 *v2){	dst->m = _mm_min_ps(v1->m, v2->m);}static inline void vec4_minf(struct vec4 *dst, const struct vec4 *v, float f){	dst->m = _mm_min_ps(v->m, _mm_set1_ps(f));}static inline void vec4_max(struct vec4 *dst, const struct vec4 *v1,			    const struct vec4 *v2){	dst->m = _mm_max_ps(v1->m, v2->m);}static inline void vec4_maxf(struct vec4 *dst, const struct vec4 *v, float f){	dst->m = _mm_max_ps(v->m, _mm_set1_ps(f));}static inline void vec4_abs(struct vec4 *dst, const struct vec4 *v){	dst->x = fabsf(v->x);	dst->y = fabsf(v->y);	dst->z = fabsf(v->z);	dst->w = fabsf(v->w);}static inline void vec4_floor(struct vec4 *dst, const struct vec4 *v){	dst->x = floorf(v->x);	dst->y = floorf(v->y);	dst->z = floorf(v->z);	dst->w = floorf(v->w);}static inline void vec4_ceil(struct vec4 *dst, const struct vec4 *v){	dst->x = ceilf(v->x);	dst->y = ceilf(v->y);	dst->z = ceilf(v->z);	dst->w = ceilf(v->w);}static inline uint32_t vec4_to_rgba(const struct vec4 *src){	uint32_t val;	val = (uint32_t)((double)src->x * 255.0);	val |= (uint32_t)((double)src->y * 255.0) << 8;	val |= (uint32_t)((double)src->z * 255.0) << 16;	val |= (uint32_t)((double)src->w * 255.0) << 24;	return val;}static inline uint32_t vec4_to_bgra(const struct vec4 *src){	uint32_t val;	val = (uint32_t)((double)src->z * 255.0);	val |= (uint32_t)((double)src->y * 255.0) << 8;	val |= (uint32_t)((double)src->x * 255.0) << 16;	val |= (uint32_t)((double)src->w * 255.0) << 24;	return val;}static inline void vec4_from_rgba(struct vec4 *dst, uint32_t rgba){	dst->x = (float)((double)(rgba & 0xFF) * (1.0 / 255.0));	rgba >>= 8;	dst->y = (float)((double)(rgba & 0xFF) * (1.0 / 255.0));	rgba >>= 8;	dst->z = (float)((double)(rgba & 0xFF) * (1.0 / 255.0));	rgba >>= 8;	dst->w = (float)((double)(rgba & 0xFF) * (1.0 / 255.0));}static inline void vec4_from_bgra(struct vec4 *dst, uint32_t bgra){	dst->z = (float)((double)(bgra & 0xFF) * (1.0 / 255.0));	bgra >>= 8;	dst->y = (float)((double)(bgra & 0xFF) * (1.0 / 255.0));	bgra >>= 8;	dst->x = (float)((double)(bgra & 0xFF) * (1.0 / 255.0));	bgra >>= 8;	dst->w = (float)((double)(bgra & 0xFF) * (1.0 / 255.0));}EXPORT void vec4_transform(struct vec4 *dst, const struct vec4 *v,			   const struct matrix4 *m);#ifdef __cplusplus}#endif
 |