You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and dots ('.'), can be up to 35 characters long. Letters must be lowercase.
117 lines
3.2 KiB
117 lines
3.2 KiB
/////////////////////////////////////////////////////////////////////////////////////////////////// |
|
// OpenGL Mathematics Copyright (c) 2005 - 2010 G-Truc Creation (www.g-truc.net) |
|
/////////////////////////////////////////////////////////////////////////////////////////////////// |
|
// Created : 2009-05-08 |
|
// Updated : 2009-05-08 |
|
// Licence : This source is under MIT License |
|
// File : glm/core/intrinsic_geometric.inl |
|
/////////////////////////////////////////////////////////////////////////////////////////////////// |
|
|
|
//length |
|
inline __m128 _mm_len_ps(__m128 x) |
|
{ |
|
__m128 dot0 = _mm_dot_ps(x, x); |
|
__m128 sqt0 = _mm_sqrt_ps(dot0); |
|
return sqt0; |
|
} |
|
|
|
//distance |
|
inline __m128 _mm_dst_ps(__m128 p0, __m128 p1) |
|
{ |
|
__m128 sub0 = _mm_sub_ps(p0, p1); |
|
__m128 len0 = _mm_len_ps(sub0); |
|
return len0; |
|
} |
|
|
|
//dot |
|
// Four-component dot product of v1 and v2.
// The scalar result is replicated into all four lanes of the return value.
inline __m128 _mm_dot_ps(__m128 v1, __m128 v2)
{
	// Lane-wise products: (p0, p1, p2, p3).
	__m128 const prod = _mm_mul_ps(v1, v2);

	// Swap the neighbours inside each pair and add:
	// (p0+p1, p0+p1, p2+p3, p2+p3).
	__m128 const pairs = _mm_add_ps(
		prod, _mm_shuffle_ps(prod, prod, _MM_SHUFFLE(2, 3, 0, 1)));

	// Reverse the lane order and add, so every lane holds the full sum.
	return _mm_add_ps(
		pairs, _mm_shuffle_ps(pairs, pairs, _MM_SHUFFLE(0, 1, 2, 3)));
}
|
|
|
// SSE1 |
|
// Four-component dot product of v1 and v2, delivered in lane 0 only.
// Lanes 1..3 of the result hold intermediate partial sums, not the
// dot product.
inline __m128 _mm_dot_ss(__m128 v1, __m128 v2)
{
	// Lane-wise products: (p0, p1, p2, p3).
	__m128 const prod = _mm_mul_ps(v1, v2);

	// Fold the high half onto the low half:
	// (p2+p0, p3+p1, 2*p2, 2*p3).
	__m128 const folded = _mm_add_ps(_mm_movehl_ps(prod, prod), prod);

	// Bring lane 1 down to lane 0 and finish the sum with a scalar add;
	// the upper lanes of 'folded' pass through unchanged.
	return _mm_add_ss(folded, _mm_shuffle_ps(folded, folded, 1));
}
|
|
|
//cross |
|
// Cross product of the first three lanes of v1 and v2.
// Lane 3 of the result is v1[3]*v2[3] - v1[3]*v2[3].
inline __m128 _mm_xpd_ps(__m128 v1, __m128 v2)
{
	// Rotated copies of each operand: (y, z, x, w) and (z, x, y, w).
	__m128 const a_yzx = _mm_shuffle_ps(v1, v1, _MM_SHUFFLE(3, 0, 2, 1));
	__m128 const a_zxy = _mm_shuffle_ps(v1, v1, _MM_SHUFFLE(3, 1, 0, 2));
	__m128 const b_yzx = _mm_shuffle_ps(v2, v2, _MM_SHUFFLE(3, 0, 2, 1));
	__m128 const b_zxy = _mm_shuffle_ps(v2, v2, _MM_SHUFFLE(3, 1, 0, 2));

	// (a.y*b.z - a.z*b.y, a.z*b.x - a.x*b.z, a.x*b.y - a.y*b.x, ...)
	return _mm_sub_ps(_mm_mul_ps(a_yzx, b_zxy), _mm_mul_ps(a_zxy, b_yzx));
}
|
|
|
//normalize |
|
inline __m128 _mm_nrm_ps(__m128 v) |
|
{ |
|
__m128 dot0 = _mm_dot_ps(v, v); |
|
__m128 isr0 = _mm_rsqrt_ps(dot0); |
|
__m128 mul0 = _mm_mul_ps(v, isr0); |
|
return mul0; |
|
} |
|
|
|
//faceforward |
|
inline __m128 _mm_ffd_ps(__m128 N, __m128 I, __m128 Nref) |
|
{ |
|
//__m128 dot0 = _mm_dot_ps(v, v); |
|
//__m128 neg0 = _mm_neg_ps(N); |
|
//__m128 sgn0 = _mm_sgn_ps(dot0); |
|
//__m128 mix0 = _mm_mix_ps(N, neg0, sgn0); |
|
//return mix0; |
|
|
|
__m128 dot0 = _mm_dot_ps(Nref, I); |
|
__m128 sgn0 = _mm_sgn_ps(dot0); |
|
__m128 mul0 = _mm_mul_ps(sgn0, glm::detail::minus_one); |
|
__m128 mul1 = _mm_mul_ps(N, mul0); |
|
return mul1; |
|
} |
|
|
|
//reflect |
|
inline __m128 _mm_rfe_ps(__m128 I, __m128 N) |
|
{ |
|
__m128 dot0 = _mm_dot_ps(N, I); |
|
__m128 mul0 = _mm_mul_ps(N, I); |
|
__m128 mul1 = _mm_mul_ps(mul0, glm::detail::two); |
|
__m128 sub0 = _mm_sub_ps(I, mul1); |
|
return sub0; |
|
} |
|
|
|
//refract |
|
inline __m128 _mm_rfa_ps(__m128 I, __m128 N, __m128 eta) |
|
{ |
|
__m128 dot0 = _mm_dot_ps(N, I); |
|
__m128 mul0 = _mm_mul_ps(eta, eta); |
|
__m128 mul1 = _mm_mul_ps(dot0, dot0); |
|
__m128 sub0 = _mm_sub_ps(glm::detail::one, mul0); |
|
__m128 sub1 = _mm_sub_ps(glm::detail::one, mul1); |
|
__m128 mul2 = _mm_mul_ps(sub0, sub1); |
|
|
|
if(_mm_movemask_ps(_mm_cmplt_ss(mul2, glm::detail::zero)) == 0) |
|
return glm::detail::zero; |
|
|
|
__m128 sqt0 = _mm_sqrt_ps(mul2); |
|
__m128 mul3 = _mm_mul_ps(eta, dot0); |
|
__m128 add0 = _mm_add_ps(mul3, sqt0); |
|
__m128 mul4 = _mm_mul_ps(add0, N); |
|
__m128 mul5 = _mm_mul_ps(eta, I); |
|
__m128 sub2 = _mm_sub_ps(mul5, mul4); |
|
|
|
return sub2; |
|
}
|
|
|