sleefsseavx: added horizontal min and max

2019-09-23 13:42:23 +02:00
parent 7a8225d274
commit 204475dd05
1 changed files with 12 additions and 0 deletions
--- a/rtengine/sleefsseavx.c
+++ b/rtengine/sleefsseavx.c
@@ -1390,6 +1390,18 @@ static inline float vhadd( vfloat a ) {
    return _mm_cvtss_f32(_mm_add_ss(a, _mm_shuffle_ps(a, a, 1)));
 }
 static inline float vhmin(vfloat a) {
    // Horizontal minimum: returns min(a[0], a[1], a[2], a[3]).
    // Step 1: bring lanes 2 and 3 down to lanes 0 and 1 and combine them
    // with the original lower pair (vminf is presumably lane-wise; it is
    // defined elsewhere in this file).
    const vfloat upperPair = _mm_movehl_ps(a, a);
    const vfloat pairwise = vminf(a, upperPair);
    // Step 2: move lane 1 into lane 0, combine once more, and extract lane 0.
    const vfloat lane1 = _mm_shuffle_ps(pairwise, pairwise, 1);
    const vfloat reduced = vminf(pairwise, lane1);
    return _mm_cvtss_f32(reduced);
 }
 static inline float vhmax(vfloat a) {
    // Horizontal maximum: returns max(a[0], a[1], a[2], a[3]).
    // Step 1: bring lanes 2 and 3 down to lanes 0 and 1 and combine them
    // with the original lower pair (vmaxf is presumably lane-wise; it is
    // defined elsewhere in this file).
    const vfloat upperPair = _mm_movehl_ps(a, a);
    const vfloat pairwise = vmaxf(a, upperPair);
    // Step 2: move lane 1 into lane 0, combine once more, and extract lane 0.
    const vfloat lane1 = _mm_shuffle_ps(pairwise, pairwise, 1);
    const vfloat reduced = vmaxf(pairwise, lane1);
    return _mm_cvtss_f32(reduced);
 }
 static INLINE vfloat vmul2f(vfloat a){
    // fastest way to multiply by 2
 	return a + a;