28 #ifndef INCLUDE_VOLK_VOLK_SSE3_INTRINSICS_H_
29 #define INCLUDE_VOLK_VOLK_SSE3_INTRINSICS_H_
30 #include <pmmintrin.h>
/* Fragment of a function body; the enclosing signature is not visible here.
 * x and y are used as __m128 values (four packed floats each).
 * NOTE(review): presumably each vector holds two interleaved (re, im) complex
 * numbers -- confirm against the declaration. Under that assumption the value
 * returned below is the pair of complex products x * y. */
35 __m128 yl, yh, tmp1, tmp2;
/* yl = (y0, y0, y2, y2): even-indexed lanes of y, each duplicated. */
36 yl = _mm_moveldup_ps(y);
/* yh = (y1, y1, y3, y3): odd-indexed lanes of y, each duplicated. */
37 yh = _mm_movehdup_ps(y);
/* tmp1 = (x0*y0, x1*y0, x2*y2, x3*y2) */
38 tmp1 = _mm_mul_ps(x, yl);
/* 0xB1 swaps the two floats inside each adjacent pair: x = (x1, x0, x3, x2). */
39 x = _mm_shuffle_ps(x, x, 0xB1);
/* tmp2 = (x1*y1, x0*y1, x3*y3, x2*y3), using the swapped x. */
40 tmp2 = _mm_mul_ps(x, yh);
/* addsub subtracts in even lanes and adds in odd lanes:
 * (x0*y0 - x1*y1, x1*y0 + x0*y1, x2*y2 - x3*y3, x3*y2 + x2*y3). */
41 return _mm_addsub_ps(tmp1, tmp2);
/* Fragment of a function body; the signature and any statements after these
 * two lines are not visible here.
 * The mask is (+0, -0, +0, -0) in lane order 0..3; -0.f has only the sign bit
 * set, so the XOR below flips the sign of lanes 1 and 3 of y and leaves lanes
 * 0 and 2 unchanged.
 * NOTE(review): presumably y holds interleaved (re, im) pairs, making this a
 * complex conjugation of y -- confirm against the declaration. */
47 const __m128 conjugator = _mm_setr_ps(0, -0.f, 0, -0.f);
48 y = _mm_xor_ps(y, conjugator);
/* Fragment of a function body; the enclosing signature is not visible here.
 * Squares every lane of both inputs, then sums adjacent lane pairs.
 * NOTE(review): presumably each input holds two interleaved (re, im) complex
 * values, so the result would be four squared magnitudes -- confirm against
 * the declaration. */
/* Lane-wise square: each element becomes v[i] * v[i]. */
54 cplxValue1 = _mm_mul_ps(cplxValue1, cplxValue1);
55 cplxValue2 = _mm_mul_ps(cplxValue2, cplxValue2);
/* Horizontal add: result = (a0+a1, a2+a3, b0+b1, b2+b3), where a and b are the
 * squared cplxValue1 and cplxValue2 respectively. */
56 return _mm_hadd_ps(cplxValue1, cplxValue2);
/* Fragment of a function body; the enclosing signature is not visible here,
 * and neither is the statement that defines `norms`. */
/* Lane-wise differences between each symbols vector and its points vector. */
71 const __m128 diff0 = _mm_sub_ps(symbols0, points0);
72 const __m128 diff1 = _mm_sub_ps(symbols1, points1);
/* Returns the lane-wise product of `norms` and `scalar`.
 * NOTE(review): `norms` is presumably computed from diff0 and diff1 on a line
 * missing from this view -- confirm against the full source. */
74 return _mm_mul_ps(norms, scalar);