29 const __m128 a1 = _mm_set1_ps(+0x1.ffffeap-1f);
30 const __m128 a3 = _mm_set1_ps(-0x1.55437p-2f);
31 const __m128 a5 = _mm_set1_ps(+0x1.972be6p-3f);
32 const __m128 a7 = _mm_set1_ps(-0x1.1436ap-3f);
33 const __m128 a9 = _mm_set1_ps(+0x1.5785aap-4f);
34 const __m128 a11 = _mm_set1_ps(-0x1.2f3004p-5f);
35 const __m128 a13 = _mm_set1_ps(+0x1.01a37cp-7f);
37 const __m128 x_times_x = _mm_mul_ps(x, x);
40 arctan = _mm_mul_ps(x_times_x, arctan);
41 arctan = _mm_add_ps(arctan, a11);
42 arctan = _mm_mul_ps(x_times_x, arctan);
43 arctan = _mm_add_ps(arctan, a9);
44 arctan = _mm_mul_ps(x_times_x, arctan);
45 arctan = _mm_add_ps(arctan, a7);
46 arctan = _mm_mul_ps(x_times_x, arctan);
47 arctan = _mm_add_ps(arctan, a5);
48 arctan = _mm_mul_ps(x_times_x, arctan);
49 arctan = _mm_add_ps(arctan, a3);
50 arctan = _mm_mul_ps(x_times_x, arctan);
51 arctan = _mm_add_ps(arctan, a1);
52 arctan = _mm_mul_ps(x, arctan);
59 __m128 iValue, qValue;
61 iValue = _mm_shuffle_ps(cplxValue1, cplxValue2, _MM_SHUFFLE(2, 0, 2, 0));
63 qValue = _mm_shuffle_ps(cplxValue1, cplxValue2, _MM_SHUFFLE(3, 1, 3, 1));
64 iValue = _mm_mul_ps(iValue, iValue);
65 qValue = _mm_mul_ps(qValue, qValue);
66 return _mm_add_ps(iValue, qValue);
88 __m128 sq_acc, __m128 acc, __m128 val, __m128 rec, __m128 aux)
90 aux = _mm_mul_ps(aux, val);
91 aux = _mm_sub_ps(aux, acc);
92 aux = _mm_mul_ps(aux, aux);
93 aux = _mm_mul_ps(aux, rec);
94 return _mm_add_ps(sq_acc, aux);
static __m128 _mm_accumulate_square_sum_ps(__m128 sq_acc, __m128 acc, __m128 val, __m128 rec, __m128 aux)
Definition volk_sse_intrinsics.h:87
static __m128 _mm_scaled_norm_dist_ps_sse(const __m128 symbols0, const __m128 symbols1, const __m128 points0, const __m128 points1, const __m128 scalar)
Definition volk_sse_intrinsics.h:74