2 * Single-precision vector sin function.
4 * Copyright (c) 2019, Arm Limited.
5 * SPDX-License-Identifier: MIT
12 static const float Poly[] = {
/* Constants for the vector sinf kernel.  Each macro wraps a scalar literal
   or a Poly[] entry in v_f32 / v_u32 (presumably a broadcast to every lane;
   those helpers are defined outside this view -- confirm).  */

/* Pi1, Pi2 and Pi3 are multiplied by n and subtracted from r in three
   successive fma steps of the range reduction, so together they stand in
   for pi: Pi1 is the leading part, Pi2 and Pi3 are much smaller
   correction terms.  */
19 #define Pi1 v_f32 (0x1.921fb6p+1f)
20 #define Pi2 v_f32 (-0x1.777a5cp-24f)
21 #define Pi3 v_f32 (-0x1.ee59dap-49f)
/* Polynomial coefficients, taken from Poly[] in reverse index order
   (A3 is Poly[3], A9 is Poly[0]).  The kernel consumes them from A9 down
   to A3 in its fma chain; the names presumably give the power of r that
   each coefficient multiplies -- confirm against the Poly[] table.  */
22 #define A3 v_f32 (Poly[3])
23 #define A5 v_f32 (Poly[2])
24 #define A7 v_f32 (Poly[1])
25 #define A9 v_f32 (Poly[0])
/* Threshold 2^20: lanes whose |x| bit pattern is >= the bit pattern of
   this value are flagged and routed to specialcase.  */
26 #define RangeVal v_f32 (0x1p20f)
/* Single-precision approximation of 1/pi; multiplied by |x| to form n.  */
27 #define InvPi v_f32 (0x1.45f306p-2f)
/* 1.5 * 2^23, added in the fma that forms n.  The lowest bit of the
   resulting bit pattern is then used as the parity of n.  */
28 #define Shift v_f32 (0x1.8p+23f)
/* Every bit except the top (sign) bit of a 32-bit lane.  */
29 #define AbsMask v_u32 (0x7fffffff)
/* Slow path, called by V_NAME(sinf) when v_any_u32 (cmp) is true.
   Forwards the original input x, the fast-path result y and the mask cmp
   to v_call_f32 together with the scalar sinf, and returns its result.
   NOTE(review): presumably v_call_f32 evaluates sinf on x only in the
   lanes set in cmp and keeps y elsewhere -- confirm against its
   definition, which is outside this view.  */
33 specialcase (v_f32_t x, v_f32_t y, v_u32_t cmp)
35 /* Fall back to scalar code. */
36 return v_call_f32 (sinf, x, y, cmp);
/* Vector single-precision sine of x.

   Steps visible here: split x into |x| and its sign bit; flag lanes with
   large |x|; form n from |x|/pi; subtract n*pi from |x| in three fma
   steps; evaluate a polynomial in r; fix the sign by XOR; hand flagged
   lanes to specialcase.

   NOTE(review): the declarations of n, r, r2 and y, the assignment of r2,
   any removal of Shift from n, and the final return of y are not visible
   in this view -- confirm against the full file.  The comments below
   assume v_fma_f32 (a, b, c) computes a * b + c.  */
41 V_NAME(sinf) (v_f32_t x)
44 v_u32_t sign, odd, cmp;
/* r = |x|: clear the sign bit of the bit pattern.  */
46 r = v_as_f32_u32 (v_as_u32_f32 (x) & AbsMask);
/* sign keeps only the sign bit of x.  */
47 sign = v_as_u32_f32 (x) & ~AbsMask;
/* cmp marks lanes where |x|, compared as an unsigned bit pattern, is
   >= RangeVal.  */
48 cmp = v_cond_u32 (v_as_u32_f32 (r) >= v_as_u32_f32 (RangeVal));
50 /* n = rint(|x|/pi) */
51 n = v_fma_f32 (InvPi, r, Shift);
/* odd = lowest bit of n's bit pattern moved to the sign-bit position; it
   is XORed into the result below, flipping the sign when that bit is
   set.  */
52 odd = v_as_u32_f32 (n) << 31;
/* NOTE(review): as shown, n still includes Shift at this point.  A
   subtraction of Shift is expected before the reduction but is not
   visible in this view -- confirm.  */
55 /* r = |x| - n*pi (range reduction into -pi/2 .. pi/2) */
56 r = v_fma_f32 (-Pi1, n, r);
57 r = v_fma_f32 (-Pi2, n, r);
58 r = v_fma_f32 (-Pi3, n, r);
/* Horner-style evaluation in r2 from A9 down to A3; the last step forms
   y = r + (poly * r2) * r.  r2 is presumably r * r (assignment not
   visible here -- confirm).  */
62 y = v_fma_f32 (A9, r2, A7);
63 y = v_fma_f32 (y, r2, A5);
64 y = v_fma_f32 (y, r2, A3);
65 y = v_fma_f32 (y * r2, r, r);
/* Sign fix: XOR the input's sign bit and the parity bit of n into y.  */
68 y = v_as_f32_u32 (v_as_u32_f32 (y) ^ sign ^ odd);
/* Take the slow path when v_any_u32 reports that cmp is set (presumably
   in at least one lane).  */
70 if (unlikely (v_any_u32 (cmp)))
71 return specialcase (x, y, cmp);