aarch64: Add vector implementations of expm1 routines
[glibc.git] / sysdeps / aarch64 / fpu / bits / math-vector.h
blob52aad95e3b9fc130b49ed2e6363b3b53049d37d3
1 /* Platform-specific SIMD declarations of math functions.
3 Copyright (C) 2023 Free Software Foundation, Inc.
4 This file is part of the GNU C Library.
6 The GNU C Library is free software; you can redistribute it and/or
7 modify it under the terms of the GNU Lesser General Public
8 License as published by the Free Software Foundation; either
9 version 2.1 of the License, or (at your option) any later version.
11 The GNU C Library is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 Lesser General Public License for more details.
16 You should have received a copy of the GNU Lesser General Public
17 License along with the GNU C Library; if not, see
18 <https://www.gnu.org/licenses/>. */
/* Reject inclusion of this header when _MATH_H is not defined; the
   diagnostic below tells the user to include <math.h> instead.  */
20 #ifndef _MATH_H
21 # error "Never include <bits/math-vector.h> directly;\
22 include <math.h> instead."
23 #endif
25 /* Get default empty definitions for simd declarations. */
26 #include <bits/libm-simd-decl-stubs.h>
/* Advanced SIMD vector types used by the _ZGVnN* prototypes in this file.
   Two configurations are recognised:
     - when __GNUC_PREREQ (9, 0) holds, the types alias __Float32x4_t and
       __Float64x2_t;
     - otherwise, when __glibc_clang_prereq (8, 0) holds, they are declared
       as 4 x float and 2 x double through the __neon_vector_type__
       attribute.
   Either branch also defines __ADVSIMD_VEC_MATH_SUPPORTED, which is tested
   by the "#ifdef __ADVSIMD_VEC_MATH_SUPPORTED" section of this file.  If
   neither condition holds, nothing is defined here.  */
28 #if __GNUC_PREREQ(9, 0)
29 # define __ADVSIMD_VEC_MATH_SUPPORTED
30 typedef __Float32x4_t __f32x4_t;
31 typedef __Float64x2_t __f64x2_t;
32 #elif __glibc_clang_prereq(8, 0)
33 # define __ADVSIMD_VEC_MATH_SUPPORTED
34 typedef __attribute__ ((__neon_vector_type__ (4))) float __f32x4_t;
35 typedef __attribute__ ((__neon_vector_type__ (2))) double __f64x2_t;
36 #endif
/* SVE types used by the _ZGVsMx* prototypes in this file.  When either
   __GNUC_PREREQ (10, 0) or __glibc_clang_prereq (11, 0) holds, define
   __SVE_VEC_MATH_SUPPORTED and give the types __SVFloat32_t, __SVFloat64_t
   and __SVBool_t the local names __sv_f32_t, __sv_f64_t and __sv_bool_t.
   Otherwise nothing is defined here.  */
38 #if __GNUC_PREREQ(10, 0) || __glibc_clang_prereq(11, 0)
39 # define __SVE_VEC_MATH_SUPPORTED
40 typedef __SVFloat32_t __sv_f32_t;
41 typedef __SVFloat64_t __sv_f64_t;
42 typedef __SVBool_t __sv_bool_t;
43 #endif
45 /* If vector types and vector PCS are unsupported in the working
46 compiler, no choice but to omit vector math declarations. */
/* Prototypes of the Advanced SIMD vector math routines.  They are only
   declared when __ADVSIMD_VEC_MATH_SUPPORTED was defined earlier in this
   file, i.e. when __f32x4_t and __f64x2_t exist.
   NOTE(review): the _ZGVnN<len><args>_<name> spelling appears to follow the
   AArch64 vector function ABI mangling (n = Advanced SIMD, N = unmasked,
   4 or 2 = lane count, one 'v' per vector argument) -- confirm against the
   ABI document.  */
48 #ifdef __ADVSIMD_VEC_MATH_SUPPORTED
/* Shorthand for the __aarch64_vector_pcs__ attribute that is applied to
   every prototype in this section.
   NOTE(review): unlike the feature macro, __vpcs is not #undef'd at the
   end of this section.  */
50 # define __vpcs __attribute__ ((__aarch64_vector_pcs__))
/* Variants operating on __f32x4_t.  atan2f takes two vector arguments,
   all others take one.  */
52 __vpcs __f32x4_t _ZGVnN4vv_atan2f (__f32x4_t, __f32x4_t);
53 __vpcs __f32x4_t _ZGVnN4v_acosf (__f32x4_t);
54 __vpcs __f32x4_t _ZGVnN4v_asinf (__f32x4_t);
55 __vpcs __f32x4_t _ZGVnN4v_atanf (__f32x4_t);
56 __vpcs __f32x4_t _ZGVnN4v_cosf (__f32x4_t);
57 __vpcs __f32x4_t _ZGVnN4v_expf (__f32x4_t);
58 __vpcs __f32x4_t _ZGVnN4v_exp10f (__f32x4_t);
59 __vpcs __f32x4_t _ZGVnN4v_exp2f (__f32x4_t);
60 __vpcs __f32x4_t _ZGVnN4v_expm1f (__f32x4_t);
61 __vpcs __f32x4_t _ZGVnN4v_logf (__f32x4_t);
62 __vpcs __f32x4_t _ZGVnN4v_log10f (__f32x4_t);
63 __vpcs __f32x4_t _ZGVnN4v_log1pf (__f32x4_t);
64 __vpcs __f32x4_t _ZGVnN4v_log2f (__f32x4_t);
65 __vpcs __f32x4_t _ZGVnN4v_sinf (__f32x4_t);
66 __vpcs __f32x4_t _ZGVnN4v_tanf (__f32x4_t);
/* Variants operating on __f64x2_t; the same fifteen functions as above,
   without the 'f' suffix.  */
68 __vpcs __f64x2_t _ZGVnN2vv_atan2 (__f64x2_t, __f64x2_t);
69 __vpcs __f64x2_t _ZGVnN2v_acos (__f64x2_t);
70 __vpcs __f64x2_t _ZGVnN2v_asin (__f64x2_t);
71 __vpcs __f64x2_t _ZGVnN2v_atan (__f64x2_t);
72 __vpcs __f64x2_t _ZGVnN2v_cos (__f64x2_t);
73 __vpcs __f64x2_t _ZGVnN2v_exp (__f64x2_t);
74 __vpcs __f64x2_t _ZGVnN2v_exp10 (__f64x2_t);
75 __vpcs __f64x2_t _ZGVnN2v_exp2 (__f64x2_t);
76 __vpcs __f64x2_t _ZGVnN2v_expm1 (__f64x2_t);
77 __vpcs __f64x2_t _ZGVnN2v_log (__f64x2_t);
78 __vpcs __f64x2_t _ZGVnN2v_log10 (__f64x2_t);
79 __vpcs __f64x2_t _ZGVnN2v_log1p (__f64x2_t);
80 __vpcs __f64x2_t _ZGVnN2v_log2 (__f64x2_t);
81 __vpcs __f64x2_t _ZGVnN2v_sin (__f64x2_t);
82 __vpcs __f64x2_t _ZGVnN2v_tan (__f64x2_t);
/* The feature macro has done its job of gating this section; drop it.  */
84 # undef __ADVSIMD_VEC_MATH_SUPPORTED
85 #endif /* __ADVSIMD_VEC_MATH_SUPPORTED */
/* Prototypes of the SVE vector math routines.  They are only declared when
   __SVE_VEC_MATH_SUPPORTED was defined earlier in this file, i.e. when the
   __sv_f32_t, __sv_f64_t and __sv_bool_t typedefs exist.  Unlike the
   Advanced SIMD prototypes, these carry no calling-convention attribute,
   and each one takes an additional trailing __sv_bool_t argument.
   NOTE(review): the _ZGVsMx<args>_<name> spelling appears to follow the
   AArch64 vector function ABI mangling (s = SVE, M = masked, x = scalable
   length), which would make the __sv_bool_t argument the governing
   predicate -- confirm against the ABI document.  */
87 #ifdef __SVE_VEC_MATH_SUPPORTED
/* Variants operating on __sv_f32_t.  atan2f takes two vector arguments,
   all others take one.  */
89 __sv_f32_t _ZGVsMxvv_atan2f (__sv_f32_t, __sv_f32_t, __sv_bool_t);
90 __sv_f32_t _ZGVsMxv_acosf (__sv_f32_t, __sv_bool_t);
91 __sv_f32_t _ZGVsMxv_asinf (__sv_f32_t, __sv_bool_t);
92 __sv_f32_t _ZGVsMxv_atanf (__sv_f32_t, __sv_bool_t);
93 __sv_f32_t _ZGVsMxv_cosf (__sv_f32_t, __sv_bool_t);
94 __sv_f32_t _ZGVsMxv_expf (__sv_f32_t, __sv_bool_t);
95 __sv_f32_t _ZGVsMxv_exp10f (__sv_f32_t, __sv_bool_t);
96 __sv_f32_t _ZGVsMxv_exp2f (__sv_f32_t, __sv_bool_t);
97 __sv_f32_t _ZGVsMxv_expm1f (__sv_f32_t, __sv_bool_t);
98 __sv_f32_t _ZGVsMxv_logf (__sv_f32_t, __sv_bool_t);
99 __sv_f32_t _ZGVsMxv_log10f (__sv_f32_t, __sv_bool_t);
100 __sv_f32_t _ZGVsMxv_log1pf (__sv_f32_t, __sv_bool_t);
101 __sv_f32_t _ZGVsMxv_log2f (__sv_f32_t, __sv_bool_t);
102 __sv_f32_t _ZGVsMxv_sinf (__sv_f32_t, __sv_bool_t);
103 __sv_f32_t _ZGVsMxv_tanf (__sv_f32_t, __sv_bool_t);
/* Variants operating on __sv_f64_t; the same fifteen functions as above,
   without the 'f' suffix.  */
105 __sv_f64_t _ZGVsMxvv_atan2 (__sv_f64_t, __sv_f64_t, __sv_bool_t);
106 __sv_f64_t _ZGVsMxv_acos (__sv_f64_t, __sv_bool_t);
107 __sv_f64_t _ZGVsMxv_asin (__sv_f64_t, __sv_bool_t);
108 __sv_f64_t _ZGVsMxv_atan (__sv_f64_t, __sv_bool_t);
109 __sv_f64_t _ZGVsMxv_cos (__sv_f64_t, __sv_bool_t);
110 __sv_f64_t _ZGVsMxv_exp (__sv_f64_t, __sv_bool_t);
111 __sv_f64_t _ZGVsMxv_exp10 (__sv_f64_t, __sv_bool_t);
112 __sv_f64_t _ZGVsMxv_exp2 (__sv_f64_t, __sv_bool_t);
113 __sv_f64_t _ZGVsMxv_expm1 (__sv_f64_t, __sv_bool_t);
114 __sv_f64_t _ZGVsMxv_log (__sv_f64_t, __sv_bool_t);
115 __sv_f64_t _ZGVsMxv_log10 (__sv_f64_t, __sv_bool_t);
116 __sv_f64_t _ZGVsMxv_log1p (__sv_f64_t, __sv_bool_t);
117 __sv_f64_t _ZGVsMxv_log2 (__sv_f64_t, __sv_bool_t);
118 __sv_f64_t _ZGVsMxv_sin (__sv_f64_t, __sv_bool_t);
119 __sv_f64_t _ZGVsMxv_tan (__sv_f64_t, __sv_bool_t);
/* The feature macro has done its job of gating this section; drop it.  */
121 # undef __SVE_VEC_MATH_SUPPORTED
122 #endif /* __SVE_VEC_MATH_SUPPORTED */