diff options
author | Yunlian Jiang <yunlian@google.com> | 2018-04-24 22:15:37 -0700 |
---|---|---|
committer | Yunlian Jiang <yunlian@google.com> | 2018-04-24 22:15:37 -0700 |
commit | 71959ce8f47f676a26bb21da7117101d9d73867e (patch) | |
tree | c9c8f11d31a4a22bb04fa5798311919929ffafb0 /gcc-4.9/gcc/config/aarch64/arm_neon.h | |
parent | e46354e85363dbd7ea85492f70af89273881709f (diff) | |
download | toolchain_gcc-71959ce8f47f676a26bb21da7117101d9d73867e.tar.gz toolchain_gcc-71959ce8f47f676a26bb21da7117101d9d73867e.tar.bz2 toolchain_gcc-71959ce8f47f676a26bb21da7117101d9d73867e.zip |
gcc: backport patch to support vrnd<*>_f64 aarch64 intrinsics.
This backports upstream patch to add support of vrdn<*>_f64 intrinisics
for aarch64. This is needed because glibc 2.27 uses some of them.
Author: mshawcroft <mshawcroft@138bc75d-0d04-0410-961f-82ee72b054a4>
Date: Tue Apr 22 08:39:48 2014 +0000
[AArch64] vrnd<*>_f64 patch
This patch adds vrnd<*>_f64 aarch64 intrinsics. A testcase for those
intrinsics is added. Run a complete LE and BE regression run with no
regressions.
BUG=chromium:834385
TEST=./setup_board --board kevin --nousepkg
cross-aarch64-cros-linux-gnu-glibc builds for glibc 2.27
Change-Id: Iaf9508a433e35d3304e44ac4b6c93071ff6c5ec0
Diffstat (limited to 'gcc-4.9/gcc/config/aarch64/arm_neon.h')
-rw-r--r-- | gcc-4.9/gcc/config/aarch64/arm_neon.h | 43 |
1 files changed, 43 insertions, 0 deletions
diff --git a/gcc-4.9/gcc/config/aarch64/arm_neon.h b/gcc-4.9/gcc/config/aarch64/arm_neon.h index ae0ae9c1b..03addc955 100644 --- a/gcc-4.9/gcc/config/aarch64/arm_neon.h +++ b/gcc-4.9/gcc/config/aarch64/arm_neon.h @@ -22469,6 +22469,12 @@ vrnd_f32 (float32x2_t __a) return __builtin_aarch64_btruncv2sf (__a); } +__extension__ static __inline float64x1_t __attribute__ ((__always_inline__)) +vrnd_f64 (float64x1_t __a) +{ + return vset_lane_f64 (__builtin_trunc (vget_lane_f64 (__a, 0)), __a, 0); +} + __extension__ static __inline float32x4_t __attribute__ ((__always_inline__)) vrndq_f32 (float32x4_t __a) { @@ -22489,6 +22495,12 @@ vrnda_f32 (float32x2_t __a) return __builtin_aarch64_roundv2sf (__a); } +__extension__ static __inline float64x1_t __attribute__ ((__always_inline__)) +vrnda_f64 (float64x1_t __a) +{ + return vset_lane_f64 (__builtin_round (vget_lane_f64 (__a, 0)), __a, 0); +} + __extension__ static __inline float32x4_t __attribute__ ((__always_inline__)) vrndaq_f32 (float32x4_t __a) { @@ -22509,6 +22521,12 @@ vrndi_f32 (float32x2_t __a) return __builtin_aarch64_nearbyintv2sf (__a); } +__extension__ static __inline float64x1_t __attribute__ ((__always_inline__)) +vrndi_f64 (float64x1_t __a) +{ + return vset_lane_f64 (__builtin_nearbyint (vget_lane_f64 (__a, 0)), __a, 0); +} + __extension__ static __inline float32x4_t __attribute__ ((__always_inline__)) vrndiq_f32 (float32x4_t __a) { @@ -22529,6 +22547,12 @@ vrndm_f32 (float32x2_t __a) return __builtin_aarch64_floorv2sf (__a); } +__extension__ static __inline float64x1_t __attribute__ ((__always_inline__)) +vrndm_f64 (float64x1_t __a) +{ + return vset_lane_f64 (__builtin_floor (vget_lane_f64 (__a, 0)), __a, 0); +} + __extension__ static __inline float32x4_t __attribute__ ((__always_inline__)) vrndmq_f32 (float32x4_t __a) { @@ -22548,6 +22572,13 @@ vrndn_f32 (float32x2_t __a) { return __builtin_aarch64_frintnv2sf (__a); } + +__extension__ static __inline float64x1_t __attribute__ ((__always_inline__)) +vrndn_f64 (float64x1_t __a) +{ + return __builtin_aarch64_frintndf (__a); +} + __extension__ static __inline float32x4_t __attribute__ ((__always_inline__)) vrndnq_f32 (float32x4_t __a) { @@ -22568,6 +22599,12 @@ vrndp_f32 (float32x2_t __a) return __builtin_aarch64_ceilv2sf (__a); } +__extension__ static __inline float64x1_t __attribute__ ((__always_inline__)) +vrndp_f64 (float64x1_t __a) +{ + return vset_lane_f64 (__builtin_ceil (vget_lane_f64 (__a, 0)), __a, 0); +} + __extension__ static __inline float32x4_t __attribute__ ((__always_inline__)) vrndpq_f32 (float32x4_t __a) { @@ -22588,6 +22625,12 @@ vrndx_f32 (float32x2_t __a) return __builtin_aarch64_rintv2sf (__a); } +__extension__ static __inline float64x1_t __attribute__ ((__always_inline__)) +vrndx_f64 (float64x1_t __a) +{ + return vset_lane_f64 (__builtin_rint (vget_lane_f64 (__a, 0)), __a, 0); +} + __extension__ static __inline float32x4_t __attribute__ ((__always_inline__)) vrndxq_f32 (float32x4_t __a) { |