diff options
author | jiwang <jiwang@138bc75d-0d04-0410-961f-82ee72b054a4> | 2016-07-25 16:13:22 +0000 |
---|---|---|
committer | jiwang <jiwang@138bc75d-0d04-0410-961f-82ee72b054a4> | 2016-07-25 16:13:22 +0000 |
commit | 1c14d8edb192765e9cd60651414fc4ac3050301e (patch) | |
tree | 4c422015c975da2319df4e6bea103ae1781e7450 /gcc | |
parent | 90a2895e02c3a7d9b1ad67557ba3aaf2faa94daa (diff) | |
download | gcc-1c14d8edb192765e9cd60651414fc4ac3050301e.tar.gz |
[AArch64][9/10] ARMv8.2-A FP16 three operands scalar intrinsics
gcc/
* config/aarch64/aarch64-simd-builtins.def: Register new builtins.
* config/aarch64/aarch64.md (fma, fnma): Support HF.
* config/aarch64/arm_fp16.h (vfmah_f16, vfmsh_f16): New.
git-svn-id: svn+ssh://gcc.gnu.org/svn/gcc/trunk@238724 138bc75d-0d04-0410-961f-82ee72b054a4
Diffstat (limited to 'gcc')
-rw-r--r-- | gcc/ChangeLog | 6 | ||||
-rw-r--r-- | gcc/config/aarch64/aarch64-simd-builtins.def | 2 | ||||
-rw-r--r-- | gcc/config/aarch64/aarch64.md | 21 | ||||
-rw-r--r-- | gcc/config/aarch64/arm_fp16.h | 14 |
4 files changed, 33 insertions, 10 deletions
diff --git a/gcc/ChangeLog b/gcc/ChangeLog index 3bef6f026f6..c1da62a26fe 100644 --- a/gcc/ChangeLog +++ b/gcc/ChangeLog @@ -1,6 +1,12 @@ 2016-07-25 Jiong Wang <jiong.wang@arm.com> * config/aarch64/aarch64-simd-builtins.def: Register new builtins. + * config/aarch64/aarch64.md (fma, fnma): Support HF. + * config/aarch64/arm_fp16.h (vfmah_f16, vfmsh_f16): New. + +2016-07-25 Jiong Wang <jiong.wang@arm.com> + + * config/aarch64/aarch64-simd-builtins.def: Register new builtins. * config/aarch64/aarch64.md (<FCVT_F2FIXED:fcvt_fixed_insn>hf<mode>3): New. (<FCVT_FIXED2F:fcvt_fixed_insn><mode>hf3): Likewise. diff --git a/gcc/config/aarch64/aarch64-simd-builtins.def b/gcc/config/aarch64/aarch64-simd-builtins.def index 31abc077859..c7fe08bb21a 100644 --- a/gcc/config/aarch64/aarch64-simd-builtins.def +++ b/gcc/config/aarch64/aarch64-simd-builtins.def @@ -422,8 +422,10 @@ /* Implemented by fma<mode>4. */ BUILTIN_VHSDF (TERNOP, fma, 4) + VAR1 (TERNOP, fma, 4, hf) /* Implemented by fnma<mode>4. */ BUILTIN_VHSDF (TERNOP, fnma, 4) + VAR1 (TERNOP, fnma, 4, hf) /* Implemented by aarch64_simd_bsl<mode>. */ BUILTIN_VDQQH (BSL_P, simd_bsl, 0) diff --git a/gcc/config/aarch64/aarch64.md b/gcc/config/aarch64/aarch64.md index 6d0a9dcf90c..7d8b3943100 100644 --- a/gcc/config/aarch64/aarch64.md +++ b/gcc/config/aarch64/aarch64.md @@ -4492,23 +4492,24 @@ ;; fma - no throw (define_insn "fma<mode>4" - [(set (match_operand:GPF 0 "register_operand" "=w") - (fma:GPF (match_operand:GPF 1 "register_operand" "w") - (match_operand:GPF 2 "register_operand" "w") - (match_operand:GPF 3 "register_operand" "w")))] + [(set (match_operand:GPF_F16 0 "register_operand" "=w") + (fma:GPF_F16 (match_operand:GPF_F16 1 "register_operand" "w") + (match_operand:GPF_F16 2 "register_operand" "w") + (match_operand:GPF_F16 3 "register_operand" "w")))] "TARGET_FLOAT" "fmadd\\t%<s>0, %<s>1, %<s>2, %<s>3" - [(set_attr "type" "fmac<s>")] + [(set_attr "type" "fmac<stype>")] ) (define_insn "fnma<mode>4" - [(set (match_operand:GPF 0 "register_operand" "=w") - (fma:GPF (neg:GPF (match_operand:GPF 1 "register_operand" "w")) - (match_operand:GPF 2 "register_operand" "w") - (match_operand:GPF 3 "register_operand" "w")))] + [(set (match_operand:GPF_F16 0 "register_operand" "=w") + (fma:GPF_F16 + (neg:GPF_F16 (match_operand:GPF_F16 1 "register_operand" "w")) + (match_operand:GPF_F16 2 "register_operand" "w") + (match_operand:GPF_F16 3 "register_operand" "w")))] "TARGET_FLOAT" "fmsub\\t%<s>0, %<s>1, %<s>2, %<s>3" - [(set_attr "type" "fmac<s>")] + [(set_attr "type" "fmac<stype>")] ) (define_insn "fms<mode>4" diff --git a/gcc/config/aarch64/arm_fp16.h b/gcc/config/aarch64/arm_fp16.h index 21edc656953..4b7c2dd3bcc 100644 --- a/gcc/config/aarch64/arm_fp16.h +++ b/gcc/config/aarch64/arm_fp16.h @@ -560,6 +560,20 @@ vsubh_f16 (float16_t __a, float16_t __b) return __a - __b; } +/* ARMv8.2-A FP16 three operands scalar intrinsics. */ + +__extension__ static __inline float16_t __attribute__ ((__always_inline__)) +vfmah_f16 (float16_t __a, float16_t __b, float16_t __c) +{ + return __builtin_aarch64_fmahf (__b, __c, __a); +} + +__extension__ static __inline float16_t __attribute__ ((__always_inline__)) +vfmsh_f16 (float16_t __a, float16_t __b, float16_t __c) +{ + return __builtin_aarch64_fnmahf (__b, __c, __a); +} + #pragma GCC pop_options #endif |