From de6f79d955fdc946834b7084383a885415c5d983 Mon Sep 17 00:00:00 2001 From: Paul Brook Date: Mon, 2 Nov 2009 13:43:59 +0000 Subject: [PATCH] 2009-11-02 Paul Brook ld/testsuite/ * ld-arm/arm-elf.exp: Add new attr-merge-vfp tests. * ld-arm/attr-merge-vfp-1.d: New test. * ld-arm/attr-merge-vfp-1r.d: New test. * ld-arm/attr-merge-vfp-2.d: New test. * ld-arm/attr-merge-vfp-2r.d: New test. * ld-arm/attr-merge-vfp-3.d: New test. * ld-arm/attr-merge-vfp-3r.d: New test. * ld-arm/attr-merge-vfp-4.d: New test. * ld-arm/attr-merge-vfp-4r.d: New test. * ld-arm/attr-merge-vfp-5.d: New test. * ld-arm/attr-merge-vfp-5r.d: New test. * ld-arm/attr-merge-vfp-2.s: New test. * ld-arm/attr-merge-vfp-3.s: New test. * ld-arm/attr-merge-vfp-3-d16.s: New test. * ld-arm/attr-merge-vfp-4.s: New test. * ld-arm/attr-merge-vfp-4-d16.s: New test. gas/ * doc/c-arm.texi: Document new -mfpu options. * config/tc-arm.c (fpu_vfp_ext_v3xd, fpu_vfp_fp16, fpu_neon_ext_fma, fpu_vfp_ext_fma): New. (NEON_ENC_TAB): Add vfma, vfms, vfnma and vfnms. (do_vfp_nsyn_fma_fms, do_neon_fmac): New functions. (insns): Move double precision load/store. Split out double precision VFPv3 instrucitons. Add VFPv4 instructions. (arm_fpus): Add VFPv3-FP16, VFPv3xD and VFPv4 variants. (aeabi_set_public_attributes): Set VFPv4 variants gas/testsuite/ * gas/arm/attr-mfpu-vfpv4.d: New test. * gas/arm/attr-mfpu-vfpv4-d16.d: New test. * gas/arm/neon-fma-cov.d: New test. * gas/arm/neon-fma-cov.s: New test. * gas/arm/vfp-fma-inc.s: New test. * gas/arm/vfp-fma-arm.d: New test. * gas/arm/vfp-fma-arm.s: New test. * gas/arm/vfp-fma-thumb.d: New test. * gas/arm/vfp-fma-thumb.s: New test. * gas/arm/vfma1.d: New test. * gas/arm/vfma1.s: New test. * gas/arm/vfpv3xd.d: New test. * gas/arm/vfpv3xd.s: New test. include/opcode/ * arm.h (FPU_VFP_EXT_V3xD, FPU_VFP_EXT_FP16, FPU_NEON_EXT_FMA, FPU_VFP_EXT_FMA, FPU_VFP_V3xD, FPU_VFP_V4D16, FPU_VFP_V4): Define. (FPU_ARCH_VFP_V3D16_FP16, FPU_ARCH_VFP_V3_FP16, FPU_ARCH_VFP_V3xD, FPU_ARCH_VFP_V3xD_FP16, FPU_ARCH_VFP_V4, FPU_ARCH_VFP_V4D16, FPU_ARCH_NEON_VFP_V4): Define. binutils/ * readelf.c (arm_attr_tag_VFP_arch): Add VFPv4 and VFPv4-D16. bfd/ * elf32-arm.c (elf32_arm_merge_eabi_attributes): Handle VFPv4 attributes. opcodes/ * arm-dis.c (coprocessor_opcodes): Update to use new feature flags. Add VFPv4 instructions. --- bfd/ChangeLog | 5 ++ bfd/elf32-arm.c | 52 +++++++++-- binutils/ChangeLog | 4 + binutils/readelf.c | 2 +- gas/ChangeLog | 12 +++ gas/config/tc-arm.c | 135 ++++++++++++++++++++++------ gas/doc/c-arm.texi | 17 ++-- gas/testsuite/ChangeLog | 16 ++++ gas/testsuite/gas/arm/attr-mfpu-vfpv4-d16.d | 13 +++ gas/testsuite/gas/arm/attr-mfpu-vfpv4.d | 13 +++ gas/testsuite/gas/arm/neon-fma-cov.d | 13 +++ gas/testsuite/gas/arm/neon-fma-cov.s | 12 +++ gas/testsuite/gas/arm/vfma1.d | 34 +++++++ gas/testsuite/gas/arm/vfma1.s | 43 +++++++++ gas/testsuite/gas/arm/vfp-fma-arm.d | 23 +++++ gas/testsuite/gas/arm/vfp-fma-arm.s | 2 + gas/testsuite/gas/arm/vfp-fma-inc.s | 20 +++++ gas/testsuite/gas/arm/vfp-fma-thumb.d | 27 ++++++ gas/testsuite/gas/arm/vfp-fma-thumb.s | 2 + gas/testsuite/gas/arm/vfpv3xd.d | 23 +++++ gas/testsuite/gas/arm/vfpv3xd.s | 19 ++++ include/opcode/ChangeLog | 8 ++ include/opcode/arm.h | 28 ++++-- ld/testsuite/ChangeLog | 19 ++++ ld/testsuite/ld-arm/arm-elf.exp | 10 +++ ld/testsuite/ld-arm/attr-merge-vfp-1.d | 13 +++ ld/testsuite/ld-arm/attr-merge-vfp-1r.d | 13 +++ ld/testsuite/ld-arm/attr-merge-vfp-2.d | 13 +++ ld/testsuite/ld-arm/attr-merge-vfp-2.s | 2 + ld/testsuite/ld-arm/attr-merge-vfp-2r.d | 13 +++ ld/testsuite/ld-arm/attr-merge-vfp-3-d16.s | 2 + ld/testsuite/ld-arm/attr-merge-vfp-3.d | 14 +++ ld/testsuite/ld-arm/attr-merge-vfp-3.s | 2 + ld/testsuite/ld-arm/attr-merge-vfp-3r.d | 14 +++ ld/testsuite/ld-arm/attr-merge-vfp-4-d16.s | 2 + ld/testsuite/ld-arm/attr-merge-vfp-4.d | 14 +++ ld/testsuite/ld-arm/attr-merge-vfp-4.s | 2 + ld/testsuite/ld-arm/attr-merge-vfp-4r.d | 14 +++ ld/testsuite/ld-arm/attr-merge-vfp-5.d | 14 +++ ld/testsuite/ld-arm/attr-merge-vfp-5r.d | 14 +++ opcodes/ChangeLog | 5 ++ opcodes/arm-dis.c | 28 ++++-- 42 files changed, 679 insertions(+), 52 deletions(-) create mode 100644 gas/testsuite/gas/arm/attr-mfpu-vfpv4-d16.d create mode 100644 gas/testsuite/gas/arm/attr-mfpu-vfpv4.d create mode 100644 gas/testsuite/gas/arm/neon-fma-cov.d create mode 100644 gas/testsuite/gas/arm/neon-fma-cov.s create mode 100644 gas/testsuite/gas/arm/vfma1.d create mode 100644 gas/testsuite/gas/arm/vfma1.s create mode 100644 gas/testsuite/gas/arm/vfp-fma-arm.d create mode 100644 gas/testsuite/gas/arm/vfp-fma-arm.s create mode 100644 gas/testsuite/gas/arm/vfp-fma-inc.s create mode 100644 gas/testsuite/gas/arm/vfp-fma-thumb.d create mode 100644 gas/testsuite/gas/arm/vfp-fma-thumb.s create mode 100644 gas/testsuite/gas/arm/vfpv3xd.d create mode 100644 gas/testsuite/gas/arm/vfpv3xd.s create mode 100644 ld/testsuite/ld-arm/attr-merge-vfp-1.d create mode 100644 ld/testsuite/ld-arm/attr-merge-vfp-1r.d create mode 100644 ld/testsuite/ld-arm/attr-merge-vfp-2.d create mode 100644 ld/testsuite/ld-arm/attr-merge-vfp-2.s create mode 100644 ld/testsuite/ld-arm/attr-merge-vfp-2r.d create mode 100644 ld/testsuite/ld-arm/attr-merge-vfp-3-d16.s create mode 100644 ld/testsuite/ld-arm/attr-merge-vfp-3.d create mode 100644 ld/testsuite/ld-arm/attr-merge-vfp-3.s create mode 100644 ld/testsuite/ld-arm/attr-merge-vfp-3r.d create mode 100644 ld/testsuite/ld-arm/attr-merge-vfp-4-d16.s create mode 100644 ld/testsuite/ld-arm/attr-merge-vfp-4.d create mode 100644 ld/testsuite/ld-arm/attr-merge-vfp-4.s create mode 100644 ld/testsuite/ld-arm/attr-merge-vfp-4r.d create mode 100644 ld/testsuite/ld-arm/attr-merge-vfp-5.d create mode 100644 ld/testsuite/ld-arm/attr-merge-vfp-5r.d diff --git a/bfd/ChangeLog b/bfd/ChangeLog index 52265cb3db..ce48a24ec6 100644 --- a/bfd/ChangeLog +++ b/bfd/ChangeLog @@ -1,3 +1,8 @@ +2009-11-02 Paul Brook + + * elf32-arm.c (elf32_arm_merge_eabi_attributes): Handle VFPv4 + attributes. + 2009-11-02 Alan Modra * elflink.c (elf_link_add_object_symbols): Don't force debug diff --git a/bfd/elf32-arm.c b/bfd/elf32-arm.c index b449ee8333..caa3bd2006 100644 --- a/bfd/elf32-arm.c +++ b/bfd/elf32-arm.c @@ -9730,8 +9730,6 @@ elf32_arm_merge_eabi_attributes (bfd *ibfd, bfd *obfd) /* Some tags have 0 = don't care, 1 = strong requirement, 2 = weak requirement. */ static const int order_021[3] = {0, 2, 1}; - /* For use with Tag_VFP_arch. */ - static const int order_01243[5] = {0, 1, 2, 4, 3}; int i; bfd_boolean result = TRUE; @@ -9923,12 +9921,50 @@ elf32_arm_merge_eabi_attributes (bfd *ibfd, bfd *obfd) } break; case Tag_VFP_arch: - /* Use the "greatest" from the sequence 0, 1, 2, 4, 3, or the - largest value if greater than 4 (for future-proofing). */ - if ((in_attr[i].i > 4 && in_attr[i].i > out_attr[i].i) - || (in_attr[i].i <= 4 && out_attr[i].i <= 4 - && order_01243[in_attr[i].i] > order_01243[out_attr[i].i])) - out_attr[i].i = in_attr[i].i; + { + static const struct + { + int ver; + int regs; + } vfp_versions[7] = + { + {0, 0}, + {1, 16}, + {2, 16}, + {3, 32}, + {3, 16}, + {4, 32}, + {4, 16} + }; + int ver; + int regs; + int newval; + + /* Values greater than 6 aren't defined, so just pick the + biggest */ + if (in_attr[i].i > 6 && in_attr[i].i > out_attr[i].i) + { + out_attr[i] = in_attr[i]; + break; + } + /* The output uses the superset of input features + (ISA version) and registers. */ + ver = vfp_versions[in_attr[i].i].ver; + if (ver < vfp_versions[out_attr[i].i].ver) + ver = vfp_versions[out_attr[i].i].ver; + regs = vfp_versions[in_attr[i].i].regs; + if (regs < vfp_versions[out_attr[i].i].regs) + regs = vfp_versions[out_attr[i].i].regs; + /* This assumes all possible supersets are also a valid + options. */ + for (newval = 6; newval > 0; newval--) + { + if (regs == vfp_versions[newval].regs + && ver == vfp_versions[newval].ver) + break; + } + out_attr[i].i = newval; + } break; case Tag_PCS_config: if (out_attr[i].i == 0) diff --git a/binutils/ChangeLog b/binutils/ChangeLog index e23e18f4d7..393a723569 100644 --- a/binutils/ChangeLog +++ b/binutils/ChangeLog @@ -1,3 +1,7 @@ +2009-11-02 Paul Brook + + * readelf.c (arm_attr_tag_VFP_arch): Add VFPv4 and VFPv4-D16. + 2009-10-28 Kai Tietz * dlltool.c (leading_underscore): New local variable. diff --git a/binutils/readelf.c b/binutils/readelf.c index d0c8b38f87..38a19a7adf 100644 --- a/binutils/readelf.c +++ b/binutils/readelf.c @@ -8967,7 +8967,7 @@ static const char * arm_attr_tag_ARM_ISA_use[] = {"No", "Yes"}; static const char * arm_attr_tag_THUMB_ISA_use[] = {"No", "Thumb-1", "Thumb-2"}; static const char * arm_attr_tag_VFP_arch[] = - {"No", "VFPv1", "VFPv2", "VFPv3", "VFPv3-D16"}; + {"No", "VFPv1", "VFPv2", "VFPv3", "VFPv3-D16", "VFPv4", "VFPv4-D16"}; static const char * arm_attr_tag_WMMX_arch[] = {"No", "WMMXv1", "WMMXv2"}; static const char * arm_attr_tag_Advanced_SIMD_arch[] = {"No", "NEONv1"}; static const char * arm_attr_tag_PCS_config[] = diff --git a/gas/ChangeLog b/gas/ChangeLog index 3eb9ce08df..c562391a9a 100644 --- a/gas/ChangeLog +++ b/gas/ChangeLog @@ -1,3 +1,15 @@ +2009-11-02 Paul Brook + + * doc/c-arm.texi: Document new -mfpu options. + * config/tc-arm.c (fpu_vfp_ext_v3xd, fpu_vfp_fp16, fpu_neon_ext_fma, + fpu_vfp_ext_fma): New. + (NEON_ENC_TAB): Add vfma, vfms, vfnma and vfnms. + (do_vfp_nsyn_fma_fms, do_neon_fmac): New functions. + (insns): Move double precision load/store. Split out double + precision VFPv3 instrucitons. Add VFPv4 instructions. + (arm_fpus): Add VFPv3-FP16, VFPv3xD and VFPv4 variants. + (aeabi_set_public_attributes): Set VFPv4 variants + 2009-11-02 Alan Modra * ecoff.c (ecoff_symbol_clone_hook): New function. diff --git a/gas/config/tc-arm.c b/gas/config/tc-arm.c index 52242a81a4..6da0462b07 100644 --- a/gas/config/tc-arm.c +++ b/gas/config/tc-arm.c @@ -216,13 +216,16 @@ static const arm_feature_set fpu_vfp_ext_v1xd = ARM_FEATURE (0, FPU_VFP_EXT_V1xD); static const arm_feature_set fpu_vfp_ext_v1 = ARM_FEATURE (0, FPU_VFP_EXT_V1); static const arm_feature_set fpu_vfp_ext_v2 = ARM_FEATURE (0, FPU_VFP_EXT_V2); +static const arm_feature_set fpu_vfp_ext_v3xd = ARM_FEATURE (0, FPU_VFP_EXT_V3xD); static const arm_feature_set fpu_vfp_ext_v3 = ARM_FEATURE (0, FPU_VFP_EXT_V3); static const arm_feature_set fpu_vfp_ext_d32 = ARM_FEATURE (0, FPU_VFP_EXT_D32); static const arm_feature_set fpu_neon_ext_v1 = ARM_FEATURE (0, FPU_NEON_EXT_V1); static const arm_feature_set fpu_vfp_v3_or_neon_ext = ARM_FEATURE (0, FPU_NEON_EXT_V1 | FPU_VFP_EXT_V3); -static const arm_feature_set fpu_neon_fp16 = ARM_FEATURE (0, FPU_NEON_FP16); +static const arm_feature_set fpu_vfp_fp16 = ARM_FEATURE (0, FPU_VFP_EXT_FP16); +static const arm_feature_set fpu_neon_ext_fma = ARM_FEATURE (0, FPU_NEON_EXT_FMA); +static const arm_feature_set fpu_vfp_ext_fma = ARM_FEATURE (0, FPU_VFP_EXT_FMA); static int mfloat_abi_opt = -1; /* Record user cpu selection for object attributes. */ @@ -11293,6 +11296,8 @@ struct neon_tab_entry vcge / vcgt with the operands reversed. */ \ X(vclt, 0x0000300, 0x1200e00, 0x1b10200), \ X(vcle, 0x0000310, 0x1000e00, 0x1b10180), \ + X(vfma, N_INV, 0x0000c10, N_INV), \ + X(vfms, N_INV, 0x0200c10, N_INV), \ X(vmla, 0x0000900, 0x0000d10, 0x0800040), \ X(vmls, 0x1000900, 0x0200d10, 0x0800440), \ X(vmul, 0x0000910, 0x1000d10, 0x0800840), \ @@ -11330,6 +11335,8 @@ struct neon_tab_entry X(vnmul, 0xe200a40, 0xe200b40, N_INV), \ X(vnmla, 0xe100a40, 0xe100b40, N_INV), \ X(vnmls, 0xe100a00, 0xe100b00, N_INV), \ + X(vfnma, 0xe900a40, 0xe900b40, N_INV), \ + X(vfnms, 0xe900a00, 0xe900b00, N_INV), \ X(vcmp, 0xeb40a40, 0xeb40b40, N_INV), \ X(vcmpz, 0xeb50a40, 0xeb50b40, N_INV), \ X(vcmpe, 0xeb40ac0, 0xeb40bc0, N_INV), \ @@ -12149,6 +12156,27 @@ do_vfp_nsyn_mla_mls (enum neon_shape rs) } static void +do_vfp_nsyn_fma_fms (enum neon_shape rs) +{ + int is_fma = (inst.instruction & 0x0fffffff) == N_MNEM_vfma; + + if (rs == NS_FFF) + { + if (is_fma) + do_vfp_nsyn_opcode ("ffmas"); + else + do_vfp_nsyn_opcode ("ffnmas"); + } + else + { + if (is_fma) + do_vfp_nsyn_opcode ("ffmad"); + else + do_vfp_nsyn_opcode ("ffnmad"); + } +} + +static void do_vfp_nsyn_mul (enum neon_shape rs) { if (rs == NS_FFF) @@ -13116,6 +13144,18 @@ do_neon_mac_maybe_scalar (void) } static void +do_neon_fmac (void) +{ + if (try_vfp_nsyn (3, do_vfp_nsyn_fma_fms) == SUCCESS) + return; + + if (vfp_or_neon_is_neon (NEON_CHECK_CC | NEON_CHECK_ARCH) == FAIL) + return; + + neon_dyadic_misc (NT_untyped, N_IF_32, 0); +} + +static void do_neon_tst (void) { enum neon_shape rs = neon_select_shape (NS_DDD, NS_QQQ, NS_NULL); @@ -17179,6 +17219,19 @@ static const struct asm_opcode insns[] = cCE("fcmpes", eb40ac0, 2, (RVS, RVS), vfp_sp_monadic), cCE("fcmpezs", eb50ac0, 1, (RVS), vfp_sp_compare_z), + /* Double precision load/store are still present on single precision + implementations. */ + cCE("fldd", d100b00, 2, (RVD, ADDRGLDC), vfp_dp_ldst), + cCE("fstd", d000b00, 2, (RVD, ADDRGLDC), vfp_dp_ldst), + cCE("fldmiad", c900b00, 2, (RRw, VRDLST), vfp_dp_ldstmia), + cCE("fldmfdd", c900b00, 2, (RRw, VRDLST), vfp_dp_ldstmia), + cCE("fldmdbd", d300b00, 2, (RRw, VRDLST), vfp_dp_ldstmdb), + cCE("fldmead", d300b00, 2, (RRw, VRDLST), vfp_dp_ldstmdb), + cCE("fstmiad", c800b00, 2, (RRw, VRDLST), vfp_dp_ldstmia), + cCE("fstmead", c800b00, 2, (RRw, VRDLST), vfp_dp_ldstmia), + cCE("fstmdbd", d200b00, 2, (RRw, VRDLST), vfp_dp_ldstmdb), + cCE("fstmfdd", d200b00, 2, (RRw, VRDLST), vfp_dp_ldstmdb), + #undef ARM_VARIANT #define ARM_VARIANT & fpu_vfp_ext_v1 /* VFP V1 (Double precision). */ @@ -17197,18 +17250,6 @@ static const struct asm_opcode insns[] = cCE("ftouid", ebc0b40, 2, (RVS, RVD), vfp_sp_dp_cvt), cCE("ftouizd", ebc0bc0, 2, (RVS, RVD), vfp_sp_dp_cvt), - /* Memory operations. */ - cCE("fldd", d100b00, 2, (RVD, ADDRGLDC), vfp_dp_ldst), - cCE("fstd", d000b00, 2, (RVD, ADDRGLDC), vfp_dp_ldst), - cCE("fldmiad", c900b00, 2, (RRw, VRDLST), vfp_dp_ldstmia), - cCE("fldmfdd", c900b00, 2, (RRw, VRDLST), vfp_dp_ldstmia), - cCE("fldmdbd", d300b00, 2, (RRw, VRDLST), vfp_dp_ldstmdb), - cCE("fldmead", d300b00, 2, (RRw, VRDLST), vfp_dp_ldstmdb), - cCE("fstmiad", c800b00, 2, (RRw, VRDLST), vfp_dp_ldstmia), - cCE("fstmead", c800b00, 2, (RRw, VRDLST), vfp_dp_ldstmia), - cCE("fstmdbd", d200b00, 2, (RRw, VRDLST), vfp_dp_ldstmdb), - cCE("fstmfdd", d200b00, 2, (RRw, VRDLST), vfp_dp_ldstmdb), - /* Monadic operations. */ cCE("fabsd", eb00bc0, 2, (RVD, RVD), vfp_dp_rd_rm), cCE("fnegd", eb10b40, 2, (RVD, RVD), vfp_dp_rd_rm), @@ -17535,29 +17576,52 @@ static const struct asm_opcode insns[] = nUF(vst4, _vst4, 2, (NSTRLST, ADDR), neon_ldx_stx), #undef THUMB_VARIANT +#define THUMB_VARIANT &fpu_vfp_ext_v3xd +#undef ARM_VARIANT +#define ARM_VARIANT &fpu_vfp_ext_v3xd + cCE("fconsts", eb00a00, 2, (RVS, I255), vfp_sp_const), + cCE("fshtos", eba0a40, 2, (RVS, I16z), vfp_sp_conv_16), + cCE("fsltos", eba0ac0, 2, (RVS, I32), vfp_sp_conv_32), + cCE("fuhtos", ebb0a40, 2, (RVS, I16z), vfp_sp_conv_16), + cCE("fultos", ebb0ac0, 2, (RVS, I32), vfp_sp_conv_32), + cCE("ftoshs", ebe0a40, 2, (RVS, I16z), vfp_sp_conv_16), + cCE("ftosls", ebe0ac0, 2, (RVS, I32), vfp_sp_conv_32), + cCE("ftouhs", ebf0a40, 2, (RVS, I16z), vfp_sp_conv_16), + cCE("ftouls", ebf0ac0, 2, (RVS, I32), vfp_sp_conv_32), + +#undef THUMB_VARIANT #define THUMB_VARIANT & fpu_vfp_ext_v3 #undef ARM_VARIANT #define ARM_VARIANT & fpu_vfp_ext_v3 - cCE("fconsts", eb00a00, 2, (RVS, I255), vfp_sp_const), cCE("fconstd", eb00b00, 2, (RVD, I255), vfp_dp_const), - cCE("fshtos", eba0a40, 2, (RVS, I16z), vfp_sp_conv_16), cCE("fshtod", eba0b40, 2, (RVD, I16z), vfp_dp_conv_16), - cCE("fsltos", eba0ac0, 2, (RVS, I32), vfp_sp_conv_32), cCE("fsltod", eba0bc0, 2, (RVD, I32), vfp_dp_conv_32), - cCE("fuhtos", ebb0a40, 2, (RVS, I16z), vfp_sp_conv_16), cCE("fuhtod", ebb0b40, 2, (RVD, I16z), vfp_dp_conv_16), - cCE("fultos", ebb0ac0, 2, (RVS, I32), vfp_sp_conv_32), cCE("fultod", ebb0bc0, 2, (RVD, I32), vfp_dp_conv_32), - cCE("ftoshs", ebe0a40, 2, (RVS, I16z), vfp_sp_conv_16), cCE("ftoshd", ebe0b40, 2, (RVD, I16z), vfp_dp_conv_16), - cCE("ftosls", ebe0ac0, 2, (RVS, I32), vfp_sp_conv_32), cCE("ftosld", ebe0bc0, 2, (RVD, I32), vfp_dp_conv_32), - cCE("ftouhs", ebf0a40, 2, (RVS, I16z), vfp_sp_conv_16), cCE("ftouhd", ebf0b40, 2, (RVD, I16z), vfp_dp_conv_16), - cCE("ftouls", ebf0ac0, 2, (RVS, I32), vfp_sp_conv_32), cCE("ftould", ebf0bc0, 2, (RVD, I32), vfp_dp_conv_32), +#undef ARM_VARIANT +#define ARM_VARIANT &fpu_vfp_ext_fma +#undef THUMB_VARIANT +#define THUMB_VARIANT &fpu_vfp_ext_fma + /* Mnemonics shared by Neon and VFP. These are included in the + VFP FMA variant; NEON and VFP FMA always includes the NEON + FMA instructions. */ + nCEF(vfma, _vfma, 3, (RNSDQ, oRNSDQ, RNSDQ), neon_fmac), + nCEF(vfms, _vfms, 3, (RNSDQ, oRNSDQ, RNSDQ), neon_fmac), + /* ffmas/ffmad/ffmss/ffmsd are dummy mnemonics to satisfy gas; + the v form should always be used. */ + cCE("ffmas", ea00a00, 3, (RVS, RVS, RVS), vfp_sp_dyadic), + cCE("ffnmas", ea00a40, 3, (RVS, RVS, RVS), vfp_sp_dyadic), + cCE("ffmad", ea00b00, 3, (RVD, RVD, RVD), vfp_dp_rd_rn_rm), + cCE("ffnmad", ea00b40, 3, (RVD, RVD, RVD), vfp_dp_rd_rn_rm), + nCE(vfnma, _vfnma, 3, (RVSD, RVSD, RVSD), vfp_nsyn_nmul), + nCE(vfnms, _vfnms, 3, (RVSD, RVSD, RVSD), vfp_nsyn_nmul), + #undef THUMB_VARIANT #undef ARM_VARIANT #define ARM_VARIANT & arm_cext_xscale /* Intel XScale extensions. */ @@ -21967,7 +22031,11 @@ static const struct arm_option_cpu_value_table arm_fpus[] = {"vfpxd", FPU_ARCH_VFP_V1xD}, {"vfpv2", FPU_ARCH_VFP_V2}, {"vfpv3", FPU_ARCH_VFP_V3}, + {"vfpv3-fp16", FPU_ARCH_VFP_V3_FP16}, {"vfpv3-d16", FPU_ARCH_VFP_V3D16}, + {"vfpv3-d16-fp16", FPU_ARCH_VFP_V3D16_FP16}, + {"vfpv3xd", FPU_ARCH_VFP_V3xD}, + {"vfpv3xd-fp16", FPU_ARCH_VFP_V3xD_FP16}, {"arm1020t", FPU_ARCH_VFP_V1}, {"arm1020e", FPU_ARCH_VFP_V2}, {"arm1136jfs", FPU_ARCH_VFP_V2}, @@ -21975,6 +22043,9 @@ static const struct arm_option_cpu_value_table arm_fpus[] = {"maverick", FPU_ARCH_MAVERICK}, {"neon", FPU_ARCH_VFP_V3_PLUS_NEON_V1}, {"neon-fp16", FPU_ARCH_NEON_FP16}, + {"vfpv4", FPU_ARCH_VFP_V4}, + {"vfpv4-d16", FPU_ARCH_VFP_V4D16}, + {"neon-vfpv4", FPU_ARCH_NEON_VFP_V4}, {NULL, ARM_ARCH_NONE} }; @@ -22453,8 +22524,10 @@ aeabi_set_public_attributes (void) } aeabi_set_attribute_string (Tag_CPU_name, p); } + /* Tag_CPU_arch. */ aeabi_set_attribute_int (Tag_CPU_arch, arch); + /* Tag_CPU_arch_profile. */ if (ARM_CPU_HAS_FEATURE (flags, arm_ext_v7a)) aeabi_set_attribute_int (Tag_CPU_arch_profile, 'A'); @@ -22462,17 +22535,24 @@ aeabi_set_public_attributes (void) aeabi_set_attribute_int (Tag_CPU_arch_profile, 'R'); else if (ARM_CPU_HAS_FEATURE (flags, arm_ext_m)) aeabi_set_attribute_int (Tag_CPU_arch_profile, 'M'); + /* Tag_ARM_ISA_use. */ if (ARM_CPU_HAS_FEATURE (flags, arm_ext_v1) || arch == 0) aeabi_set_attribute_int (Tag_ARM_ISA_use, 1); + /* Tag_THUMB_ISA_use. */ if (ARM_CPU_HAS_FEATURE (flags, arm_ext_v4t) || arch == 0) aeabi_set_attribute_int (Tag_THUMB_ISA_use, ARM_CPU_HAS_FEATURE (flags, arm_arch_t2) ? 2 : 1); + /* Tag_VFP_arch. */ - if (ARM_CPU_HAS_FEATURE (flags, fpu_vfp_ext_d32)) + if (ARM_CPU_HAS_FEATURE (flags, fpu_vfp_ext_fma)) + aeabi_set_attribute_int (Tag_VFP_arch, + ARM_CPU_HAS_FEATURE (flags, fpu_vfp_ext_d32) + ? 5 : 6); + else if (ARM_CPU_HAS_FEATURE (flags, fpu_vfp_ext_d32)) aeabi_set_attribute_int (Tag_VFP_arch, 3); else if (ARM_CPU_HAS_FEATURE (flags, fpu_vfp_ext_v3)) aeabi_set_attribute_int (Tag_VFP_arch, 4); @@ -22481,16 +22561,21 @@ aeabi_set_public_attributes (void) else if (ARM_CPU_HAS_FEATURE (flags, fpu_vfp_ext_v1) || ARM_CPU_HAS_FEATURE (flags, fpu_vfp_ext_v1xd)) aeabi_set_attribute_int (Tag_VFP_arch, 1); + /* Tag_WMMX_arch. */ if (ARM_CPU_HAS_FEATURE (flags, arm_cext_iwmmxt2)) aeabi_set_attribute_int (Tag_WMMX_arch, 2); else if (ARM_CPU_HAS_FEATURE (flags, arm_cext_iwmmxt)) aeabi_set_attribute_int (Tag_WMMX_arch, 1); + /* Tag_Advanced_SIMD_arch (formerly Tag_NEON_arch). */ if (ARM_CPU_HAS_FEATURE (flags, fpu_neon_ext_v1)) - aeabi_set_attribute_int (Tag_Advanced_SIMD_arch, 1); + aeabi_set_attribute_int + (Tag_Advanced_SIMD_arch, (ARM_CPU_HAS_FEATURE (flags, fpu_neon_ext_fma) + ? 2 : 1)); + /* Tag_VFP_HP_extension (formerly Tag_NEON_FP16_arch). */ - if (ARM_CPU_HAS_FEATURE (flags, fpu_neon_fp16)) + if (ARM_CPU_HAS_FEATURE (flags, fpu_vfp_fp16)) aeabi_set_attribute_int (Tag_VFP_HP_extension, 1); } diff --git a/gas/doc/c-arm.texi b/gas/doc/c-arm.texi index 2f4bf853bb..eb58a562c7 100644 --- a/gas/doc/c-arm.texi +++ b/gas/doc/c-arm.texi @@ -200,15 +200,22 @@ The following format options are recognized: @code{vfp10-r0}, @code{vfp9}, @code{vfpxd}, -@code{vfpv2} -@code{vfpv3} -@code{vfpv3-d16} +@code{vfpv2}, +@code{vfpv3}, +@code{vfpv3-fp16}, +@code{vfpv3-d16}, +@code{vfpv3-d16-fp16}, +@code{vfpv3xd}, +@code{vfpv3xd-d16}, +@code{vfpv4}, +@code{vfpv4-d16}, @code{arm1020t}, @code{arm1020e}, @code{arm1136jf-s}, -@code{maverick} +@code{maverick}, +@code{neon}, and -@code{neon}. +@code{neon-vfpv4}. In addition to determining which instructions are assembled, this option also affects the way in which the @code{.double} assembler directive behaves diff --git a/gas/testsuite/ChangeLog b/gas/testsuite/ChangeLog index 370438ffe6..d15afcbaed 100644 --- a/gas/testsuite/ChangeLog +++ b/gas/testsuite/ChangeLog @@ -1,3 +1,19 @@ +2009-11-02 Paul Brook + + * gas/arm/attr-mfpu-vfpv4.d: New test. + * gas/arm/attr-mfpu-vfpv4-d16.d: New test. + * gas/arm/neon-fma-cov.d: New test. + * gas/arm/neon-fma-cov.s: New test. + * gas/arm/vfp-fma-inc.s: New test. + * gas/arm/vfp-fma-arm.d: New test. + * gas/arm/vfp-fma-arm.s: New test. + * gas/arm/vfp-fma-thumb.d: New test. + * gas/arm/vfp-fma-thumb.s: New test. + * gas/arm/vfma1.d: New test. + * gas/arm/vfma1.s: New test. + * gas/arm/vfpv3xd.d: New test. + * gas/arm/vfpv3xd.s: New test. + 2009-10-29 Sebastian Pop * gas/i386/fma4.d: Updated patterns. diff --git a/gas/testsuite/gas/arm/attr-mfpu-vfpv4-d16.d b/gas/testsuite/gas/arm/attr-mfpu-vfpv4-d16.d new file mode 100644 index 0000000000..6b3574de77 --- /dev/null +++ b/gas/testsuite/gas/arm/attr-mfpu-vfpv4-d16.d @@ -0,0 +1,13 @@ +# name: attributes for -mfpu=vfpv4-d16 +# source: blank.s +# as: -mfpu=vfpv4-d16 +# readelf: -A +# This test is only valid on EABI based ports. +# target: *-*-*eabi + +Attribute Section: aeabi +File Attributes + Tag_ARM_ISA_use: Yes + Tag_THUMB_ISA_use: Thumb-1 + Tag_VFP_arch: VFPv4-D16 + Tag_VFP_HP_extension: Allowed diff --git a/gas/testsuite/gas/arm/attr-mfpu-vfpv4.d b/gas/testsuite/gas/arm/attr-mfpu-vfpv4.d new file mode 100644 index 0000000000..a3b91a5e65 --- /dev/null +++ b/gas/testsuite/gas/arm/attr-mfpu-vfpv4.d @@ -0,0 +1,13 @@ +# name: attributes for -mfpu=vfpv4 +# source: blank.s +# as: -mfpu=vfpv4 +# readelf: -A +# This test is only valid on EABI based ports. +# target: *-*-*eabi + +Attribute Section: aeabi +File Attributes + Tag_ARM_ISA_use: Yes + Tag_THUMB_ISA_use: Thumb-1 + Tag_VFP_arch: VFPv4 + Tag_VFP_HP_extension: Allowed diff --git a/gas/testsuite/gas/arm/neon-fma-cov.d b/gas/testsuite/gas/arm/neon-fma-cov.d new file mode 100644 index 0000000000..1c51d7bf04 --- /dev/null +++ b/gas/testsuite/gas/arm/neon-fma-cov.d @@ -0,0 +1,13 @@ +# name: Neon FMA instruction coverage +# as: -mfpu=neon-vfpv4 +# objdump: -dr --prefix-addresses --show-raw-insn + +.*: +file format .*arm.* + +Disassembly of section \.text: +0[0-9a-f]+ <[^>]+> f2000c50 vfma\.f32 q0, q0, q0 +0[0-9a-f]+ <[^>]+> f2000c50 vfma\.f32 q0, q0, q0 +0[0-9a-f]+ <[^>]+> f2000c10 vfma\.f32 d0, d0, d0 +0[0-9a-f]+ <[^>]+> f2200c50 vfms\.f32 q0, q0, q0 +0[0-9a-f]+ <[^>]+> f2200c50 vfms\.f32 q0, q0, q0 +0[0-9a-f]+ <[^>]+> f2200c10 vfms\.f32 d0, d0, d0 diff --git a/gas/testsuite/gas/arm/neon-fma-cov.s b/gas/testsuite/gas/arm/neon-fma-cov.s new file mode 100644 index 0000000000..db34807d0b --- /dev/null +++ b/gas/testsuite/gas/arm/neon-fma-cov.s @@ -0,0 +1,12 @@ + .arm + .syntax unified + .text + + .macro regs3_1 op opq vtype + \op\vtype q0,q0,q0 + \opq\vtype q0,q0,q0 + \op\vtype d0,d0,d0 + .endm + + regs3_1 vfma vfma .f32 + regs3_1 vfms vfms .f32 diff --git a/gas/testsuite/gas/arm/vfma1.d b/gas/testsuite/gas/arm/vfma1.d new file mode 100644 index 0000000000..4c638d380b --- /dev/null +++ b/gas/testsuite/gas/arm/vfma1.d @@ -0,0 +1,34 @@ +#objdump: -dr --prefix-addresses --show-raw-insn +#name: VFMA decoding +#as: -mcpu=arm7m + +# Test VFMA instruction disassembly + +.*: *file format .*arm.* + + +Disassembly of section .text: +00000000 <[^>]*> ee000a00 vmla.f32 s0, s0, s0 +00000004 <[^>]*> ee000b00 vmla.f64 d0, d0, d0 +00000008 <[^>]*> f2000d10 vmla.f32 d0, d0, d0 +0000000c <[^>]*> f2000d50 vmla.f32 q0, q0, q0 +00000010 <[^>]*> eea00a00 vfma.f32 s0, s0, s0 +00000014 <[^>]*> eea00b00 vfma.f64 d0, d0, d0 +00000018 <[^>]*> f2000c10 vfma.f32 d0, d0, d0 +0000001c <[^>]*> f2000c50 vfma.f32 q0, q0, q0 +00000020 <[^>]*> ee000a40 vmls.f32 s0, s0, s0 +00000024 <[^>]*> ee000b40 vmls.f64 d0, d0, d0 +00000028 <[^>]*> f2200d10 vmls.f32 d0, d0, d0 +0000002c <[^>]*> f2200d50 vmls.f32 q0, q0, q0 +00000030 <[^>]*> eea00a40 vfms.f32 s0, s0, s0 +00000034 <[^>]*> eea00b40 vfms.f64 d0, d0, d0 +00000038 <[^>]*> f2200c10 vfms.f32 d0, d0, d0 +0000003c <[^>]*> f2200c50 vfms.f32 q0, q0, q0 +00000040 <[^>]*> ee100a40 vnmla.f32 s0, s0, s0 +00000044 <[^>]*> ee100b40 vnmla.f64 d0, d0, d0 +00000048 <[^>]*> ee900a40 vfnma.f32 s0, s0, s0 +0000004c <[^>]*> ee900b40 vfnma.f64 d0, d0, d0 +00000050 <[^>]*> ee100a00 vnmls.f32 s0, s0, s0 +00000054 <[^>]*> ee100b00 vnmls.f64 d0, d0, d0 +00000058 <[^>]*> ee900a00 vfnms.f32 s0, s0, s0 +0000005c <[^>]*> ee900b00 vfnms.f64 d0, d0, d0 diff --git a/gas/testsuite/gas/arm/vfma1.s b/gas/testsuite/gas/arm/vfma1.s new file mode 100644 index 0000000000..bc124f89db --- /dev/null +++ b/gas/testsuite/gas/arm/vfma1.s @@ -0,0 +1,43 @@ + + .eabi_attribute Tag_Advanced_SIMD_arch, 2 + .eabi_attribute Tag_VFP_arch, 6 + + @VMLA + .inst 0xee000a00 @ VFP vmla.f32 s0,s0,s0 + .inst 0xee000b00 @ VFP vmla.f64 d0,d0,d0 + .inst 0xf2000d10 @ NEON vmla.f32 d0,d0,d0 + .inst 0xf2000d50 @ NEON vmla.f32 q0,q0,q0 + + @VFMA new + .inst 0xeea00a00 @ VFP vfma.f32 s0,s0,s0 + .inst 0xeea00b00 @ VFP vfma.f64 d0,d0,d0 + .inst 0xf2000c10 @ NEON vfma.f32 d0,d0,d0 + .inst 0xf2000c50 @ NEON vfma.f32 q0,q0,q0 + + @VMLS + .inst 0xee000a40 @ VFP vmls.F32 s0,s0,s0 + .inst 0xee000b40 @ VFP vmls.F64 d0,d0,d0 + .inst 0xf2200d10 @ NEON vmls.F32 d0,d0,d0 + .inst 0xf2200d50 @ NEON vmls.F32 q0,q0,q0 + + @VFMS new + .inst 0xeea00a40 @ VFP vfms.F32 s0,s0,s0 + .inst 0xeea00b40 @ VFP vfms.F64 d0,d0,d0 + .inst 0xf2200c10 @ NEON vfms.F32 d0,d0,d0 + .inst 0xf2200c50 @ NEON vfms.F32 q0,q0,q0 + + @VNMLA + .inst 0xee100a40 @ VFP vnmla.F32 s0,s0,s0 + .inst 0xee100b40 @ VFP vnmla.F64 d0,d0,d0 + + @VFNMA new + .inst 0xee900a40 @ VFP vfnma.F32 s0,s0,s0 + .inst 0xee900b40 @ VFP vfnma.F64 d0,d0,d0 + + @VNMLS + .inst 0xee100a00 @ VFP vnmls.F32 s0,s0,s0 + .inst 0xee100b00 @ VFP vnmls.F64 d0,d0,d0 + + @VFNMS new + .inst 0xee900a00 @ VFP vfnms.F32 s0,s0,s0 + .inst 0xee900b00 @ VFP vfnms.F64 d0,d0,d0 diff --git a/gas/testsuite/gas/arm/vfp-fma-arm.d b/gas/testsuite/gas/arm/vfp-fma-arm.d new file mode 100644 index 0000000000..6a4f717071 --- /dev/null +++ b/gas/testsuite/gas/arm/vfp-fma-arm.d @@ -0,0 +1,23 @@ +# name: FMA instructions, ARM mode +# as: -mfpu=vfpv4 -I$srcdir/$subdir +# objdump: -dr --prefix-addresses --show-raw-insn + +.*: +file format .*arm.* + +Disassembly of section .text: +0[0-9a-f]+ <[^>]+> eea00a81 vfma\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> eea10b02 vfma\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> 0ea00a81 vfmaeq\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> 0ea10b02 vfmaeq\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> eea00ac1 vfms\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> eea10b42 vfms\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> 0ea00ac1 vfmseq\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> 0ea10b42 vfmseq\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> ee900ac1 vfnma\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> ee910b42 vfnma\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> 0e900ac1 vfnmaeq\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> 0e910b42 vfnmaeq\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> ee900a81 vfnms\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> ee910b02 vfnms\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> 0e900a81 vfnmseq\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> 0e910b02 vfnmseq\.f64 d0, d1, d2 diff --git a/gas/testsuite/gas/arm/vfp-fma-arm.s b/gas/testsuite/gas/arm/vfp-fma-arm.s new file mode 100644 index 0000000000..945926b1ba --- /dev/null +++ b/gas/testsuite/gas/arm/vfp-fma-arm.s @@ -0,0 +1,2 @@ + .arm + .include "vfp-fma-inc.s" diff --git a/gas/testsuite/gas/arm/vfp-fma-inc.s b/gas/testsuite/gas/arm/vfp-fma-inc.s new file mode 100644 index 0000000000..a9dcb1445e --- /dev/null +++ b/gas/testsuite/gas/arm/vfp-fma-inc.s @@ -0,0 +1,20 @@ + .syntax unified + + .include "itblock.s" + +func: + .macro dyadic op cond="" f32=".f32" f64=".f64" + itblock 2 \cond + \op\cond\f32 s0,s1,s2 + \op\cond\f64 d0,d1,d2 + .endm + + .macro dyadic_c op + dyadic \op + dyadic \op eq + .endm + + dyadic_c vfma + dyadic_c vfms + dyadic_c vfnma + dyadic_c vfnms diff --git a/gas/testsuite/gas/arm/vfp-fma-thumb.d b/gas/testsuite/gas/arm/vfp-fma-thumb.d new file mode 100644 index 0000000000..2ee77fd8fb --- /dev/null +++ b/gas/testsuite/gas/arm/vfp-fma-thumb.d @@ -0,0 +1,27 @@ +# name: FMA instructions, Thumb mode +# as: -mfpu=vfpv4 -I$srcdir/$subdir +# objdump: -dr --prefix-addresses --show-raw-insn + +.*: +file format .*arm.* + +Disassembly of section .text: +0[0-9a-f]+ <[^>]+> eea0 0a81 vfma\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> eea1 0b02 vfma\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> bf04 itt eq +0[0-9a-f]+ <[^>]+> eea0 0a81 vfmaeq\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> eea1 0b02 vfmaeq\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> eea0 0ac1 vfms\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> eea1 0b42 vfms\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> bf04 itt eq +0[0-9a-f]+ <[^>]+> eea0 0ac1 vfmseq\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> eea1 0b42 vfmseq\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> ee90 0ac1 vfnma\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> ee91 0b42 vfnma\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> bf04 itt eq +0[0-9a-f]+ <[^>]+> ee90 0ac1 vfnmaeq\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> ee91 0b42 vfnmaeq\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> ee90 0a81 vfnms\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> ee91 0b02 vfnms\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> bf04 itt eq +0[0-9a-f]+ <[^>]+> ee90 0a81 vfnmseq\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> ee91 0b02 vfnmseq\.f64 d0, d1, d2 diff --git a/gas/testsuite/gas/arm/vfp-fma-thumb.s b/gas/testsuite/gas/arm/vfp-fma-thumb.s new file mode 100644 index 0000000000..fa3b79245a --- /dev/null +++ b/gas/testsuite/gas/arm/vfp-fma-thumb.s @@ -0,0 +1,2 @@ + .thumb + .include "vfp-fma-inc.s" diff --git a/gas/testsuite/gas/arm/vfpv3xd.d b/gas/testsuite/gas/arm/vfpv3xd.d new file mode 100644 index 0000000000..508f70f73f --- /dev/null +++ b/gas/testsuite/gas/arm/vfpv3xd.d @@ -0,0 +1,23 @@ +#objdump: -dr --prefix-addresses --show-raw-insn +#name: VFP Double-precision load/store +#as: -mfpu=vfpv3xd + +# Test the ARM VFP Double Precision load/store on single precision FPU + +.*: +file format .*arm.* + +Disassembly of section .text: +0+[0-9a-f]* <[^>]*> ed900b00 vldr d0, \[r0\] +0+[0-9a-f]* <[^>]*> ed800b00 vstr d0, \[r0\] +0+[0-9a-f]* <[^>]*> ec900b02 vldmia r0, {d0} +0+[0-9a-f]* <[^>]*> ec900b02 vldmia r0, {d0} +0+[0-9a-f]* <[^>]*> ecb00b02 vldmia r0!, {d0} +0+[0-9a-f]* <[^>]*> ecb00b02 vldmia r0!, {d0} +0+[0-9a-f]* <[^>]*> ed300b02 vldmdb r0!, {d0} +0+[0-9a-f]* <[^>]*> ed300b02 vldmdb r0!, {d0} +0+[0-9a-f]* <[^>]*> ec800b02 vstmia r0, {d0} +0+[0-9a-f]* <[^>]*> ec800b02 vstmia r0, {d0} +0+[0-9a-f]* <[^>]*> eca00b02 vstmia r0!, {d0} +0+[0-9a-f]* <[^>]*> eca00b02 vstmia r0!, {d0} +0+[0-9a-f]* <[^>]*> ed200b02 vstmdb r0!, {d0} +0+[0-9a-f]* <[^>]*> ed200b02 vstmdb r0!, {d0} diff --git a/gas/testsuite/gas/arm/vfpv3xd.s b/gas/testsuite/gas/arm/vfpv3xd.s new file mode 100644 index 0000000000..a16b969f03 --- /dev/null +++ b/gas/testsuite/gas/arm/vfpv3xd.s @@ -0,0 +1,19 @@ +# Check double precision load/store are allowed on single precision +# implementation + + fldd d0, [r0] + fstd d0, [r0] + + fldmiad r0, {d0} + fldmfdd r0, {d0} + fldmiad r0!, {d0} + fldmfdd r0!, {d0} + fldmdbd r0!, {d0} + fldmead r0!, {d0} + + fstmiad r0, {d0} + fstmead r0, {d0} + fstmiad r0!, {d0} + fstmead r0!, {d0} + fstmdbd r0!, {d0} + fstmfdd r0!, {d0} diff --git a/include/opcode/ChangeLog b/include/opcode/ChangeLog index ec2bf97dda..dacf3ee1c7 100644 --- a/include/opcode/ChangeLog +++ b/include/opcode/ChangeLog @@ -1,3 +1,11 @@ +2009-11-02 Paul Brook + + * arm.h (FPU_VFP_EXT_V3xD, FPU_VFP_EXT_FP16, FPU_NEON_EXT_FMA, + FPU_VFP_EXT_FMA, FPU_VFP_V3xD, FPU_VFP_V4D16, FPU_VFP_V4): Define. + (FPU_ARCH_VFP_V3D16_FP16, FPU_ARCH_VFP_V3_FP16, FPU_ARCH_VFP_V3xD, + FPU_ARCH_VFP_V3xD_FP16, FPU_ARCH_VFP_V4, FPU_ARCH_VFP_V4D16, + FPU_ARCH_NEON_VFP_V4): Define. + 2009-10-23 Doug Evans * cgen-bitset.h: Delete, moved to ../cgen/bitset.h. diff --git a/include/opcode/arm.h b/include/opcode/arm.h index a639a8b041..459a80338b 100644 --- a/include/opcode/arm.h +++ b/include/opcode/arm.h @@ -62,10 +62,13 @@ #define FPU_VFP_EXT_V1xD 0x08000000 /* Base VFP instruction set. */ #define FPU_VFP_EXT_V1 0x04000000 /* Double-precision insns. */ #define FPU_VFP_EXT_V2 0x02000000 /* ARM10E VFPr1. */ -#define FPU_VFP_EXT_V3 0x01000000 /* VFPv3 insns. */ -#define FPU_NEON_EXT_V1 0x00800000 /* Neon (SIMD) insns. */ -#define FPU_VFP_EXT_D32 0x00400000 /* Registers D16-D31. */ -#define FPU_NEON_FP16 0x00200000 /* Half-precision extensions. */ +#define FPU_VFP_EXT_V3xD 0x01000000 /* VFPv3 single-precision. */ +#define FPU_VFP_EXT_V3 0x00800000 /* VFPv3 double-precision. */ +#define FPU_NEON_EXT_V1 0x00400000 /* Neon (SIMD) insns. */ +#define FPU_VFP_EXT_D32 0x00200000 /* Registers D16-D31. */ +#define FPU_VFP_EXT_FP16 0x00100000 /* Half-precision extensions. */ +#define FPU_NEON_EXT_FMA 0x00080000 /* Neon fused multiply-add */ +#define FPU_VFP_EXT_FMA 0x00040000 /* VFP fused multiply-add */ /* Architectures are the sum of the base and extensions. The ARM ARM (rev E) defines the following: ARMv3, ARMv3M, ARMv4xM, ARMv4, ARMv4TxM, ARMv4T, @@ -120,9 +123,13 @@ #define FPU_VFP_V1xD (FPU_VFP_EXT_V1xD | FPU_ENDIAN_PURE) #define FPU_VFP_V1 (FPU_VFP_V1xD | FPU_VFP_EXT_V1) #define FPU_VFP_V2 (FPU_VFP_V1 | FPU_VFP_EXT_V2) -#define FPU_VFP_V3D16 (FPU_VFP_V2 | FPU_VFP_EXT_V3) +#define FPU_VFP_V3D16 (FPU_VFP_V2 | FPU_VFP_EXT_V3xD | FPU_VFP_EXT_V3) #define FPU_VFP_V3 (FPU_VFP_V3D16 | FPU_VFP_EXT_D32) +#define FPU_VFP_V3xD (FPU_VFP_V1xD | FPU_VFP_EXT_V2 | FPU_VFP_EXT_V3xD) +#define FPU_VFP_V4D16 (FPU_VFP_V3D16 | FPU_VFP_EXT_FP16 | FPU_VFP_EXT_FMA) +#define FPU_VFP_V4 (FPU_VFP_V3 | FPU_VFP_EXT_FP16 | FPU_VFP_EXT_FMA) #define FPU_VFP_HARD (FPU_VFP_EXT_V1xD | FPU_VFP_EXT_V1 | FPU_VFP_EXT_V2 \ + | FPU_VFP_EXT_V3xD | FPU_VFP_EXT_FMA | FPU_NEON_EXT_FMA \ | FPU_VFP_EXT_V3 | FPU_NEON_EXT_V1 | FPU_VFP_EXT_D32) #define FPU_FPA (FPU_FPA_EXT_V1 | FPU_FPA_EXT_V2) @@ -136,13 +143,22 @@ #define FPU_ARCH_VFP_V1 ARM_FEATURE (0, FPU_VFP_V1) #define FPU_ARCH_VFP_V2 ARM_FEATURE (0, FPU_VFP_V2) #define FPU_ARCH_VFP_V3D16 ARM_FEATURE (0, FPU_VFP_V3D16) +#define FPU_ARCH_VFP_V3D16_FP16 \ + ARM_FEATURE (0, FPU_VFP_V3D16 | FPU_VFP_EXT_FP16) #define FPU_ARCH_VFP_V3 ARM_FEATURE (0, FPU_VFP_V3) +#define FPU_ARCH_VFP_V3_FP16 ARM_FEATURE (0, FPU_VFP_V3 | FPU_VFP_EXT_FP16) +#define FPU_ARCH_VFP_V3xD ARM_FEATURE (0, FPU_VFP_V3xD) +#define FPU_ARCH_VFP_V3xD_FP16 ARM_FEATURE (0, FPU_VFP_V3xD | FPU_VFP_EXT_FP16) #define FPU_ARCH_NEON_V1 ARM_FEATURE (0, FPU_NEON_EXT_V1) #define FPU_ARCH_VFP_V3_PLUS_NEON_V1 \ ARM_FEATURE (0, FPU_VFP_V3 | FPU_NEON_EXT_V1) #define FPU_ARCH_NEON_FP16 \ - ARM_FEATURE (0, FPU_VFP_V3 | FPU_NEON_EXT_V1 | FPU_NEON_FP16) + ARM_FEATURE (0, FPU_VFP_V3 | FPU_NEON_EXT_V1 | FPU_VFP_EXT_FP16) #define FPU_ARCH_VFP_HARD ARM_FEATURE (0, FPU_VFP_HARD) +#define FPU_ARCH_VFP_V4 ARM_FEATURE(0, FPU_VFP_V4) +#define FPU_ARCH_VFP_V4D16 ARM_FEATURE(0, FPU_VFP_V4D16) +#define FPU_ARCH_NEON_VFP_V4 \ + ARM_FEATURE(0, FPU_VFP_V4 | FPU_NEON_EXT_V1 | FPU_NEON_EXT_FMA) #define FPU_ARCH_ENDIAN_PURE ARM_FEATURE (0, FPU_ENDIAN_PURE) diff --git a/ld/testsuite/ChangeLog b/ld/testsuite/ChangeLog index dcfae5f6bf..a0c73c66cd 100644 --- a/ld/testsuite/ChangeLog +++ b/ld/testsuite/ChangeLog @@ -1,3 +1,22 @@ +2009-11-02 Paul Brook + + * ld-arm/arm-elf.exp: Add new attr-merge-vfp tests. + * ld-arm/attr-merge-vfp-1.d: New test. + * ld-arm/attr-merge-vfp-1r.d: New test. + * ld-arm/attr-merge-vfp-2.d: New test. + * ld-arm/attr-merge-vfp-2r.d: New test. + * ld-arm/attr-merge-vfp-3.d: New test. + * ld-arm/attr-merge-vfp-3r.d: New test. + * ld-arm/attr-merge-vfp-4.d: New test. + * ld-arm/attr-merge-vfp-4r.d: New test. + * ld-arm/attr-merge-vfp-5.d: New test. + * ld-arm/attr-merge-vfp-5r.d: New test. + * ld-arm/attr-merge-vfp-2.s: New test. + * ld-arm/attr-merge-vfp-3.s: New test. + * ld-arm/attr-merge-vfp-3-d16.s: New test. + * ld-arm/attr-merge-vfp-4.s: New test. + * ld-arm/attr-merge-vfp-4-d16.s: New test. + 2009-11-02 Alan Modra * ld-scripts/phdrs3.exp (LDFLAGS): Add "--local-store 0:0" for SPU. diff --git a/ld/testsuite/ld-arm/arm-elf.exp b/ld/testsuite/ld-arm/arm-elf.exp index d88fb37ca1..21ec2254b6 100644 --- a/ld/testsuite/ld-arm/arm-elf.exp +++ b/ld/testsuite/ld-arm/arm-elf.exp @@ -450,3 +450,13 @@ run_dump_test "unwind-2" run_dump_test "unwind-3" run_dump_test "unwind-4" run_dump_test "unwind-5" +run_dump_test "attr-merge-vfp-1" +run_dump_test "attr-merge-vfp-1r" +run_dump_test "attr-merge-vfp-2" +run_dump_test "attr-merge-vfp-2r" +run_dump_test "attr-merge-vfp-3" +run_dump_test "attr-merge-vfp-3r" +run_dump_test "attr-merge-vfp-4" +run_dump_test "attr-merge-vfp-4r" +run_dump_test "attr-merge-vfp-5" +run_dump_test "attr-merge-vfp-5r" diff --git a/ld/testsuite/ld-arm/attr-merge-vfp-1.d b/ld/testsuite/ld-arm/attr-merge-vfp-1.d new file mode 100644 index 0000000000..01ffae5a37 --- /dev/null +++ b/ld/testsuite/ld-arm/attr-merge-vfp-1.d @@ -0,0 +1,13 @@ +#source: attr-merge-vfp-2.s +#source: attr-merge-vfp-3-d16.s +#as: +#ld: -r +#readelf: -A +# This test is only valid on ELF based ports. +# not-target: *-*-*coff *-*-pe *-*-wince *-*-*aout* *-*-netbsd *-*-riscix* + +Attribute Section: aeabi +File Attributes + Tag_ARM_ISA_use: Yes + Tag_THUMB_ISA_use: Thumb-1 + Tag_VFP_arch: VFPv3-D16 diff --git a/ld/testsuite/ld-arm/attr-merge-vfp-1r.d b/ld/testsuite/ld-arm/attr-merge-vfp-1r.d new file mode 100644 index 0000000000..7494cc4ab3 --- /dev/null +++ b/ld/testsuite/ld-arm/attr-merge-vfp-1r.d @@ -0,0 +1,13 @@ +#source: attr-merge-vfp-3-d16.s +#source: attr-merge-vfp-2.s +#as: +#ld: -r +#readelf: -A +# This test is only valid on ELF based ports. +# not-target: *-*-*coff *-*-pe *-*-wince *-*-*aout* *-*-netbsd *-*-riscix* + +Attribute Section: aeabi +File Attributes + Tag_ARM_ISA_use: Yes + Tag_THUMB_ISA_use: Thumb-1 + Tag_VFP_arch: VFPv3-D16 diff --git a/ld/testsuite/ld-arm/attr-merge-vfp-2.d b/ld/testsuite/ld-arm/attr-merge-vfp-2.d new file mode 100644 index 0000000000..b81a9eb98d --- /dev/null +++ b/ld/testsuite/ld-arm/attr-merge-vfp-2.d @@ -0,0 +1,13 @@ +#source: attr-merge-vfp-3.s +#source: attr-merge-vfp-3-d16.s +#as: +#ld: -r +#readelf: -A +# This test is only valid on ELF based ports. +# not-target: *-*-*coff *-*-pe *-*-wince *-*-*aout* *-*-netbsd *-*-riscix* + +Attribute Section: aeabi +File Attributes + Tag_ARM_ISA_use: Yes + Tag_THUMB_ISA_use: Thumb-1 + Tag_VFP_arch: VFPv3 diff --git a/ld/testsuite/ld-arm/attr-merge-vfp-2.s b/ld/testsuite/ld-arm/attr-merge-vfp-2.s new file mode 100644 index 0000000000..32657d3822 --- /dev/null +++ b/ld/testsuite/ld-arm/attr-merge-vfp-2.s @@ -0,0 +1,2 @@ +.fpu vfpv2 + diff --git a/ld/testsuite/ld-arm/attr-merge-vfp-2r.d b/ld/testsuite/ld-arm/attr-merge-vfp-2r.d new file mode 100644 index 0000000000..47758d6410 --- /dev/null +++ b/ld/testsuite/ld-arm/attr-merge-vfp-2r.d @@ -0,0 +1,13 @@ +#source: attr-merge-vfp-3-d16.s +#source: attr-merge-vfp-3.s +#as: +#ld: -r +#readelf: -A +# This test is only valid on ELF based ports. +# not-target: *-*-*coff *-*-pe *-*-wince *-*-*aout* *-*-netbsd *-*-riscix* + +Attribute Section: aeabi +File Attributes + Tag_ARM_ISA_use: Yes + Tag_THUMB_ISA_use: Thumb-1 + Tag_VFP_arch: VFPv3 diff --git a/ld/testsuite/ld-arm/attr-merge-vfp-3-d16.s b/ld/testsuite/ld-arm/attr-merge-vfp-3-d16.s new file mode 100644 index 0000000000..74729e0bc0 --- /dev/null +++ b/ld/testsuite/ld-arm/attr-merge-vfp-3-d16.s @@ -0,0 +1,2 @@ +.fpu vfpv3-d16 + diff --git a/ld/testsuite/ld-arm/attr-merge-vfp-3.d b/ld/testsuite/ld-arm/attr-merge-vfp-3.d new file mode 100644 index 0000000000..36f8947e5d --- /dev/null +++ b/ld/testsuite/ld-arm/attr-merge-vfp-3.d @@ -0,0 +1,14 @@ +#source: attr-merge-vfp-3-d16.s +#source: attr-merge-vfp-4-d16.s +#as: +#ld: -r +#readelf: -A +# This test is only valid on ELF based ports. +# not-target: *-*-*coff *-*-pe *-*-wince *-*-*aout* *-*-netbsd *-*-riscix* + +Attribute Section: aeabi +File Attributes + Tag_ARM_ISA_use: Yes + Tag_THUMB_ISA_use: Thumb-1 + Tag_VFP_arch: VFPv4-D16 + Tag_VFP_HP_extension: Allowed diff --git a/ld/testsuite/ld-arm/attr-merge-vfp-3.s b/ld/testsuite/ld-arm/attr-merge-vfp-3.s new file mode 100644 index 0000000000..4d603239a7 --- /dev/null +++ b/ld/testsuite/ld-arm/attr-merge-vfp-3.s @@ -0,0 +1,2 @@ +.fpu vfpv3 + diff --git a/ld/testsuite/ld-arm/attr-merge-vfp-3r.d b/ld/testsuite/ld-arm/attr-merge-vfp-3r.d new file mode 100644 index 0000000000..fa110e627d --- /dev/null +++ b/ld/testsuite/ld-arm/attr-merge-vfp-3r.d @@ -0,0 +1,14 @@ +#source: attr-merge-vfp-4-d16.s +#source: attr-merge-vfp-3-d16.s +#as: +#ld: -r +#readelf: -A +# This test is only valid on ELF based ports. +# not-target: *-*-*coff *-*-pe *-*-wince *-*-*aout* *-*-netbsd *-*-riscix* + +Attribute Section: aeabi +File Attributes + Tag_ARM_ISA_use: Yes + Tag_THUMB_ISA_use: Thumb-1 + Tag_VFP_arch: VFPv4-D16 + Tag_VFP_HP_extension: Allowed diff --git a/ld/testsuite/ld-arm/attr-merge-vfp-4-d16.s b/ld/testsuite/ld-arm/attr-merge-vfp-4-d16.s new file mode 100644 index 0000000000..8d8aeddae4 --- /dev/null +++ b/ld/testsuite/ld-arm/attr-merge-vfp-4-d16.s @@ -0,0 +1,2 @@ +.fpu vfpv4-d16 + diff --git a/ld/testsuite/ld-arm/attr-merge-vfp-4.d b/ld/testsuite/ld-arm/attr-merge-vfp-4.d new file mode 100644 index 0000000000..c027883483 --- /dev/null +++ b/ld/testsuite/ld-arm/attr-merge-vfp-4.d @@ -0,0 +1,14 @@ +#source: attr-merge-vfp-3.s +#source: attr-merge-vfp-4-d16.s +#as: +#ld: -r +#readelf: -A +# This test is only valid on ELF based ports. +# not-target: *-*-*coff *-*-pe *-*-wince *-*-*aout* *-*-netbsd *-*-riscix* + +Attribute Section: aeabi +File Attributes + Tag_ARM_ISA_use: Yes + Tag_THUMB_ISA_use: Thumb-1 + Tag_VFP_arch: VFPv4 + Tag_VFP_HP_extension: Allowed diff --git a/ld/testsuite/ld-arm/attr-merge-vfp-4.s b/ld/testsuite/ld-arm/attr-merge-vfp-4.s new file mode 100644 index 0000000000..190cdc079e --- /dev/null +++ b/ld/testsuite/ld-arm/attr-merge-vfp-4.s @@ -0,0 +1,2 @@ +.fpu vfpv4 + diff --git a/ld/testsuite/ld-arm/attr-merge-vfp-4r.d b/ld/testsuite/ld-arm/attr-merge-vfp-4r.d new file mode 100644 index 0000000000..4247e7ee41 --- /dev/null +++ b/ld/testsuite/ld-arm/attr-merge-vfp-4r.d @@ -0,0 +1,14 @@ +#source: attr-merge-vfp-4-d16.s +#source: attr-merge-vfp-3.s +#as: +#ld: -r +#readelf: -A +# This test is only valid on ELF based ports. +# not-target: *-*-*coff *-*-pe *-*-wince *-*-*aout* *-*-netbsd *-*-riscix* + +Attribute Section: aeabi +File Attributes + Tag_ARM_ISA_use: Yes + Tag_THUMB_ISA_use: Thumb-1 + Tag_VFP_arch: VFPv4 + Tag_VFP_HP_extension: Allowed diff --git a/ld/testsuite/ld-arm/attr-merge-vfp-5.d b/ld/testsuite/ld-arm/attr-merge-vfp-5.d new file mode 100644 index 0000000000..a1c86318a6 --- /dev/null +++ b/ld/testsuite/ld-arm/attr-merge-vfp-5.d @@ -0,0 +1,14 @@ +#source: attr-merge-vfp-4.s +#source: attr-merge-vfp-4-d16.s +#as: +#ld: -r +#readelf: -A +# This test is only valid on ELF based ports. +# not-target: *-*-*coff *-*-pe *-*-wince *-*-*aout* *-*-netbsd *-*-riscix* + +Attribute Section: aeabi +File Attributes + Tag_ARM_ISA_use: Yes + Tag_THUMB_ISA_use: Thumb-1 + Tag_VFP_arch: VFPv4 + Tag_VFP_HP_extension: Allowed diff --git a/ld/testsuite/ld-arm/attr-merge-vfp-5r.d b/ld/testsuite/ld-arm/attr-merge-vfp-5r.d new file mode 100644 index 0000000000..6de0da67ed --- /dev/null +++ b/ld/testsuite/ld-arm/attr-merge-vfp-5r.d @@ -0,0 +1,14 @@ +#source: attr-merge-vfp-4-d16.s +#source: attr-merge-vfp-4.s +#as: +#ld: -r +#readelf: -A +# This test is only valid on ELF based ports. +# not-target: *-*-*coff *-*-pe *-*-wince *-*-*aout* *-*-netbsd *-*-riscix* + +Attribute Section: aeabi +File Attributes + Tag_ARM_ISA_use: Yes + Tag_THUMB_ISA_use: Thumb-1 + Tag_VFP_arch: VFPv4 + Tag_VFP_HP_extension: Allowed diff --git a/opcodes/ChangeLog b/opcodes/ChangeLog index 4814ba3fea..c8f9195d91 100644 --- a/opcodes/ChangeLog +++ b/opcodes/ChangeLog @@ -1,3 +1,8 @@ +2009-11-02 Paul Brook + + * arm-dis.c (coprocessor_opcodes): Update to use new feature flags. + Add VFPv4 instructions. + 2009-10-29 Sebastian Pop * i386-dis.c (OP_VEX_FMA): Removed. diff --git a/opcodes/arm-dis.c b/opcodes/arm-dis.c index 7551249904..1616fed92d 100644 --- a/opcodes/arm-dis.c +++ b/opcodes/arm-dis.c @@ -289,8 +289,8 @@ static const struct opcode32 coprocessor_opcodes[] = {FPU_NEON_EXT_V1, 0x0e400b10, 0x0fd00f10, "vmov%c.8\t%16-19,7D[%5,6,21d], %12-15r"}, {FPU_NEON_EXT_V1, 0x0e500b10, 0x0f500f10, "vmov%c.%23?us8\t%12-15r, %16-19,7D[%5,6,21d]"}, /* Half-precision conversion instructions. */ - {FPU_NEON_FP16, 0x0eb20a40, 0x0fbf0f50, "vcvt%7?tb%c.f32.f16\t%y1, %y0"}, - {FPU_NEON_FP16, 0x0eb30a40, 0x0fbf0f50, "vcvt%7?tb%c.f16.f32\t%y1, %y0"}, + {FPU_VFP_EXT_FP16, 0x0eb20a40, 0x0fbf0f50, "vcvt%7?tb%c.f32.f16\t%y1, %y0"}, + {FPU_VFP_EXT_FP16, 0x0eb30a40, 0x0fbf0f50, "vcvt%7?tb%c.f16.f32\t%y1, %y0"}, /* Floating point coprocessor (VFP) instructions. */ {FPU_VFP_EXT_V1xD, 0x0ee00a10, 0x0fff0fff, "vmsr%c\tfpsid, %12-15r"}, @@ -330,14 +330,14 @@ static const struct opcode32 coprocessor_opcodes[] = {FPU_VFP_EXT_V1, 0x0eb80b40, 0x0fbf0f50, "vcvt%c.f64.%7?su32\t%z1, %y0"}, {FPU_VFP_EXT_V1xD, 0x0eb40a40, 0x0fbf0f50, "vcmp%7'e%c.f32\t%y1, %y0"}, {FPU_VFP_EXT_V1, 0x0eb40b40, 0x0fbf0f50, "vcmp%7'e%c.f64\t%z1, %z0"}, - {FPU_VFP_EXT_V3, 0x0eba0a40, 0x0fbe0f50, "vcvt%c.f32.%16?us%7?31%7?26\t%y1, %y1, #%5,0-3k"}, + {FPU_VFP_EXT_V3xD, 0x0eba0a40, 0x0fbe0f50, "vcvt%c.f32.%16?us%7?31%7?26\t%y1, %y1, #%5,0-3k"}, {FPU_VFP_EXT_V3, 0x0eba0b40, 0x0fbe0f50, "vcvt%c.f64.%16?us%7?31%7?26\t%z1, %z1, #%5,0-3k"}, {FPU_VFP_EXT_V1xD, 0x0ebc0a40, 0x0fbe0f50, "vcvt%7`r%c.%16?su32.f32\t%y1, %y0"}, {FPU_VFP_EXT_V1, 0x0ebc0b40, 0x0fbe0f50, "vcvt%7`r%c.%16?su32.f64\t%y1, %z0"}, - {FPU_VFP_EXT_V3, 0x0ebe0a40, 0x0fbe0f50, "vcvt%c.%16?us%7?31%7?26.f32\t%y1, %y1, #%5,0-3k"}, + {FPU_VFP_EXT_V3xD, 0x0ebe0a40, 0x0fbe0f50, "vcvt%c.%16?us%7?31%7?26.f32\t%y1, %y1, #%5,0-3k"}, {FPU_VFP_EXT_V3, 0x0ebe0b40, 0x0fbe0f50, "vcvt%c.%16?us%7?31%7?26.f64\t%z1, %z1, #%5,0-3k"}, {FPU_VFP_EXT_V1, 0x0c500b10, 0x0fb00ff0, "vmov%c\t%12-15r, %16-19r, %z0"}, - {FPU_VFP_EXT_V3, 0x0eb00a00, 0x0fb00ff0, "vmov%c.f32\t%y1, #%0-3,16-19d"}, + {FPU_VFP_EXT_V3xD, 0x0eb00a00, 0x0fb00ff0, "vmov%c.f32\t%y1, #%0-3,16-19d"}, {FPU_VFP_EXT_V3, 0x0eb00b00, 0x0fb00ff0, "vmov%c.f64\t%z1, #%0-3,16-19d"}, {FPU_VFP_EXT_V2, 0x0c400a10, 0x0ff00fd0, "vmov%c\t%y4, %12-15r, %16-19r"}, {FPU_VFP_EXT_V2, 0x0c400b10, 0x0ff00fd0, "vmov%c\t%z0, %12-15r, %16-19r"}, @@ -447,6 +447,16 @@ static const struct opcode32 coprocessor_opcodes[] = {ARM_CEXT_MAVERICK, 0x0e200600, 0x0ff00f10, "cfmadda32%c\tmvax%5-7d, mvax%12-15d, mvfx%16-19d, mvfx%0-3d"}, {ARM_CEXT_MAVERICK, 0x0e300600, 0x0ff00f10, "cfmsuba32%c\tmvax%5-7d, mvax%12-15d, mvfx%16-19d, mvfx%0-3d"}, + /* VFP Fused multiply add instructions. */ + {FPU_VFP_EXT_FMA, 0x0ea00a00, 0x0fb00f50, "vfma%c.f32\t%y1, %y2, %y0"}, + {FPU_VFP_EXT_FMA, 0x0ea00b00, 0x0fb00f50, "vfma%c.f64\t%z1, %z2, %z0"}, + {FPU_VFP_EXT_FMA, 0x0ea00a40, 0x0fb00f50, "vfms%c.f32\t%y1, %y2, %y0"}, + {FPU_VFP_EXT_FMA, 0x0ea00b40, 0x0fb00f50, "vfms%c.f64\t%z1, %z2, %z0"}, + {FPU_VFP_EXT_FMA, 0x0e900a40, 0x0fb00f50, "vfnma%c.f32\t%y1, %y2, %y0"}, + {FPU_VFP_EXT_FMA, 0x0e900b40, 0x0fb00f50, "vfnma%c.f64\t%z1, %z2, %z0"}, + {FPU_VFP_EXT_FMA, 0x0e900a00, 0x0fb00f50, "vfnms%c.f32\t%y1, %y2, %y0"}, + {FPU_VFP_EXT_FMA, 0x0e900b00, 0x0fb00f50, "vfnms%c.f64\t%z1, %z2, %z0"}, + /* Generic coprocessor instructions. */ { 0, SENTINEL_GENERIC_START, 0, "" }, {ARM_EXT_V5E, 0x0c400000, 0x0ff00000, "mcrr%c\t%8-11d, %4-7d, %12-15r, %16-19r, cr%0-3d"}, @@ -517,8 +527,12 @@ static const struct opcode32 neon_opcodes[] = {FPU_NEON_EXT_V1, 0xf3b00840, 0xffb00c50, "vtbx%c.8\t%12-15,22D, %F, %0-3,5D"}, /* Half-precision conversions. */ - {FPU_NEON_FP16, 0xf3b60600, 0xffbf0fd0, "vcvt%c.f16.f32\t%12-15,22D, %0-3,5Q"}, - {FPU_NEON_FP16, 0xf3b60700, 0xffbf0fd0, "vcvt%c.f32.f16\t%12-15,22Q, %0-3,5D"}, + {FPU_VFP_EXT_FP16, 0xf3b60600, 0xffbf0fd0, "vcvt%c.f16.f32\t%12-15,22D, %0-3,5Q"}, + {FPU_VFP_EXT_FP16, 0xf3b60700, 0xffbf0fd0, "vcvt%c.f32.f16\t%12-15,22Q, %0-3,5D"}, + + /* NEON fused multiply add instructions. */ + {FPU_NEON_EXT_FMA, 0xf2000c10, 0xffa00f10, "vfma%c.f%20U0\t%12-15,22R, %16-19,7R, %0-3,5R"}, + {FPU_NEON_EXT_FMA, 0xf2200c10, 0xffa00f10, "vfms%c.f%20U0\t%12-15,22R, %16-19,7R, %0-3,5R"}, /* Two registers, miscellaneous. */ {FPU_NEON_EXT_V1, 0xf2880a10, 0xfebf0fd0, "vmovl%c.%24?us8\t%12-15,22Q, %0-3,5D"}, -- 2.11.0