diff options
author | Paul Brook <paul@codesourcery.com> | 2009-11-02 13:44:05 +0000 |
---|---|---|
committer | Paul Brook <paul@codesourcery.com> | 2009-11-02 13:44:05 +0000 |
commit | 62f3b8c86784407e864ddf7698b9852cb76aa339 (patch) | |
tree | 6a7acbf09e26521be68c3b7f3a49fe3ccc90a339 /gas | |
parent | ec15ac506168c7b0ead70d5d52c5d3fd18c5acab (diff) | |
download | gdb-62f3b8c86784407e864ddf7698b9852cb76aa339.zip gdb-62f3b8c86784407e864ddf7698b9852cb76aa339.tar.gz gdb-62f3b8c86784407e864ddf7698b9852cb76aa339.tar.bz2 |
2009-11-02 Paul Brook <paul@codesourcery.com>
ld/testsuite/
* ld-arm/arm-elf.exp: Add new attr-merge-vfp tests.
* ld-arm/attr-merge-vfp-1.d: New test.
* ld-arm/attr-merge-vfp-1r.d: New test.
* ld-arm/attr-merge-vfp-2.d: New test.
* ld-arm/attr-merge-vfp-2r.d: New test.
* ld-arm/attr-merge-vfp-3.d: New test.
* ld-arm/attr-merge-vfp-3r.d: New test.
* ld-arm/attr-merge-vfp-4.d: New test.
* ld-arm/attr-merge-vfp-4r.d: New test.
* ld-arm/attr-merge-vfp-5.d: New test.
* ld-arm/attr-merge-vfp-5r.d: New test.
* ld-arm/attr-merge-vfp-2.s: New test.
* ld-arm/attr-merge-vfp-3.s: New test.
* ld-arm/attr-merge-vfp-3-d16.s: New test.
* ld-arm/attr-merge-vfp-4.s: New test.
* ld-arm/attr-merge-vfp-4-d16.s: New test.
gas/
* doc/c-arm.texi: Document new -mfpu options.
* config/tc-arm.c (fpu_vfp_ext_v3xd, fpu_vfp_fp16, fpu_neon_ext_fma,
fpu_vfp_ext_fma): New.
(NEON_ENC_TAB): Add vfma, vfms, vfnma and vfnms.
(do_vfp_nsyn_fma_fms, do_neon_fmac): New functions.
(insns): Move double precision load/store. Split out double
precision VFPv3 instructions. Add VFPv4 instructions.
(arm_fpus): Add VFPv3-FP16, VFPv3xD and VFPv4 variants.
(aeabi_set_public_attributes): Set VFPv4 variants.
gas/testsuite/
* gas/arm/attr-mfpu-vfpv4.d: New test.
* gas/arm/attr-mfpu-vfpv4-d16.d: New test.
* gas/arm/neon-fma-cov.d: New test.
* gas/arm/neon-fma-cov.s: New test.
* gas/arm/vfp-fma-inc.s: New test.
* gas/arm/vfp-fma-arm.d: New test.
* gas/arm/vfp-fma-arm.s: New test.
* gas/arm/vfp-fma-thumb.d: New test.
* gas/arm/vfp-fma-thumb.s: New test.
* gas/arm/vfma1.d: New test.
* gas/arm/vfma1.s: New test.
* gas/arm/vfpv3xd.d: New test.
* gas/arm/vfpv3xd.s: New test.
include/opcode/
* arm.h (FPU_VFP_EXT_V3xD, FPU_VFP_EXT_FP16, FPU_NEON_EXT_FMA,
FPU_VFP_EXT_FMA, FPU_VFP_V3xD, FPU_VFP_V4D16, FPU_VFP_V4): Define.
(FPU_ARCH_VFP_V3D16_FP16, FPU_ARCH_VFP_V3_FP16, FPU_ARCH_VFP_V3xD,
FPU_ARCH_VFP_V3xD_FP16, FPU_ARCH_VFP_V4, FPU_ARCH_VFP_V4D16,
FPU_ARCH_NEON_VFP_V4): Define.
binutils/
* readelf.c (arm_attr_tag_VFP_arch): Add VFPv4 and VFPv4-D16.
bfd/
* elf32-arm.c (elf32_arm_merge_eabi_attributes): Handle VFPv4
attributes.
opcodes/
* arm-dis.c (coprocessor_opcodes): Update to use new feature flags.
Add VFPv4 instructions.
Diffstat (limited to 'gas')
-rw-r--r-- | gas/ChangeLog | 12 | ||||
-rw-r--r-- | gas/config/tc-arm.c | 135 | ||||
-rw-r--r-- | gas/doc/c-arm.texi | 17 | ||||
-rw-r--r-- | gas/testsuite/ChangeLog | 16 | ||||
-rw-r--r-- | gas/testsuite/gas/arm/attr-mfpu-vfpv4-d16.d | 13 | ||||
-rw-r--r-- | gas/testsuite/gas/arm/attr-mfpu-vfpv4.d | 13 | ||||
-rw-r--r-- | gas/testsuite/gas/arm/neon-fma-cov.d | 13 | ||||
-rw-r--r-- | gas/testsuite/gas/arm/neon-fma-cov.s | 12 | ||||
-rw-r--r-- | gas/testsuite/gas/arm/vfma1.d | 34 | ||||
-rw-r--r-- | gas/testsuite/gas/arm/vfma1.s | 43 | ||||
-rw-r--r-- | gas/testsuite/gas/arm/vfp-fma-arm.d | 23 | ||||
-rw-r--r-- | gas/testsuite/gas/arm/vfp-fma-arm.s | 2 | ||||
-rw-r--r-- | gas/testsuite/gas/arm/vfp-fma-inc.s | 20 | ||||
-rw-r--r-- | gas/testsuite/gas/arm/vfp-fma-thumb.d | 27 | ||||
-rw-r--r-- | gas/testsuite/gas/arm/vfp-fma-thumb.s | 2 | ||||
-rw-r--r-- | gas/testsuite/gas/arm/vfpv3xd.d | 23 | ||||
-rw-r--r-- | gas/testsuite/gas/arm/vfpv3xd.s | 19 |
17 files changed, 394 insertions, 30 deletions
diff --git a/gas/ChangeLog b/gas/ChangeLog index 3eb9ce0..c562391 100644 --- a/gas/ChangeLog +++ b/gas/ChangeLog @@ -1,3 +1,15 @@ +2009-11-02 Paul Brook <paul@codesourcery.com> + + * doc/c-arm.texi: Document new -mfpu options. + * config/tc-arm.c (fpu_vfp_ext_v3xd, fpu_vfp_fp16, fpu_neon_ext_fma, + fpu_vfp_ext_fma): New. + (NEON_ENC_TAB): Add vfma, vfms, vfnma and vfnms. + (do_vfp_nsyn_fma_fms, do_neon_fmac): New functions. + (insns): Move double precision load/store. Split out double + precision VFPv3 instrucitons. Add VFPv4 instructions. + (arm_fpus): Add VFPv3-FP16, VFPv3xD and VFPv4 variants. + (aeabi_set_public_attributes): Set VFPv4 variants + 2009-11-02 Alan Modra <amodra@bigpond.net.au> * ecoff.c (ecoff_symbol_clone_hook): New function. diff --git a/gas/config/tc-arm.c b/gas/config/tc-arm.c index 52242a8..6da0462 100644 --- a/gas/config/tc-arm.c +++ b/gas/config/tc-arm.c @@ -216,13 +216,16 @@ static const arm_feature_set fpu_vfp_ext_v1xd = ARM_FEATURE (0, FPU_VFP_EXT_V1xD); static const arm_feature_set fpu_vfp_ext_v1 = ARM_FEATURE (0, FPU_VFP_EXT_V1); static const arm_feature_set fpu_vfp_ext_v2 = ARM_FEATURE (0, FPU_VFP_EXT_V2); +static const arm_feature_set fpu_vfp_ext_v3xd = ARM_FEATURE (0, FPU_VFP_EXT_V3xD); static const arm_feature_set fpu_vfp_ext_v3 = ARM_FEATURE (0, FPU_VFP_EXT_V3); static const arm_feature_set fpu_vfp_ext_d32 = ARM_FEATURE (0, FPU_VFP_EXT_D32); static const arm_feature_set fpu_neon_ext_v1 = ARM_FEATURE (0, FPU_NEON_EXT_V1); static const arm_feature_set fpu_vfp_v3_or_neon_ext = ARM_FEATURE (0, FPU_NEON_EXT_V1 | FPU_VFP_EXT_V3); -static const arm_feature_set fpu_neon_fp16 = ARM_FEATURE (0, FPU_NEON_FP16); +static const arm_feature_set fpu_vfp_fp16 = ARM_FEATURE (0, FPU_VFP_EXT_FP16); +static const arm_feature_set fpu_neon_ext_fma = ARM_FEATURE (0, FPU_NEON_EXT_FMA); +static const arm_feature_set fpu_vfp_ext_fma = ARM_FEATURE (0, FPU_VFP_EXT_FMA); static int mfloat_abi_opt = -1; /* Record user cpu selection for object attributes. 
*/ @@ -11293,6 +11296,8 @@ struct neon_tab_entry vcge / vcgt with the operands reversed. */ \ X(vclt, 0x0000300, 0x1200e00, 0x1b10200), \ X(vcle, 0x0000310, 0x1000e00, 0x1b10180), \ + X(vfma, N_INV, 0x0000c10, N_INV), \ + X(vfms, N_INV, 0x0200c10, N_INV), \ X(vmla, 0x0000900, 0x0000d10, 0x0800040), \ X(vmls, 0x1000900, 0x0200d10, 0x0800440), \ X(vmul, 0x0000910, 0x1000d10, 0x0800840), \ @@ -11330,6 +11335,8 @@ struct neon_tab_entry X(vnmul, 0xe200a40, 0xe200b40, N_INV), \ X(vnmla, 0xe100a40, 0xe100b40, N_INV), \ X(vnmls, 0xe100a00, 0xe100b00, N_INV), \ + X(vfnma, 0xe900a40, 0xe900b40, N_INV), \ + X(vfnms, 0xe900a00, 0xe900b00, N_INV), \ X(vcmp, 0xeb40a40, 0xeb40b40, N_INV), \ X(vcmpz, 0xeb50a40, 0xeb50b40, N_INV), \ X(vcmpe, 0xeb40ac0, 0xeb40bc0, N_INV), \ @@ -12149,6 +12156,27 @@ do_vfp_nsyn_mla_mls (enum neon_shape rs) } static void +do_vfp_nsyn_fma_fms (enum neon_shape rs) +{ + int is_fma = (inst.instruction & 0x0fffffff) == N_MNEM_vfma; + + if (rs == NS_FFF) + { + if (is_fma) + do_vfp_nsyn_opcode ("ffmas"); + else + do_vfp_nsyn_opcode ("ffnmas"); + } + else + { + if (is_fma) + do_vfp_nsyn_opcode ("ffmad"); + else + do_vfp_nsyn_opcode ("ffnmad"); + } +} + +static void do_vfp_nsyn_mul (enum neon_shape rs) { if (rs == NS_FFF) @@ -13116,6 +13144,18 @@ do_neon_mac_maybe_scalar (void) } static void +do_neon_fmac (void) +{ + if (try_vfp_nsyn (3, do_vfp_nsyn_fma_fms) == SUCCESS) + return; + + if (vfp_or_neon_is_neon (NEON_CHECK_CC | NEON_CHECK_ARCH) == FAIL) + return; + + neon_dyadic_misc (NT_untyped, N_IF_32, 0); +} + +static void do_neon_tst (void) { enum neon_shape rs = neon_select_shape (NS_DDD, NS_QQQ, NS_NULL); @@ -17179,6 +17219,19 @@ static const struct asm_opcode insns[] = cCE("fcmpes", eb40ac0, 2, (RVS, RVS), vfp_sp_monadic), cCE("fcmpezs", eb50ac0, 1, (RVS), vfp_sp_compare_z), + /* Double precision load/store are still present on single precision + implementations. 
*/ + cCE("fldd", d100b00, 2, (RVD, ADDRGLDC), vfp_dp_ldst), + cCE("fstd", d000b00, 2, (RVD, ADDRGLDC), vfp_dp_ldst), + cCE("fldmiad", c900b00, 2, (RRw, VRDLST), vfp_dp_ldstmia), + cCE("fldmfdd", c900b00, 2, (RRw, VRDLST), vfp_dp_ldstmia), + cCE("fldmdbd", d300b00, 2, (RRw, VRDLST), vfp_dp_ldstmdb), + cCE("fldmead", d300b00, 2, (RRw, VRDLST), vfp_dp_ldstmdb), + cCE("fstmiad", c800b00, 2, (RRw, VRDLST), vfp_dp_ldstmia), + cCE("fstmead", c800b00, 2, (RRw, VRDLST), vfp_dp_ldstmia), + cCE("fstmdbd", d200b00, 2, (RRw, VRDLST), vfp_dp_ldstmdb), + cCE("fstmfdd", d200b00, 2, (RRw, VRDLST), vfp_dp_ldstmdb), + #undef ARM_VARIANT #define ARM_VARIANT & fpu_vfp_ext_v1 /* VFP V1 (Double precision). */ @@ -17197,18 +17250,6 @@ static const struct asm_opcode insns[] = cCE("ftouid", ebc0b40, 2, (RVS, RVD), vfp_sp_dp_cvt), cCE("ftouizd", ebc0bc0, 2, (RVS, RVD), vfp_sp_dp_cvt), - /* Memory operations. */ - cCE("fldd", d100b00, 2, (RVD, ADDRGLDC), vfp_dp_ldst), - cCE("fstd", d000b00, 2, (RVD, ADDRGLDC), vfp_dp_ldst), - cCE("fldmiad", c900b00, 2, (RRw, VRDLST), vfp_dp_ldstmia), - cCE("fldmfdd", c900b00, 2, (RRw, VRDLST), vfp_dp_ldstmia), - cCE("fldmdbd", d300b00, 2, (RRw, VRDLST), vfp_dp_ldstmdb), - cCE("fldmead", d300b00, 2, (RRw, VRDLST), vfp_dp_ldstmdb), - cCE("fstmiad", c800b00, 2, (RRw, VRDLST), vfp_dp_ldstmia), - cCE("fstmead", c800b00, 2, (RRw, VRDLST), vfp_dp_ldstmia), - cCE("fstmdbd", d200b00, 2, (RRw, VRDLST), vfp_dp_ldstmdb), - cCE("fstmfdd", d200b00, 2, (RRw, VRDLST), vfp_dp_ldstmdb), - /* Monadic operations. 
*/ cCE("fabsd", eb00bc0, 2, (RVD, RVD), vfp_dp_rd_rm), cCE("fnegd", eb10b40, 2, (RVD, RVD), vfp_dp_rd_rm), @@ -17535,29 +17576,52 @@ static const struct asm_opcode insns[] = nUF(vst4, _vst4, 2, (NSTRLST, ADDR), neon_ldx_stx), #undef THUMB_VARIANT +#define THUMB_VARIANT &fpu_vfp_ext_v3xd +#undef ARM_VARIANT +#define ARM_VARIANT &fpu_vfp_ext_v3xd + cCE("fconsts", eb00a00, 2, (RVS, I255), vfp_sp_const), + cCE("fshtos", eba0a40, 2, (RVS, I16z), vfp_sp_conv_16), + cCE("fsltos", eba0ac0, 2, (RVS, I32), vfp_sp_conv_32), + cCE("fuhtos", ebb0a40, 2, (RVS, I16z), vfp_sp_conv_16), + cCE("fultos", ebb0ac0, 2, (RVS, I32), vfp_sp_conv_32), + cCE("ftoshs", ebe0a40, 2, (RVS, I16z), vfp_sp_conv_16), + cCE("ftosls", ebe0ac0, 2, (RVS, I32), vfp_sp_conv_32), + cCE("ftouhs", ebf0a40, 2, (RVS, I16z), vfp_sp_conv_16), + cCE("ftouls", ebf0ac0, 2, (RVS, I32), vfp_sp_conv_32), + +#undef THUMB_VARIANT #define THUMB_VARIANT & fpu_vfp_ext_v3 #undef ARM_VARIANT #define ARM_VARIANT & fpu_vfp_ext_v3 - cCE("fconsts", eb00a00, 2, (RVS, I255), vfp_sp_const), cCE("fconstd", eb00b00, 2, (RVD, I255), vfp_dp_const), - cCE("fshtos", eba0a40, 2, (RVS, I16z), vfp_sp_conv_16), cCE("fshtod", eba0b40, 2, (RVD, I16z), vfp_dp_conv_16), - cCE("fsltos", eba0ac0, 2, (RVS, I32), vfp_sp_conv_32), cCE("fsltod", eba0bc0, 2, (RVD, I32), vfp_dp_conv_32), - cCE("fuhtos", ebb0a40, 2, (RVS, I16z), vfp_sp_conv_16), cCE("fuhtod", ebb0b40, 2, (RVD, I16z), vfp_dp_conv_16), - cCE("fultos", ebb0ac0, 2, (RVS, I32), vfp_sp_conv_32), cCE("fultod", ebb0bc0, 2, (RVD, I32), vfp_dp_conv_32), - cCE("ftoshs", ebe0a40, 2, (RVS, I16z), vfp_sp_conv_16), cCE("ftoshd", ebe0b40, 2, (RVD, I16z), vfp_dp_conv_16), - cCE("ftosls", ebe0ac0, 2, (RVS, I32), vfp_sp_conv_32), cCE("ftosld", ebe0bc0, 2, (RVD, I32), vfp_dp_conv_32), - cCE("ftouhs", ebf0a40, 2, (RVS, I16z), vfp_sp_conv_16), cCE("ftouhd", ebf0b40, 2, (RVD, I16z), vfp_dp_conv_16), - cCE("ftouls", ebf0ac0, 2, (RVS, I32), vfp_sp_conv_32), cCE("ftould", ebf0bc0, 2, (RVD, I32), vfp_dp_conv_32), 
+#undef ARM_VARIANT +#define ARM_VARIANT &fpu_vfp_ext_fma +#undef THUMB_VARIANT +#define THUMB_VARIANT &fpu_vfp_ext_fma + /* Mnemonics shared by Neon and VFP. These are included in the + VFP FMA variant; NEON and VFP FMA always include the NEON + FMA instructions. */ + nCEF(vfma, _vfma, 3, (RNSDQ, oRNSDQ, RNSDQ), neon_fmac), + nCEF(vfms, _vfms, 3, (RNSDQ, oRNSDQ, RNSDQ), neon_fmac), + /* ffmas/ffnmas/ffmad/ffnmad are dummy mnemonics to satisfy gas; + the v form should always be used. */ + cCE("ffmas", ea00a00, 3, (RVS, RVS, RVS), vfp_sp_dyadic), + cCE("ffnmas", ea00a40, 3, (RVS, RVS, RVS), vfp_sp_dyadic), + cCE("ffmad", ea00b00, 3, (RVD, RVD, RVD), vfp_dp_rd_rn_rm), + cCE("ffnmad", ea00b40, 3, (RVD, RVD, RVD), vfp_dp_rd_rn_rm), + nCE(vfnma, _vfnma, 3, (RVSD, RVSD, RVSD), vfp_nsyn_nmul), + nCE(vfnms, _vfnms, 3, (RVSD, RVSD, RVSD), vfp_nsyn_nmul), + #undef THUMB_VARIANT #undef ARM_VARIANT #define ARM_VARIANT & arm_cext_xscale /* Intel XScale extensions. */ @@ -21967,7 +22031,11 @@ static const struct arm_option_cpu_value_table arm_fpus[] = {"vfpxd", FPU_ARCH_VFP_V1xD}, {"vfpv2", FPU_ARCH_VFP_V2}, {"vfpv3", FPU_ARCH_VFP_V3}, + {"vfpv3-fp16", FPU_ARCH_VFP_V3_FP16}, {"vfpv3-d16", FPU_ARCH_VFP_V3D16}, + {"vfpv3-d16-fp16", FPU_ARCH_VFP_V3D16_FP16}, + {"vfpv3xd", FPU_ARCH_VFP_V3xD}, + {"vfpv3xd-fp16", FPU_ARCH_VFP_V3xD_FP16}, {"arm1020t", FPU_ARCH_VFP_V1}, {"arm1020e", FPU_ARCH_VFP_V2}, {"arm1136jfs", FPU_ARCH_VFP_V2}, @@ -21975,6 +22043,9 @@ static const struct arm_option_cpu_value_table arm_fpus[] = {"maverick", FPU_ARCH_MAVERICK}, {"neon", FPU_ARCH_VFP_V3_PLUS_NEON_V1}, {"neon-fp16", FPU_ARCH_NEON_FP16}, + {"vfpv4", FPU_ARCH_VFP_V4}, + {"vfpv4-d16", FPU_ARCH_VFP_V4D16}, + {"neon-vfpv4", FPU_ARCH_NEON_VFP_V4}, {NULL, ARM_ARCH_NONE} }; @@ -22453,8 +22524,10 @@ aeabi_set_public_attributes (void) } aeabi_set_attribute_string (Tag_CPU_name, p); } + /* Tag_CPU_arch. */ aeabi_set_attribute_int (Tag_CPU_arch, arch); + /* Tag_CPU_arch_profile. 
*/ if (ARM_CPU_HAS_FEATURE (flags, arm_ext_v7a)) aeabi_set_attribute_int (Tag_CPU_arch_profile, 'A'); @@ -22462,17 +22535,24 @@ aeabi_set_public_attributes (void) aeabi_set_attribute_int (Tag_CPU_arch_profile, 'R'); else if (ARM_CPU_HAS_FEATURE (flags, arm_ext_m)) aeabi_set_attribute_int (Tag_CPU_arch_profile, 'M'); + /* Tag_ARM_ISA_use. */ if (ARM_CPU_HAS_FEATURE (flags, arm_ext_v1) || arch == 0) aeabi_set_attribute_int (Tag_ARM_ISA_use, 1); + /* Tag_THUMB_ISA_use. */ if (ARM_CPU_HAS_FEATURE (flags, arm_ext_v4t) || arch == 0) aeabi_set_attribute_int (Tag_THUMB_ISA_use, ARM_CPU_HAS_FEATURE (flags, arm_arch_t2) ? 2 : 1); + /* Tag_VFP_arch. */ - if (ARM_CPU_HAS_FEATURE (flags, fpu_vfp_ext_d32)) + if (ARM_CPU_HAS_FEATURE (flags, fpu_vfp_ext_fma)) + aeabi_set_attribute_int (Tag_VFP_arch, + ARM_CPU_HAS_FEATURE (flags, fpu_vfp_ext_d32) + ? 5 : 6); + else if (ARM_CPU_HAS_FEATURE (flags, fpu_vfp_ext_d32)) aeabi_set_attribute_int (Tag_VFP_arch, 3); else if (ARM_CPU_HAS_FEATURE (flags, fpu_vfp_ext_v3)) aeabi_set_attribute_int (Tag_VFP_arch, 4); @@ -22481,16 +22561,21 @@ aeabi_set_public_attributes (void) else if (ARM_CPU_HAS_FEATURE (flags, fpu_vfp_ext_v1) || ARM_CPU_HAS_FEATURE (flags, fpu_vfp_ext_v1xd)) aeabi_set_attribute_int (Tag_VFP_arch, 1); + /* Tag_WMMX_arch. */ if (ARM_CPU_HAS_FEATURE (flags, arm_cext_iwmmxt2)) aeabi_set_attribute_int (Tag_WMMX_arch, 2); else if (ARM_CPU_HAS_FEATURE (flags, arm_cext_iwmmxt)) aeabi_set_attribute_int (Tag_WMMX_arch, 1); + /* Tag_Advanced_SIMD_arch (formerly Tag_NEON_arch). */ if (ARM_CPU_HAS_FEATURE (flags, fpu_neon_ext_v1)) - aeabi_set_attribute_int (Tag_Advanced_SIMD_arch, 1); + aeabi_set_attribute_int + (Tag_Advanced_SIMD_arch, (ARM_CPU_HAS_FEATURE (flags, fpu_neon_ext_fma) + ? 2 : 1)); + /* Tag_VFP_HP_extension (formerly Tag_NEON_FP16_arch). 
*/ - if (ARM_CPU_HAS_FEATURE (flags, fpu_neon_fp16)) + if (ARM_CPU_HAS_FEATURE (flags, fpu_vfp_fp16)) aeabi_set_attribute_int (Tag_VFP_HP_extension, 1); } diff --git a/gas/doc/c-arm.texi b/gas/doc/c-arm.texi index 2f4bf85..eb58a56 100644 --- a/gas/doc/c-arm.texi +++ b/gas/doc/c-arm.texi @@ -200,15 +200,22 @@ The following format options are recognized: @code{vfp10-r0}, @code{vfp9}, @code{vfpxd}, -@code{vfpv2} -@code{vfpv3} -@code{vfpv3-d16} +@code{vfpv2}, +@code{vfpv3}, +@code{vfpv3-fp16}, +@code{vfpv3-d16}, +@code{vfpv3-d16-fp16}, +@code{vfpv3xd}, +@code{vfpv3xd-fp16}, +@code{vfpv4}, +@code{vfpv4-d16}, @code{arm1020t}, @code{arm1020e}, @code{arm1136jf-s}, -@code{maverick} +@code{maverick}, +@code{neon}, and -@code{neon}. +@code{neon-vfpv4}. In addition to determining which instructions are assembled, this option also affects the way in which the @code{.double} assembler directive behaves diff --git a/gas/testsuite/ChangeLog b/gas/testsuite/ChangeLog index 370438f..d15afcb 100644 --- a/gas/testsuite/ChangeLog +++ b/gas/testsuite/ChangeLog @@ -1,3 +1,19 @@ +2009-11-02 Paul Brook <paul@codesourcery.com> + + * gas/arm/attr-mfpu-vfpv4.d: New test. + * gas/arm/attr-mfpu-vfpv4-d16.d: New test. + * gas/arm/neon-fma-cov.d: New test. + * gas/arm/neon-fma-cov.s: New test. + * gas/arm/vfp-fma-inc.s: New test. + * gas/arm/vfp-fma-arm.d: New test. + * gas/arm/vfp-fma-arm.s: New test. + * gas/arm/vfp-fma-thumb.d: New test. + * gas/arm/vfp-fma-thumb.s: New test. + * gas/arm/vfma1.d: New test. + * gas/arm/vfma1.s: New test. + * gas/arm/vfpv3xd.d: New test. + * gas/arm/vfpv3xd.s: New test. + 2009-10-29 Sebastian Pop <sebastian.pop@amd.com> * gas/i386/fma4.d: Updated patterns. 
diff --git a/gas/testsuite/gas/arm/attr-mfpu-vfpv4-d16.d b/gas/testsuite/gas/arm/attr-mfpu-vfpv4-d16.d new file mode 100644 index 0000000..6b3574d --- /dev/null +++ b/gas/testsuite/gas/arm/attr-mfpu-vfpv4-d16.d @@ -0,0 +1,13 @@ +# name: attributes for -mfpu=vfpv4-d16 +# source: blank.s +# as: -mfpu=vfpv4-d16 +# readelf: -A +# This test is only valid on EABI based ports. +# target: *-*-*eabi + +Attribute Section: aeabi +File Attributes + Tag_ARM_ISA_use: Yes + Tag_THUMB_ISA_use: Thumb-1 + Tag_VFP_arch: VFPv4-D16 + Tag_VFP_HP_extension: Allowed diff --git a/gas/testsuite/gas/arm/attr-mfpu-vfpv4.d b/gas/testsuite/gas/arm/attr-mfpu-vfpv4.d new file mode 100644 index 0000000..a3b91a5 --- /dev/null +++ b/gas/testsuite/gas/arm/attr-mfpu-vfpv4.d @@ -0,0 +1,13 @@ +# name: attributes for -mfpu=vfpv4 +# source: blank.s +# as: -mfpu=vfpv4 +# readelf: -A +# This test is only valid on EABI based ports. +# target: *-*-*eabi + +Attribute Section: aeabi +File Attributes + Tag_ARM_ISA_use: Yes + Tag_THUMB_ISA_use: Thumb-1 + Tag_VFP_arch: VFPv4 + Tag_VFP_HP_extension: Allowed diff --git a/gas/testsuite/gas/arm/neon-fma-cov.d b/gas/testsuite/gas/arm/neon-fma-cov.d new file mode 100644 index 0000000..1c51d7b --- /dev/null +++ b/gas/testsuite/gas/arm/neon-fma-cov.d @@ -0,0 +1,13 @@ +# name: Neon FMA instruction coverage +# as: -mfpu=neon-vfpv4 +# objdump: -dr --prefix-addresses --show-raw-insn + +.*: +file format .*arm.* + +Disassembly of section \.text: +0[0-9a-f]+ <[^>]+> f2000c50 vfma\.f32 q0, q0, q0 +0[0-9a-f]+ <[^>]+> f2000c50 vfma\.f32 q0, q0, q0 +0[0-9a-f]+ <[^>]+> f2000c10 vfma\.f32 d0, d0, d0 +0[0-9a-f]+ <[^>]+> f2200c50 vfms\.f32 q0, q0, q0 +0[0-9a-f]+ <[^>]+> f2200c50 vfms\.f32 q0, q0, q0 +0[0-9a-f]+ <[^>]+> f2200c10 vfms\.f32 d0, d0, d0 diff --git a/gas/testsuite/gas/arm/neon-fma-cov.s b/gas/testsuite/gas/arm/neon-fma-cov.s new file mode 100644 index 0000000..db34807 --- /dev/null +++ b/gas/testsuite/gas/arm/neon-fma-cov.s @@ -0,0 +1,12 @@ + .arm + .syntax unified + .text + 
+ .macro regs3_1 op opq vtype + \op\vtype q0,q0,q0 + \opq\vtype q0,q0,q0 + \op\vtype d0,d0,d0 + .endm + + regs3_1 vfma vfma .f32 + regs3_1 vfms vfms .f32 diff --git a/gas/testsuite/gas/arm/vfma1.d b/gas/testsuite/gas/arm/vfma1.d new file mode 100644 index 0000000..4c638d3 --- /dev/null +++ b/gas/testsuite/gas/arm/vfma1.d @@ -0,0 +1,34 @@ +#objdump: -dr --prefix-addresses --show-raw-insn +#name: VFMA decoding +#as: -mcpu=arm7m + +# Test VFMA instruction disassembly + +.*: *file format .*arm.* + + +Disassembly of section .text: +00000000 <[^>]*> ee000a00 vmla.f32 s0, s0, s0 +00000004 <[^>]*> ee000b00 vmla.f64 d0, d0, d0 +00000008 <[^>]*> f2000d10 vmla.f32 d0, d0, d0 +0000000c <[^>]*> f2000d50 vmla.f32 q0, q0, q0 +00000010 <[^>]*> eea00a00 vfma.f32 s0, s0, s0 +00000014 <[^>]*> eea00b00 vfma.f64 d0, d0, d0 +00000018 <[^>]*> f2000c10 vfma.f32 d0, d0, d0 +0000001c <[^>]*> f2000c50 vfma.f32 q0, q0, q0 +00000020 <[^>]*> ee000a40 vmls.f32 s0, s0, s0 +00000024 <[^>]*> ee000b40 vmls.f64 d0, d0, d0 +00000028 <[^>]*> f2200d10 vmls.f32 d0, d0, d0 +0000002c <[^>]*> f2200d50 vmls.f32 q0, q0, q0 +00000030 <[^>]*> eea00a40 vfms.f32 s0, s0, s0 +00000034 <[^>]*> eea00b40 vfms.f64 d0, d0, d0 +00000038 <[^>]*> f2200c10 vfms.f32 d0, d0, d0 +0000003c <[^>]*> f2200c50 vfms.f32 q0, q0, q0 +00000040 <[^>]*> ee100a40 vnmla.f32 s0, s0, s0 +00000044 <[^>]*> ee100b40 vnmla.f64 d0, d0, d0 +00000048 <[^>]*> ee900a40 vfnma.f32 s0, s0, s0 +0000004c <[^>]*> ee900b40 vfnma.f64 d0, d0, d0 +00000050 <[^>]*> ee100a00 vnmls.f32 s0, s0, s0 +00000054 <[^>]*> ee100b00 vnmls.f64 d0, d0, d0 +00000058 <[^>]*> ee900a00 vfnms.f32 s0, s0, s0 +0000005c <[^>]*> ee900b00 vfnms.f64 d0, d0, d0 diff --git a/gas/testsuite/gas/arm/vfma1.s b/gas/testsuite/gas/arm/vfma1.s new file mode 100644 index 0000000..bc124f8 --- /dev/null +++ b/gas/testsuite/gas/arm/vfma1.s @@ -0,0 +1,43 @@ + + .eabi_attribute Tag_Advanced_SIMD_arch, 2 + .eabi_attribute Tag_VFP_arch, 6 + + @VMLA + .inst 0xee000a00 @ VFP vmla.f32 s0,s0,s0 + .inst 
0xee000b00 @ VFP vmla.f64 d0,d0,d0 + .inst 0xf2000d10 @ NEON vmla.f32 d0,d0,d0 + .inst 0xf2000d50 @ NEON vmla.f32 q0,q0,q0 + + @VFMA new + .inst 0xeea00a00 @ VFP vfma.f32 s0,s0,s0 + .inst 0xeea00b00 @ VFP vfma.f64 d0,d0,d0 + .inst 0xf2000c10 @ NEON vfma.f32 d0,d0,d0 + .inst 0xf2000c50 @ NEON vfma.f32 q0,q0,q0 + + @VMLS + .inst 0xee000a40 @ VFP vmls.F32 s0,s0,s0 + .inst 0xee000b40 @ VFP vmls.F64 d0,d0,d0 + .inst 0xf2200d10 @ NEON vmls.F32 d0,d0,d0 + .inst 0xf2200d50 @ NEON vmls.F32 q0,q0,q0 + + @VFMS new + .inst 0xeea00a40 @ VFP vfms.F32 s0,s0,s0 + .inst 0xeea00b40 @ VFP vfms.F64 d0,d0,d0 + .inst 0xf2200c10 @ NEON vfms.F32 d0,d0,d0 + .inst 0xf2200c50 @ NEON vfms.F32 q0,q0,q0 + + @VNMLA + .inst 0xee100a40 @ VFP vnmla.F32 s0,s0,s0 + .inst 0xee100b40 @ VFP vnmla.F64 d0,d0,d0 + + @VFNMA new + .inst 0xee900a40 @ VFP vfnma.F32 s0,s0,s0 + .inst 0xee900b40 @ VFP vfnma.F64 d0,d0,d0 + + @VNMLS + .inst 0xee100a00 @ VFP vnmls.F32 s0,s0,s0 + .inst 0xee100b00 @ VFP vnmls.F64 d0,d0,d0 + + @VFNMS new + .inst 0xee900a00 @ VFP vfnms.F32 s0,s0,s0 + .inst 0xee900b00 @ VFP vfnms.F64 d0,d0,d0 diff --git a/gas/testsuite/gas/arm/vfp-fma-arm.d b/gas/testsuite/gas/arm/vfp-fma-arm.d new file mode 100644 index 0000000..6a4f717 --- /dev/null +++ b/gas/testsuite/gas/arm/vfp-fma-arm.d @@ -0,0 +1,23 @@ +# name: FMA instructions, ARM mode +# as: -mfpu=vfpv4 -I$srcdir/$subdir +# objdump: -dr --prefix-addresses --show-raw-insn + +.*: +file format .*arm.* + +Disassembly of section .text: +0[0-9a-f]+ <[^>]+> eea00a81 vfma\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> eea10b02 vfma\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> 0ea00a81 vfmaeq\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> 0ea10b02 vfmaeq\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> eea00ac1 vfms\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> eea10b42 vfms\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> 0ea00ac1 vfmseq\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> 0ea10b42 vfmseq\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> ee900ac1 vfnma\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> ee910b42 vfnma\.f64 d0, d1, d2 +0[0-9a-f]+ 
<[^>]+> 0e900ac1 vfnmaeq\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> 0e910b42 vfnmaeq\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> ee900a81 vfnms\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> ee910b02 vfnms\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> 0e900a81 vfnmseq\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> 0e910b02 vfnmseq\.f64 d0, d1, d2 diff --git a/gas/testsuite/gas/arm/vfp-fma-arm.s b/gas/testsuite/gas/arm/vfp-fma-arm.s new file mode 100644 index 0000000..945926b --- /dev/null +++ b/gas/testsuite/gas/arm/vfp-fma-arm.s @@ -0,0 +1,2 @@ + .arm + .include "vfp-fma-inc.s" diff --git a/gas/testsuite/gas/arm/vfp-fma-inc.s b/gas/testsuite/gas/arm/vfp-fma-inc.s new file mode 100644 index 0000000..a9dcb14 --- /dev/null +++ b/gas/testsuite/gas/arm/vfp-fma-inc.s @@ -0,0 +1,20 @@ + .syntax unified + + .include "itblock.s" + +func: + .macro dyadic op cond="" f32=".f32" f64=".f64" + itblock 2 \cond + \op\cond\f32 s0,s1,s2 + \op\cond\f64 d0,d1,d2 + .endm + + .macro dyadic_c op + dyadic \op + dyadic \op eq + .endm + + dyadic_c vfma + dyadic_c vfms + dyadic_c vfnma + dyadic_c vfnms diff --git a/gas/testsuite/gas/arm/vfp-fma-thumb.d b/gas/testsuite/gas/arm/vfp-fma-thumb.d new file mode 100644 index 0000000..2ee77fd --- /dev/null +++ b/gas/testsuite/gas/arm/vfp-fma-thumb.d @@ -0,0 +1,27 @@ +# name: FMA instructions, Thumb mode +# as: -mfpu=vfpv4 -I$srcdir/$subdir +# objdump: -dr --prefix-addresses --show-raw-insn + +.*: +file format .*arm.* + +Disassembly of section .text: +0[0-9a-f]+ <[^>]+> eea0 0a81 vfma\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> eea1 0b02 vfma\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> bf04 itt eq +0[0-9a-f]+ <[^>]+> eea0 0a81 vfmaeq\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> eea1 0b02 vfmaeq\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> eea0 0ac1 vfms\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> eea1 0b42 vfms\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> bf04 itt eq +0[0-9a-f]+ <[^>]+> eea0 0ac1 vfmseq\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> eea1 0b42 vfmseq\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> ee90 0ac1 vfnma\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> ee91 
0b42 vfnma\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> bf04 itt eq +0[0-9a-f]+ <[^>]+> ee90 0ac1 vfnmaeq\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> ee91 0b42 vfnmaeq\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> ee90 0a81 vfnms\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> ee91 0b02 vfnms\.f64 d0, d1, d2 +0[0-9a-f]+ <[^>]+> bf04 itt eq +0[0-9a-f]+ <[^>]+> ee90 0a81 vfnmseq\.f32 s0, s1, s2 +0[0-9a-f]+ <[^>]+> ee91 0b02 vfnmseq\.f64 d0, d1, d2 diff --git a/gas/testsuite/gas/arm/vfp-fma-thumb.s b/gas/testsuite/gas/arm/vfp-fma-thumb.s new file mode 100644 index 0000000..fa3b792 --- /dev/null +++ b/gas/testsuite/gas/arm/vfp-fma-thumb.s @@ -0,0 +1,2 @@ + .thumb + .include "vfp-fma-inc.s" diff --git a/gas/testsuite/gas/arm/vfpv3xd.d b/gas/testsuite/gas/arm/vfpv3xd.d new file mode 100644 index 0000000..508f70f --- /dev/null +++ b/gas/testsuite/gas/arm/vfpv3xd.d @@ -0,0 +1,23 @@ +#objdump: -dr --prefix-addresses --show-raw-insn +#name: VFP Double-precision load/store +#as: -mfpu=vfpv3xd + +# Test the ARM VFP Double Precision load/store on single precision FPU + +.*: +file format .*arm.* + +Disassembly of section .text: +0+[0-9a-f]* <[^>]*> ed900b00 vldr d0, \[r0\] +0+[0-9a-f]* <[^>]*> ed800b00 vstr d0, \[r0\] +0+[0-9a-f]* <[^>]*> ec900b02 vldmia r0, {d0} +0+[0-9a-f]* <[^>]*> ec900b02 vldmia r0, {d0} +0+[0-9a-f]* <[^>]*> ecb00b02 vldmia r0!, {d0} +0+[0-9a-f]* <[^>]*> ecb00b02 vldmia r0!, {d0} +0+[0-9a-f]* <[^>]*> ed300b02 vldmdb r0!, {d0} +0+[0-9a-f]* <[^>]*> ed300b02 vldmdb r0!, {d0} +0+[0-9a-f]* <[^>]*> ec800b02 vstmia r0, {d0} +0+[0-9a-f]* <[^>]*> ec800b02 vstmia r0, {d0} +0+[0-9a-f]* <[^>]*> eca00b02 vstmia r0!, {d0} +0+[0-9a-f]* <[^>]*> eca00b02 vstmia r0!, {d0} +0+[0-9a-f]* <[^>]*> ed200b02 vstmdb r0!, {d0} +0+[0-9a-f]* <[^>]*> ed200b02 vstmdb r0!, {d0} diff --git a/gas/testsuite/gas/arm/vfpv3xd.s b/gas/testsuite/gas/arm/vfpv3xd.s new file mode 100644 index 0000000..a16b969 --- /dev/null +++ b/gas/testsuite/gas/arm/vfpv3xd.s @@ -0,0 +1,19 @@ +# Check double precision load/store are allowed on single 
precision +# implementation + + fldd d0, [r0] + fstd d0, [r0] + + fldmiad r0, {d0} + fldmfdd r0, {d0} + fldmiad r0!, {d0} + fldmfdd r0!, {d0} + fldmdbd r0!, {d0} + fldmead r0!, {d0} + + fstmiad r0, {d0} + fstmead r0, {d0} + fstmiad r0!, {d0} + fstmead r0!, {d0} + fstmdbd r0!, {d0} + fstmfdd r0!, {d0} |