diff options
author | Thomas Koenig <tkoenig@gcc.gnu.org> | 2017-06-24 07:07:56 +0000 |
---|---|---|
committer | Thomas Koenig <tkoenig@gcc.gnu.org> | 2017-06-24 07:07:56 +0000 |
commit | e56e3fda6092548f3cd5336d131b412be986b1e6 (patch) | |
tree | 2c28733ee096cbdb641e42b511b18f7c28205330 /libgfortran/Makefile.am | |
parent | ef5b7d19b688bb92178f41f504133f0ee51bffc6 (diff) | |
download | gcc-e56e3fda6092548f3cd5336d131b412be986b1e6.zip gcc-e56e3fda6092548f3cd5336d131b412be986b1e6.tar.gz gcc-e56e3fda6092548f3cd5336d131b412be986b1e6.tar.bz2 |
re PR fortran/52473 (CSHIFT slow - inline it?)
2017-06-24 Thomas Koenig <tkoenig@gcc.gnu.org>
PR fortran/52473
* Makefile.am: Add i_cshift1a_c. Add rules to generate files
from cshift1a.m4.
* Makefile.in: Regenerated.
* m4/cshift1a.m4: New file.
* m4/cshift.m4 (cshift1): Split up inner loop by removing
condition. Use memcpy where possible. Call helper functions
based on dtype.
* libgfortran.h: Add prototypes for cshift1_16_c10,
cshift1_16_c16, cshift1_16_c4, cshift1_16_c8, cshift1_16_i1,
cshift1_16_i16, cshift1_16_i2, cshift1_16_i4, cshift1_16_i8,
cshift1_16_r10, cshift1_16_r16, cshift1_16_r4, cshift1_16_r8,
cshift1_4_c10, cshift1_4_c16, cshift1_4_c4, cshift1_4_c8,
cshift1_4_i1, cshift1_4_i16, cshift1_4_i2, cshift1_4_i4,
cshift1_4_i8, cshift1_4_r10, cshift1_4_r16, cshift1_4_r4,
cshift1_4_r8, cshift1_8_c10, cshift1_8_c16, cshift1_8_c4,
cshift1_8_c8, cshift1_8_i1, cshift1_8_i16, cshift1_8_i2,
cshift1_8_i4, cshift1_8_i8, cshift1_8_r10, cshift1_8_r16,
cshift1_8_r4 and cshift1_8_r8.
* generated/cshift1_16_c10.c: New file, generated from cshift1a.m4.
* generated/cshift1_16_c16.c: New file, generated from cshift1a.m4.
* generated/cshift1_16_c4.c: New file, generated from cshift1a.m4.
* generated/cshift1_16_c8.c: New file, generated from cshift1a.m4.
* generated/cshift1_16_i1.c: New file, generated from cshift1a.m4.
* generated/cshift1_16_i16.c: New file, generated from cshift1a.m4.
* generated/cshift1_16_i2.c: New file, generated from cshift1a.m4.
* generated/cshift1_16_i4.c: New file, generated from cshift1a.m4.
* generated/cshift1_16_i8.c: New file, generated from cshift1a.m4.
* generated/cshift1_16_r10.c: New file, generated from cshift1a.m4.
* generated/cshift1_16_r16.c: New file, generated from cshift1a.m4.
* generated/cshift1_16_r4.c: New file, generated from cshift1a.m4.
* generated/cshift1_16_r8.c: New file, generated from cshift1a.m4.
* generated/cshift1_4_c10.c: New file, generated from cshift1a.m4.
* generated/cshift1_4_c16.c: New file, generated from cshift1a.m4.
* generated/cshift1_4_c4.c: New file, generated from cshift1a.m4.
* generated/cshift1_4_c8.c: New file, generated from cshift1a.m4.
* generated/cshift1_4_i1.c: New file, generated from cshift1a.m4.
* generated/cshift1_4_i16.c: New file, generated from cshift1a.m4.
* generated/cshift1_4_i2.c: New file, generated from cshift1a.m4.
* generated/cshift1_4_i4.c: New file, generated from cshift1a.m4.
* generated/cshift1_4_i8.c: New file, generated from cshift1a.m4.
* generated/cshift1_4_r10.c: New file, generated from cshift1a.m4.
* generated/cshift1_4_r16.c: New file, generated from cshift1a.m4.
* generated/cshift1_4_r4.c: New file, generated from cshift1a.m4.
* generated/cshift1_4_r8.c: New file, generated from cshift1a.m4.
* generated/cshift1_8_c10.c: New file, generated from cshift1a.m4.
* generated/cshift1_8_c16.c: New file, generated from cshift1a.m4.
* generated/cshift1_8_c4.c: New file, generated from cshift1a.m4.
* generated/cshift1_8_c8.c: New file, generated from cshift1a.m4.
* generated/cshift1_8_i1.c: New file, generated from cshift1a.m4.
* generated/cshift1_8_i16.c: New file, generated from cshift1a.m4.
* generated/cshift1_8_i2.c: New file, generated from cshift1a.m4.
* generated/cshift1_8_i4.c: New file, generated from cshift1a.m4.
* generated/cshift1_8_i8.c: New file, generated from cshift1a.m4.
* generated/cshift1_8_r10.c: New file, generated from cshift1a.m4.
* generated/cshift1_8_r16.c: New file, generated from cshift1a.m4.
* generated/cshift1_8_r4.c: New file, generated from cshift1a.m4.
* generated/cshift1_8_r8.c: New file, generated from cshift1a.m4.
2017-06-24 Thomas Koenig <tkoenig@gcc.gnu.org>
PR fortran/52473
* gfortran.dg/cshift_2.f90: New test.
From-SVN: r249620
Diffstat (limited to 'libgfortran/Makefile.am')
-rw-r--r-- | libgfortran/Makefile.am | 48 |
1 files changed, 46 insertions, 2 deletions
diff --git a/libgfortran/Makefile.am b/libgfortran/Makefile.am index 9088812..c5982a7 100644 --- a/libgfortran/Makefile.am +++ b/libgfortran/Makefile.am @@ -524,13 +524,53 @@ $(srcdir)/generated/cshift0_c4.c \ $(srcdir)/generated/cshift0_c8.c \ $(srcdir)/generated/cshift0_c10.c \ $(srcdir)/generated/cshift0_c16.c - i_cshift1_c= \ $(srcdir)/generated/cshift1_4.c \ $(srcdir)/generated/cshift1_8.c \ $(srcdir)/generated/cshift1_16.c +i_cshift1a_c = \ +$(srcdir)/generated/cshift1_4_i1.c \ +$(srcdir)/generated/cshift1_4_i2.c \ +$(srcdir)/generated/cshift1_4_i4.c \ +$(srcdir)/generated/cshift1_4_i8.c \ +$(srcdir)/generated/cshift1_4_i16.c \ +$(srcdir)/generated/cshift1_4_r4.c \ +$(srcdir)/generated/cshift1_4_r8.c \ +$(srcdir)/generated/cshift1_4_r10.c \ +$(srcdir)/generated/cshift1_4_r16.c \ +$(srcdir)/generated/cshift1_4_c4.c \ +$(srcdir)/generated/cshift1_4_c8.c \ +$(srcdir)/generated/cshift1_4_c10.c \ +$(srcdir)/generated/cshift1_4_c16.c \ +$(srcdir)/generated/cshift1_8_i1.c \ +$(srcdir)/generated/cshift1_8_i2.c \ +$(srcdir)/generated/cshift1_8_i4.c \ +$(srcdir)/generated/cshift1_8_i8.c \ +$(srcdir)/generated/cshift1_8_i16.c \ +$(srcdir)/generated/cshift1_8_r4.c \ +$(srcdir)/generated/cshift1_8_r8.c \ +$(srcdir)/generated/cshift1_8_r10.c \ +$(srcdir)/generated/cshift1_8_r16.c \ +$(srcdir)/generated/cshift1_8_c4.c \ +$(srcdir)/generated/cshift1_8_c8.c \ +$(srcdir)/generated/cshift1_8_c10.c \ +$(srcdir)/generated/cshift1_8_c16.c \ +$(srcdir)/generated/cshift1_16_i1.c \ +$(srcdir)/generated/cshift1_16_i2.c \ +$(srcdir)/generated/cshift1_16_i4.c \ +$(srcdir)/generated/cshift1_16_i8.c \ +$(srcdir)/generated/cshift1_16_i16.c \ +$(srcdir)/generated/cshift1_16_r4.c \ +$(srcdir)/generated/cshift1_16_r8.c \ +$(srcdir)/generated/cshift1_16_r10.c \ +$(srcdir)/generated/cshift1_16_r16.c \ +$(srcdir)/generated/cshift1_16_c4.c \ +$(srcdir)/generated/cshift1_16_c8.c \ +$(srcdir)/generated/cshift1_16_c10.c \ +$(srcdir)/generated/cshift1_16_c16.c + in_pack_c = \ $(srcdir)/generated/in_pack_i1.c \ $(srcdir)/generated/in_pack_i2.c \ @@ -658,7 +698,8 @@ gfor_built_src= $(i_all_c) $(i_any_c) $(i_count_c) $(i_maxloc0_c) \ $(i_eoshift3_c) $(i_cshift1_c) $(i_reshape_c) $(in_pack_c) $(in_unpack_c) \ $(i_pow_c) $(i_pack_c) $(i_unpack_c) $(i_matmulavx128_c) \ $(i_spread_c) selected_int_kind.inc selected_real_kind.inc kinds.h \ - $(i_cshift0_c) kinds.inc c99_protos.inc fpu-target.h fpu-target.inc + $(i_cshift0_c) kinds.inc c99_protos.inc fpu-target.h fpu-target.inc \ + $(i_cshift1a_c) # Machine generated specifics gfor_built_specific_src= \ @@ -986,6 +1027,9 @@ $(i_cshift0_c): m4/cshift0.m4 $(I_M4_DEPS) $(i_cshift1_c): m4/cshift1.m4 $(I_M4_DEPS) $(M4) -Dfile=$@ -I$(srcdir)/m4 cshift1.m4 > $@ +$(i_cshift1a_c): m4/cshift1a.m4 $(I_M$_DEPS) + $(M4) -Dfile=$@ -I$(srcdir)/m4 cshift1a.m4 > $@ + $(in_pack_c): m4/in_pack.m4 $(I_M4_DEPS) $(M4) -Dfile=$@ -I$(srcdir)/m4 in_pack.m4 > $@ |