From f6b10ed8e9a00de49d0951e760cc2b5288862b47 Mon Sep 17 00:00:00 2001 From: "H.J. Lu" Date: Thu, 10 Aug 2023 11:24:30 -0700 Subject: x86_64: Add log2 with FMA On Skylake, it improves log2 bench performance by: Before After Improvement max 208.779 63.827 69% min 9.977 6.55 34% mean 10.366 6.8191 34% --- sysdeps/x86_64/fpu/multiarch/Makefile | 2 ++ sysdeps/x86_64/fpu/multiarch/e_log2-fma.c | 3 +++ sysdeps/x86_64/fpu/multiarch/e_log2.c | 43 +++++++++++++++++++++++++++++++ 3 files changed, 48 insertions(+) create mode 100644 sysdeps/x86_64/fpu/multiarch/e_log2-fma.c create mode 100644 sysdeps/x86_64/fpu/multiarch/e_log2.c (limited to 'sysdeps/x86_64') diff --git a/sysdeps/x86_64/fpu/multiarch/Makefile b/sysdeps/x86_64/fpu/multiarch/Makefile index e37e488..f773255 100644 --- a/sysdeps/x86_64/fpu/multiarch/Makefile +++ b/sysdeps/x86_64/fpu/multiarch/Makefile @@ -34,6 +34,7 @@ libm-sysdep_routines += \ e_atan2-fma \ e_exp-fma \ e_log-fma \ + e_log2-fma \ e_pow-fma \ s_atan-fma \ s_sin-fma \ @@ -45,6 +46,7 @@ CFLAGS-e_asin-fma.c = -mfma -mavx2 CFLAGS-e_atan2-fma.c = -mfma -mavx2 CFLAGS-e_exp-fma.c = -mfma -mavx2 CFLAGS-e_log-fma.c = -mfma -mavx2 +CFLAGS-e_log2-fma.c = -mfma -mavx2 CFLAGS-e_pow-fma.c = -mfma -mavx2 CFLAGS-s_atan-fma.c = -mfma -mavx2 CFLAGS-s_sin-fma.c = -mfma -mavx2 diff --git a/sysdeps/x86_64/fpu/multiarch/e_log2-fma.c b/sysdeps/x86_64/fpu/multiarch/e_log2-fma.c new file mode 100644 index 0000000..9fbebc1 --- /dev/null +++ b/sysdeps/x86_64/fpu/multiarch/e_log2-fma.c @@ -0,0 +1,3 @@ +#define __log2 __log2_fma + +#include diff --git a/sysdeps/x86_64/fpu/multiarch/e_log2.c b/sysdeps/x86_64/fpu/multiarch/e_log2.c new file mode 100644 index 0000000..c0320ca --- /dev/null +++ b/sysdeps/x86_64/fpu/multiarch/e_log2.c @@ -0,0 +1,43 @@ +/* Multiple versions of log2. + Copyright (C) 2023 Free Software Foundation, Inc. + This file is part of the GNU C Library. + + The GNU C Library is free software; you can redistribute it and/or + modify it under the terms of the GNU Lesser General Public + License as published by the Free Software Foundation; either + version 2.1 of the License, or (at your option) any later version. + + The GNU C Library is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + Lesser General Public License for more details. + + You should have received a copy of the GNU Lesser General Public + License along with the GNU C Library; if not, see + . */ + +#include +#include + +extern double __redirect_log2 (double); + +#define SYMBOL_NAME log2 +#include "ifunc-fma.h" + +libc_ifunc_redirected (__redirect_log2, __log2, IFUNC_SELECTOR ()); + +#ifdef SHARED +__hidden_ver1 (__log2, __GI___log2, __redirect_log2) + __attribute__ ((visibility ("hidden"))); + +versioned_symbol (libm, __ieee754_log2, log2, GLIBC_2_29); +libm_alias_double_other (__log2, log2) +#else +libm_alias_double (__log2, log2) +#endif + +strong_alias (__log2, __ieee754_log2) +libm_alias_finite (__log2, __log2) + +#define __log2 __log2_sse2 +#include -- cgit v1.1