aboutsummaryrefslogtreecommitdiff
path: root/gcc
diff options
context:
space:
mode:
authorliuhongt <hongtao.liu@intel.com>2022-03-28 11:12:37 +0800
committerliuhongt <hongtao.liu@intel.com>2022-03-28 16:14:37 +0800
commite4352a0fee49441a32d12e8d8b98c425cfed4a86 (patch)
tree9b1a031788c7843ad96143e09d39e60603956d04 /gcc
parent50f9148f7a8daf1fa1608cb23595c3cca191da0f (diff)
downloadgcc-e4352a0fee49441a32d12e8d8b98c425cfed4a86.zip
gcc-e4352a0fee49441a32d12e8d8b98c425cfed4a86.tar.gz
gcc-e4352a0fee49441a32d12e8d8b98c425cfed4a86.tar.bz2
Fix typo in vec_setv8hi_0.
pinsrw is available for both reg and mem operand under sse2. pextrw requires sse4.1 for mem operands. The patch change attr "isa" for pinsrw mem alternative from sse4_noavx to noavx, will enable below optimization. - movzwl (%rdi), %eax pxor %xmm1, %xmm1 - pinsrw $0, %eax, %xmm1 + pinsrw $0, (%rdi), %xmm1 movdqa %xmm1, %xmm0 gcc/ChangeLog: PR target/105066 * config/i386/sse.md (vec_set<mode>_0): Change attr "isa" of alternative 4 from sse4_noavx to noavx. gcc/testsuite/ChangeLog: * gcc.target/i386/pr105066.c: New test.
Diffstat (limited to 'gcc')
-rw-r--r--gcc/config/i386/sse.md4
-rw-r--r--gcc/testsuite/gcc.target/i386/pr105066.c10
2 files changed, 12 insertions, 2 deletions
diff --git a/gcc/config/i386/sse.md b/gcc/config/i386/sse.md
index 58d2bd9..01543af 100644
--- a/gcc/config/i386/sse.md
+++ b/gcc/config/i386/sse.md
@@ -10617,9 +10617,9 @@
[(set (attr "isa")
(cond [(eq_attr "alternative" "0,1,2")
(const_string "avx512fp16")
- (eq_attr "alternative" "3")
+ (eq_attr "alternative" "3,4")
(const_string "noavx")
- (eq_attr "alternative" "4,5,6")
+ (eq_attr "alternative" "5,6")
(const_string "sse4_noavx")
(eq_attr "alternative" "7,8,9")
(const_string "avx")
diff --git a/gcc/testsuite/gcc.target/i386/pr105066.c b/gcc/testsuite/gcc.target/i386/pr105066.c
new file mode 100644
index 0000000..c5c5b9e
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/pr105066.c
@@ -0,0 +1,10 @@
+/* { dg-do compile } */
+/* { dg-options "-O2 -msse2 -mno-sse4.1" } */
+/* { dg-final { scan-assembler-not "movzwl" } } */
+/* { dg-final { scan-assembler {(?n)pinsrw[ \t]+\$0.*\(%} } } */
+
+#include <immintrin.h>
+
+__m128i load16(void *p){
+ return _mm_loadu_si16(p);
+}