aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
author Simon Pilgrim <llvm-dev@redking.me.uk> 2023-11-17 09:26:09 +0000
committer Simon Pilgrim <llvm-dev@redking.me.uk> 2023-11-17 10:01:31 +0000
commit 58253dcbcdfafb1fb1fb5ffc43d6f11a31f35e2a (patch)
tree 2535cac43a3cd976e75e8d31080a961d8fd2808d
parent 1c05fe350064aa3a1784bb09829a07d501842d97 (diff)
download llvm-58253dcbcdfafb1fb1fb5ffc43d6f11a31f35e2a.zip
llvm-58253dcbcdfafb1fb1fb5ffc43d6f11a31f35e2a.tar.gz
llvm-58253dcbcdfafb1fb1fb5ffc43d6f11a31f35e2a.tar.bz2
[X86] getTargetConstantBitsFromNode - bail if we're loading from a constant vector element type larger than the target value size

This can be improved upon by just truncating the constant value, but the crash needs to be addressed first.

Fixes #72539
-rw-r--r-- llvm/lib/Target/X86/X86ISelLowering.cpp | 2
-rw-r--r-- llvm/test/CodeGen/X86/pr72539.ll | 27
2 files changed, 29 insertions, 0 deletions
diff --git a/llvm/lib/Target/X86/X86ISelLowering.cpp b/llvm/lib/Target/X86/X86ISelLowering.cpp
index 7f9d971..cf66707 100644
--- a/llvm/lib/Target/X86/X86ISelLowering.cpp
+++ b/llvm/lib/Target/X86/X86ISelLowering.cpp
@@ -4664,6 +4664,8 @@ static bool getTargetConstantBitsFromNode(SDValue Op, unsigned EltSizeInBits,
unsigned SrcEltSizeInBits = CstTy->getScalarSizeInBits();
unsigned NumSrcElts = SizeInBits / SrcEltSizeInBits;
+ if ((SizeInBits % SrcEltSizeInBits) != 0)
+ return false;
APInt UndefSrcElts(NumSrcElts, 0);
SmallVector<APInt, 64> SrcEltBits(NumSrcElts, APInt(SrcEltSizeInBits, 0));
diff --git a/llvm/test/CodeGen/X86/pr72539.ll b/llvm/test/CodeGen/X86/pr72539.ll
new file mode 100644
index 0000000..fb4c98dca
--- /dev/null
+++ b/llvm/test/CodeGen/X86/pr72539.ll
@@ -0,0 +1,27 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 4
+; RUN: llc < %s -mtriple=x86_64-- -mcpu=x86-64 | FileCheck %s --check-prefixes=SSE
+; RUN: llc < %s -mtriple=x86_64-- -mcpu=x86-64-v2 | FileCheck %s --check-prefixes=SSE
+; RUN: llc < %s -mtriple=x86_64-- -mcpu=x86-64-v3 | FileCheck %s --check-prefixes=AVX
+; RUN: llc < %s -mtriple=x86_64-- -mcpu=x86-64-v4 | FileCheck %s --check-prefixes=AVX
+
+define void @PR72539(<8 x i32> %insertelement){
+; SSE-LABEL: PR72539:
+; SSE: # %bb.0:
+; SSE-NEXT: xorb $7, 0
+; SSE-NEXT: retq
+;
+; AVX-LABEL: PR72539:
+; AVX: # %bb.0:
+; AVX-NEXT: movzbl {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %eax
+; AVX-NEXT: xorb %al, 0
+; AVX-NEXT: retq
+ %load671 = load i8, ptr addrspace(1) null, align 1
+ %shufflevector = shufflevector <8 x i32> %insertelement, <8 x i32> zeroinitializer, <8 x i32> zeroinitializer
+ %xor68 = xor <8 x i32> %shufflevector, <i32 7, i32 0, i32 0, i32 0, i32 0, i32 0, i32 0, i32 0>
+ %call69 = call i32 @llvm.vector.reduce.xor.v8i32(<8 x i32> %xor68)
+ %trunc70 = trunc i32 %call69 to i8
+ %xor71 = xor i8 %load671, %trunc70
+ store i8 %xor71, ptr addrspace(1) null, align 1
+ ret void
+}
+declare i32 @llvm.vector.reduce.xor.v8i32(<8 x i32>)