diff options
Diffstat (limited to 'llvm/lib/Transforms')
| -rw-r--r-- | llvm/lib/Transforms/IPO/Attributor.cpp | 3 | ||||
| -rw-r--r-- | llvm/lib/Transforms/InstCombine/InstCombineCalls.cpp | 12 | ||||
| -rw-r--r-- | llvm/lib/Transforms/InstCombine/InstCombineSelect.cpp | 26 | ||||
| -rw-r--r-- | llvm/lib/Transforms/Instrumentation/MemorySanitizer.cpp | 40 | ||||
| -rw-r--r-- | llvm/lib/Transforms/Vectorize/VPlan.h | 14 | ||||
| -rw-r--r-- | llvm/lib/Transforms/Vectorize/VPlanUtils.cpp | 57 | ||||
| -rw-r--r-- | llvm/lib/Transforms/Vectorize/VPlanUtils.h | 54 | 
7 files changed, 135 insertions, 71 deletions
| diff --git a/llvm/lib/Transforms/IPO/Attributor.cpp b/llvm/lib/Transforms/IPO/Attributor.cpp index 077d29f..3b59ebb 100644 --- a/llvm/lib/Transforms/IPO/Attributor.cpp +++ b/llvm/lib/Transforms/IPO/Attributor.cpp @@ -272,6 +272,9 @@ AA::getInitialValueForObj(Attributor &A, const AbstractAttribute &QueryingAA,    }    if (RangePtr && !RangePtr->offsetOrSizeAreUnknown()) { +    int64_t StorageSize = DL.getTypeStoreSize(&Ty); +    if (StorageSize != RangePtr->Size) +      return nullptr;      APInt Offset = APInt(64, RangePtr->Offset);      return ConstantFoldLoadFromConst(Initializer, &Ty, Offset, DL);    } diff --git a/llvm/lib/Transforms/InstCombine/InstCombineCalls.cpp b/llvm/lib/Transforms/InstCombine/InstCombineCalls.cpp index 669d4f0..8d9933b 100644 --- a/llvm/lib/Transforms/InstCombine/InstCombineCalls.cpp +++ b/llvm/lib/Transforms/InstCombine/InstCombineCalls.cpp @@ -582,6 +582,18 @@ static Instruction *foldCttzCtlz(IntrinsicInst &II, InstCombinerImpl &IC) {            IC.Builder.CreateBinaryIntrinsic(Intrinsic::ctlz, C, Op1);        return BinaryOperator::CreateSub(ConstCtlz, X);      } + +    // ctlz(~x & (x - 1)) -> bitwidth - cttz(x, false) +    if (Op0->hasOneUse() && +        match(Op0, +              m_c_And(m_Not(m_Value(X)), m_Add(m_Deferred(X), m_AllOnes())))) { +      Type *Ty = II.getType(); +      unsigned BitWidth = Ty->getScalarSizeInBits(); +      auto *Cttz = IC.Builder.CreateIntrinsic(Intrinsic::cttz, Ty, +                                              {X, IC.Builder.getFalse()}); +      auto *Bw = ConstantInt::get(Ty, APInt(BitWidth, BitWidth)); +      return IC.replaceInstUsesWith(II, IC.Builder.CreateSub(Bw, Cttz)); +    }    }    // cttz(Pow2) -> Log2(Pow2) diff --git a/llvm/lib/Transforms/InstCombine/InstCombineSelect.cpp b/llvm/lib/Transforms/InstCombine/InstCombineSelect.cpp index 5aa8de3..f5130da 100644 --- a/llvm/lib/Transforms/InstCombine/InstCombineSelect.cpp +++ b/llvm/lib/Transforms/InstCombine/InstCombineSelect.cpp @@ -4697,5 +4697,31 @@ Instruction *InstCombinerImpl::visitSelectInst(SelectInst &SI) {                  cast<IntrinsicInst>(TrueVal)->getParamAlign(0).valueOrOne(),                  CondVal, FalseVal)); +  // Canonicalize sign function ashr pattern: select (icmp slt X, 1), ashr X, +  // bitwidth-1, 1 -> scmp(X, 0) +  // Also handles: select (icmp sgt X, 0), 1, ashr X, bitwidth-1 -> scmp(X, 0) +  unsigned BitWidth = SI.getType()->getScalarSizeInBits(); +  CmpPredicate Pred; +  Value *CmpLHS, *CmpRHS; + +  // Canonicalize sign function ashr patterns: +  // select (icmp slt X, 1), ashr X, bitwidth-1, 1 -> scmp(X, 0) +  // select (icmp sgt X, 0), 1, ashr X, bitwidth-1 -> scmp(X, 0) +  if (match(&SI, m_Select(m_ICmp(Pred, m_Value(CmpLHS), m_Value(CmpRHS)), +                          m_Value(TrueVal), m_Value(FalseVal))) && +      ((Pred == ICmpInst::ICMP_SLT && match(CmpRHS, m_One()) && +        match(TrueVal, +              m_AShr(m_Specific(CmpLHS), m_SpecificInt(BitWidth - 1))) && +        match(FalseVal, m_One())) || +       (Pred == ICmpInst::ICMP_SGT && match(CmpRHS, m_Zero()) && +        match(TrueVal, m_One()) && +        match(FalseVal, +              m_AShr(m_Specific(CmpLHS), m_SpecificInt(BitWidth - 1)))))) { + +    Function *Scmp = Intrinsic::getOrInsertDeclaration( +        SI.getModule(), Intrinsic::scmp, {SI.getType(), SI.getType()}); +    return CallInst::Create(Scmp, {CmpLHS, ConstantInt::get(SI.getType(), 0)}); +  } +    return nullptr;  } diff --git a/llvm/lib/Transforms/Instrumentation/MemorySanitizer.cpp b/llvm/lib/Transforms/Instrumentation/MemorySanitizer.cpp index b6cbecb..10b03bb 100644 --- a/llvm/lib/Transforms/Instrumentation/MemorySanitizer.cpp +++ b/llvm/lib/Transforms/Instrumentation/MemorySanitizer.cpp @@ -226,6 +226,7 @@ static const Align kMinOriginAlignment = Align(4);  static const Align kShadowTLSAlignment = Align(8);  // These constants must be kept in sync with the ones in msan.h. +// TODO: increase size to match SVE/SVE2/SME/SME2 limits  static const unsigned kParamTLSSize = 800;  static const unsigned kRetvalTLSSize = 800; @@ -1544,6 +1545,22 @@ struct MemorySanitizerVisitor : public InstVisitor<MemorySanitizerVisitor> {      }    } +  static bool isAArch64SVCount(Type *Ty) { +    if (TargetExtType *TTy = dyn_cast<TargetExtType>(Ty)) +      return TTy->getName() == "aarch64.svcount"; +    return false; +  } + +  // This is intended to match the "AArch64 Predicate-as-Counter Type" (aka +  // 'target("aarch64.svcount")', but not e.g., <vscale x 4 x i32>. +  static bool isScalableNonVectorType(Type *Ty) { +    if (!isAArch64SVCount(Ty)) +      LLVM_DEBUG(dbgs() << "isScalableNonVectorType: Unexpected type " << *Ty +                        << "\n"); + +    return Ty->isScalableTy() && !isa<VectorType>(Ty); +  } +    void materializeChecks() {  #ifndef NDEBUG      // For assert below. @@ -1672,6 +1689,12 @@ struct MemorySanitizerVisitor : public InstVisitor<MemorySanitizerVisitor> {        LLVM_DEBUG(dbgs() << "getShadowTy: " << *ST << " ===> " << *Res << "\n");        return Res;      } +    if (isScalableNonVectorType(OrigTy)) { +      LLVM_DEBUG(dbgs() << "getShadowTy: Scalable non-vector type: " << *OrigTy +                        << "\n"); +      return OrigTy; +    } +      uint32_t TypeSize = DL.getTypeSizeInBits(OrigTy);      return IntegerType::get(*MS.C, TypeSize);    } @@ -2185,8 +2208,14 @@ struct MemorySanitizerVisitor : public InstVisitor<MemorySanitizerVisitor> {                          << *OrigIns << "\n");        return;      } -#ifndef NDEBUG +      Type *ShadowTy = Shadow->getType(); +    if (isScalableNonVectorType(ShadowTy)) { +      LLVM_DEBUG(dbgs() << "Skipping check of scalable non-vector " << *Shadow +                        << " before " << *OrigIns << "\n"); +      return; +    } +#ifndef NDEBUG      assert((isa<IntegerType>(ShadowTy) || isa<VectorType>(ShadowTy) ||              isa<StructType>(ShadowTy) || isa<ArrayType>(ShadowTy)) &&             "Can only insert checks for integer, vector, and aggregate shadow " @@ -6972,6 +7001,15 @@ struct MemorySanitizerVisitor : public InstVisitor<MemorySanitizerVisitor> {        // an extra "select". This results in much more compact IR.        // Sa = select Sb, poisoned, (select b, Sc, Sd)        Sa1 = getPoisonedShadow(getShadowTy(I.getType())); +    } else if (isScalableNonVectorType(I.getType())) { +      // This is intended to handle target("aarch64.svcount"), which can't be +      // handled in the else branch because of incompatibility with CreateXor +      // ("The supported LLVM operations on this type are limited to load, +      // store, phi, select and alloca instructions"). + +      // TODO: this currently underapproximates. Use Arm SVE EOR in the else +      //       branch as needed instead. +      Sa1 = getCleanShadow(getShadowTy(I.getType()));      } else {        // Sa = select Sb, [ (c^d) | Sc | Sd ], [ b ? Sc : Sd ]        // If Sb (condition is poisoned), look for bits in c and d that are equal diff --git a/llvm/lib/Transforms/Vectorize/VPlan.h b/llvm/lib/Transforms/Vectorize/VPlan.h index a1ad2db..2591df8 100644 --- a/llvm/lib/Transforms/Vectorize/VPlan.h +++ b/llvm/lib/Transforms/Vectorize/VPlan.h @@ -4172,11 +4172,6 @@ class VPlan {    /// definitions are VPValues that hold a pointer to their underlying IR.    SmallVector<VPValue *, 16> VPLiveIns; -  /// Mapping from SCEVs to the VPValues representing their expansions. -  /// NOTE: This mapping is temporary and will be removed once all users have -  /// been modeled in VPlan directly. -  DenseMap<const SCEV *, VPValue *> SCEVToExpansion; -    /// Blocks allocated and owned by the VPlan. They will be deleted once the    /// VPlan is destroyed.    SmallVector<VPBlockBase *> CreatedBlocks; @@ -4424,15 +4419,6 @@ public:    LLVM_DUMP_METHOD void dump() const;  #endif -  VPValue *getSCEVExpansion(const SCEV *S) const { -    return SCEVToExpansion.lookup(S); -  } - -  void addSCEVExpansion(const SCEV *S, VPValue *V) { -    assert(!SCEVToExpansion.contains(S) && "SCEV already expanded"); -    SCEVToExpansion[S] = V; -  } -    /// Clone the current VPlan, update all VPValues of the new VPlan and cloned    /// recipes to refer to the clones, and return it.    VPlan *duplicate(); diff --git a/llvm/lib/Transforms/Vectorize/VPlanUtils.cpp b/llvm/lib/Transforms/Vectorize/VPlanUtils.cpp index 06c3d75..4db92e7 100644 --- a/llvm/lib/Transforms/Vectorize/VPlanUtils.cpp +++ b/llvm/lib/Transforms/Vectorize/VPlanUtils.cpp @@ -32,8 +32,6 @@ bool vputils::onlyScalarValuesUsed(const VPValue *Def) {  }  VPValue *vputils::getOrCreateVPValueForSCEVExpr(VPlan &Plan, const SCEV *Expr) { -  if (auto *Expanded = Plan.getSCEVExpansion(Expr)) -    return Expanded;    VPValue *Expanded = nullptr;    if (auto *E = dyn_cast<SCEVConstant>(Expr))      Expanded = Plan.getOrAddLiveIn(E->getValue()); @@ -50,7 +48,6 @@ VPValue *vputils::getOrCreateVPValueForSCEVExpr(VPlan &Plan, const SCEV *Expr) {        Plan.getEntry()->appendRecipe(Expanded->getDefiningRecipe());      }    } -  Plan.addSCEVExpansion(Expr, Expanded);    return Expanded;  } @@ -92,6 +89,60 @@ const SCEV *vputils::getSCEVExprForVPValue(VPValue *V, ScalarEvolution &SE) {        .Default([&SE](const VPRecipeBase *) { return SE.getCouldNotCompute(); });  } +bool vputils::isSingleScalar(const VPValue *VPV) { +  auto PreservesUniformity = [](unsigned Opcode) -> bool { +    if (Instruction::isBinaryOp(Opcode) || Instruction::isCast(Opcode)) +      return true; +    switch (Opcode) { +    case Instruction::GetElementPtr: +    case Instruction::ICmp: +    case Instruction::FCmp: +    case Instruction::Select: +    case VPInstruction::Not: +    case VPInstruction::Broadcast: +    case VPInstruction::PtrAdd: +      return true; +    default: +      return false; +    } +  }; + +  // A live-in must be uniform across the scope of VPlan. +  if (VPV->isLiveIn()) +    return true; + +  if (auto *Rep = dyn_cast<VPReplicateRecipe>(VPV)) { +    const VPRegionBlock *RegionOfR = Rep->getRegion(); +    // Don't consider recipes in replicate regions as uniform yet; their first +    // lane cannot be accessed when executing the replicate region for other +    // lanes. +    if (RegionOfR && RegionOfR->isReplicator()) +      return false; +    return Rep->isSingleScalar() || (PreservesUniformity(Rep->getOpcode()) && +                                     all_of(Rep->operands(), isSingleScalar)); +  } +  if (isa<VPWidenGEPRecipe, VPDerivedIVRecipe, VPBlendRecipe, +          VPWidenSelectRecipe>(VPV)) +    return all_of(VPV->getDefiningRecipe()->operands(), isSingleScalar); +  if (auto *WidenR = dyn_cast<VPWidenRecipe>(VPV)) { +    return PreservesUniformity(WidenR->getOpcode()) && +           all_of(WidenR->operands(), isSingleScalar); +  } +  if (auto *VPI = dyn_cast<VPInstruction>(VPV)) +    return VPI->isSingleScalar() || VPI->isVectorToScalar() || +           (PreservesUniformity(VPI->getOpcode()) && +            all_of(VPI->operands(), isSingleScalar)); +  if (isa<VPPartialReductionRecipe>(VPV)) +    return false; +  if (isa<VPReductionRecipe>(VPV)) +    return true; +  if (auto *Expr = dyn_cast<VPExpressionRecipe>(VPV)) +    return Expr->isSingleScalar(); + +  // VPExpandSCEVRecipes must be placed in the entry and are always uniform. +  return isa<VPExpandSCEVRecipe>(VPV); +} +  bool vputils::isUniformAcrossVFsAndUFs(VPValue *V) {    // Live-ins are uniform.    if (V->isLiveIn()) diff --git a/llvm/lib/Transforms/Vectorize/VPlanUtils.h b/llvm/lib/Transforms/Vectorize/VPlanUtils.h index 840a5b9..37cd413 100644 --- a/llvm/lib/Transforms/Vectorize/VPlanUtils.h +++ b/llvm/lib/Transforms/Vectorize/VPlanUtils.h @@ -41,59 +41,7 @@ const SCEV *getSCEVExprForVPValue(VPValue *V, ScalarEvolution &SE);  /// Returns true if \p VPV is a single scalar, either because it produces the  /// same value for all lanes or only has its first lane used. -inline bool isSingleScalar(const VPValue *VPV) { -  auto PreservesUniformity = [](unsigned Opcode) -> bool { -    if (Instruction::isBinaryOp(Opcode) || Instruction::isCast(Opcode)) -      return true; -    switch (Opcode) { -    case Instruction::GetElementPtr: -    case Instruction::ICmp: -    case Instruction::FCmp: -    case Instruction::Select: -    case VPInstruction::Not: -    case VPInstruction::Broadcast: -    case VPInstruction::PtrAdd: -      return true; -    default: -      return false; -    } -  }; - -  // A live-in must be uniform across the scope of VPlan. -  if (VPV->isLiveIn()) -    return true; - -  if (auto *Rep = dyn_cast<VPReplicateRecipe>(VPV)) { -    const VPRegionBlock *RegionOfR = Rep->getRegion(); -    // Don't consider recipes in replicate regions as uniform yet; their first -    // lane cannot be accessed when executing the replicate region for other -    // lanes. -    if (RegionOfR && RegionOfR->isReplicator()) -      return false; -    return Rep->isSingleScalar() || (PreservesUniformity(Rep->getOpcode()) && -                                     all_of(Rep->operands(), isSingleScalar)); -  } -  if (isa<VPWidenGEPRecipe, VPDerivedIVRecipe, VPBlendRecipe, -          VPWidenSelectRecipe>(VPV)) -    return all_of(VPV->getDefiningRecipe()->operands(), isSingleScalar); -  if (auto *WidenR = dyn_cast<VPWidenRecipe>(VPV)) { -    return PreservesUniformity(WidenR->getOpcode()) && -           all_of(WidenR->operands(), isSingleScalar); -  } -  if (auto *VPI = dyn_cast<VPInstruction>(VPV)) -    return VPI->isSingleScalar() || VPI->isVectorToScalar() || -           (PreservesUniformity(VPI->getOpcode()) && -            all_of(VPI->operands(), isSingleScalar)); -  if (isa<VPPartialReductionRecipe>(VPV)) -    return false; -  if (isa<VPReductionRecipe>(VPV)) -    return true; -  if (auto *Expr = dyn_cast<VPExpressionRecipe>(VPV)) -    return Expr->isSingleScalar(); - -  // VPExpandSCEVRecipes must be placed in the entry and are alway uniform. -  return isa<VPExpandSCEVRecipe>(VPV); -} +bool isSingleScalar(const VPValue *VPV);  /// Return true if \p V is a header mask in \p Plan.  bool isHeaderMask(const VPValue *V, const VPlan &Plan); | 
