diff options
Diffstat (limited to 'llvm/lib/CodeGen/SelectionDAG')
| -rw-r--r-- | llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp | 6 | ||||
| -rw-r--r-- | llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp | 101 | ||||
| -rw-r--r-- | llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.h | 12 | ||||
| -rw-r--r-- | llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp | 12 | 
4 files changed, 97 insertions, 34 deletions
| diff --git a/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp b/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp index d2ea652..8676060 100644 --- a/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp +++ b/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp @@ -19993,8 +19993,12 @@ static SDNode *getPostIndexedLoadStoreOp(SDNode *N, bool &IsLoad,    //    nor a successor of N. Otherwise, if Op is folded that would    //    create a cycle.    unsigned MaxSteps = SelectionDAG::getHasPredecessorMaxSteps(); -  for (SDNode *Op : Ptr->users()) { +  for (SDUse &U : Ptr->uses()) { +    if (U.getResNo() != Ptr.getResNo()) +      continue; +      // Check for #1. +    SDNode *Op = U.getUser();      if (!shouldCombineToPostInc(N, Ptr, Op, BasePtr, Offset, AM, DAG, TLI))        continue; diff --git a/llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp b/llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp index bfa566a..a522650 100644 --- a/llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp +++ b/llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp @@ -1162,6 +1162,43 @@ SDValue SelectionDAGBuilder::getMemoryRoot() {    return updateRoot(PendingLoads);  } +SDValue SelectionDAGBuilder::getFPOperationRoot(fp::ExceptionBehavior EB) { +  // If the new exception behavior differs from that of the pending +  // ones, chain up them and update the root. +  switch (EB) { +  case fp::ExceptionBehavior::ebMayTrap: +  case fp::ExceptionBehavior::ebIgnore: +    // Floating-point exceptions produced by such operations are not intended +    // to be observed, so the sequence of these operations does not need to be +    // preserved. +    // +    // They however must not be mixed with the instructions that have strict +    // exception behavior. Placing an operation with 'ebIgnore' behavior between +    // 'ebStrict' operations could distort the observed exception behavior. +    if (!PendingConstrainedFPStrict.empty()) { +      assert(PendingConstrainedFP.empty()); +      updateRoot(PendingConstrainedFPStrict); +    } +    break; +  case fp::ExceptionBehavior::ebStrict: +    // Floating-point exception produced by these operations may be observed, so +    // they must be correctly chained. If trapping on FP exceptions is +    // disabled, the exceptions can be observed only by functions that read +    // exception flags, like 'llvm.get_fpenv' or 'fetestexcept'. It means that +    // the order of operations is not significant between barriers. +    // +    // If trapping is enabled, each operation becomes an implicit observation +    // point, so the operations must be sequenced according their original +    // source order. +    if (!PendingConstrainedFP.empty()) { +      assert(PendingConstrainedFPStrict.empty()); +      updateRoot(PendingConstrainedFP); +    } +    // TODO: Add support for trapping-enabled scenarios. +  } +  return DAG.getRoot(); +} +  SDValue SelectionDAGBuilder::getRoot() {    // Chain up all pending constrained intrinsics together with all    // pending loads, by simply appending them to PendingLoads and @@ -1978,9 +2015,9 @@ SDValue SelectionDAGBuilder::getValueImpl(const Value *V) {      Register InReg = FuncInfo.InitializeRegForValue(Inst);      std::optional<CallingConv::ID> CallConv; -    auto *CI = dyn_cast<CallInst>(Inst); -    if (CI && !CI->isInlineAsm()) -      CallConv = CI->getCallingConv(); +    auto *CB = dyn_cast<CallBase>(Inst); +    if (CB && !CB->isInlineAsm()) +      CallConv = CB->getCallingConv();      RegsForValue RFV(*DAG.getContext(), TLI, DAG.getDataLayout(), InReg,                       Inst->getType(), CallConv); @@ -8298,6 +8335,30 @@ void SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I,    }  } +void SelectionDAGBuilder::pushFPOpOutChain(SDValue Result, +                                           fp::ExceptionBehavior EB) { +  assert(Result.getNode()->getNumValues() == 2); +  SDValue OutChain = Result.getValue(1); +  assert(OutChain.getValueType() == MVT::Other); + +  // Instead of updating the root immediately, push the produced chain to the +  // appropriate list, deferring the update until the root is requested. In this +  // case, the nodes from the lists are chained using TokenFactor, indicating +  // that the operations are independent. +  // +  // In particular, the root is updated before any call that might access the +  // floating-point environment, except for constrained intrinsics. +  switch (EB) { +  case fp::ExceptionBehavior::ebMayTrap: +  case fp::ExceptionBehavior::ebIgnore: +    PendingConstrainedFP.push_back(OutChain); +    break; +  case fp::ExceptionBehavior::ebStrict: +    PendingConstrainedFPStrict.push_back(OutChain); +    break; +  } +} +  void SelectionDAGBuilder::visitConstrainedFPIntrinsic(      const ConstrainedFPIntrinsic &FPI) {    SDLoc sdl = getCurSDLoc(); @@ -8305,42 +8366,16 @@ void SelectionDAGBuilder::visitConstrainedFPIntrinsic(    // We do not need to serialize constrained FP intrinsics against    // each other or against (nonvolatile) loads, so they can be    // chained like loads. -  SDValue Chain = DAG.getRoot(); +  fp::ExceptionBehavior EB = *FPI.getExceptionBehavior(); +  SDValue Chain = getFPOperationRoot(EB);    SmallVector<SDValue, 4> Opers;    Opers.push_back(Chain);    for (unsigned I = 0, E = FPI.getNonMetadataArgCount(); I != E; ++I)      Opers.push_back(getValue(FPI.getArgOperand(I))); -  auto pushOutChain = [this](SDValue Result, fp::ExceptionBehavior EB) { -    assert(Result.getNode()->getNumValues() == 2); - -    // Push node to the appropriate list so that future instructions can be -    // chained up correctly. -    SDValue OutChain = Result.getValue(1); -    switch (EB) { -    case fp::ExceptionBehavior::ebIgnore: -      // The only reason why ebIgnore nodes still need to be chained is that -      // they might depend on the current rounding mode, and therefore must -      // not be moved across instruction that may change that mode. -      [[fallthrough]]; -    case fp::ExceptionBehavior::ebMayTrap: -      // These must not be moved across calls or instructions that may change -      // floating-point exception masks. -      PendingConstrainedFP.push_back(OutChain); -      break; -    case fp::ExceptionBehavior::ebStrict: -      // These must not be moved across calls or instructions that may change -      // floating-point exception masks or read floating-point exception flags. -      // In addition, they cannot be optimized out even if unused. -      PendingConstrainedFPStrict.push_back(OutChain); -      break; -    } -  }; -    const TargetLowering &TLI = DAG.getTargetLoweringInfo();    EVT VT = TLI.getValueType(DAG.getDataLayout(), FPI.getType());    SDVTList VTs = DAG.getVTList(VT, MVT::Other); -  fp::ExceptionBehavior EB = *FPI.getExceptionBehavior();    SDNodeFlags Flags;    if (EB == fp::ExceptionBehavior::ebIgnore) @@ -8364,7 +8399,7 @@ void SelectionDAGBuilder::visitConstrainedFPIntrinsic(          !TLI.isFMAFasterThanFMulAndFAdd(DAG.getMachineFunction(), VT)) {        Opers.pop_back();        SDValue Mul = DAG.getNode(ISD::STRICT_FMUL, sdl, VTs, Opers, Flags); -      pushOutChain(Mul, EB); +      pushFPOpOutChain(Mul, EB);        Opcode = ISD::STRICT_FADD;        Opers.clear();        Opers.push_back(Mul.getValue(1)); @@ -8395,7 +8430,7 @@ void SelectionDAGBuilder::visitConstrainedFPIntrinsic(    }    SDValue Result = DAG.getNode(Opcode, sdl, VTs, Opers, Flags); -  pushOutChain(Result, EB); +  pushFPOpOutChain(Result, EB);    SDValue FPResult = Result.getValue(0);    setValue(&FPI, FPResult); diff --git a/llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.h b/llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.h index c7577fa..47e19f7 100644 --- a/llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.h +++ b/llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.h @@ -195,6 +195,11 @@ private:    /// Update root to include all chains from the Pending list.    SDValue updateRoot(SmallVectorImpl<SDValue> &Pending); +  /// Given a node representing a floating-point operation and its specified +  /// exception behavior, this either updates the root or stores the node in +  /// a list to be added to chains latter. +  void pushFPOpOutChain(SDValue Result, fp::ExceptionBehavior EB); +    /// A unique monotonically increasing number used to order the SDNodes we    /// create.    unsigned SDNodeOrder; @@ -300,6 +305,13 @@ public:    /// memory node that may need to be ordered after any prior load instructions.    SDValue getMemoryRoot(); +  /// Return the current virtual root of the Selection DAG, flushing +  /// PendingConstrainedFP or PendingConstrainedFPStrict items if the new +  /// exception behavior (specified by \p EB) differs from that of the pending +  /// instructions. This must be done before emitting constrained FP operation +  /// call. +  SDValue getFPOperationRoot(fp::ExceptionBehavior EB); +    /// Similar to getMemoryRoot, but also flushes PendingConstrainedFP(Strict)    /// items. This must be done before emitting any call other any other node    /// that may need to be ordered after FP instructions due to other side diff --git a/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp b/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp index 920dff9..da4e409 100644 --- a/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp +++ b/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp @@ -9899,6 +9899,18 @@ SDValue TargetLowering::expandBSWAP(SDNode *N, SelectionDAG &DAG) const {      // Use a rotate by 8. This can be further expanded if necessary.      return DAG.getNode(ISD::ROTL, dl, VT, Op, DAG.getConstant(8, dl, SHVT));    case MVT::i32: +    // This is meant for ARM speficially, which has ROTR but no ROTL. +    if (isOperationLegalOrCustom(ISD::ROTR, VT)) { +      SDValue Mask = DAG.getConstant(0x00FF00FF, dl, VT); +      // (x & 0x00FF00FF) rotr 8 | (x rotl 8) & 0x00FF00FF +      SDValue And = DAG.getNode(ISD::AND, dl, VT, Op, Mask); +      SDValue Rotr = +          DAG.getNode(ISD::ROTR, dl, VT, And, DAG.getConstant(8, dl, SHVT)); +      SDValue Rotl = +          DAG.getNode(ISD::ROTR, dl, VT, Op, DAG.getConstant(24, dl, SHVT)); +      SDValue And2 = DAG.getNode(ISD::AND, dl, VT, Rotl, Mask); +      return DAG.getNode(ISD::OR, dl, VT, Rotr, And2); +    }      Tmp4 = DAG.getNode(ISD::SHL, dl, VT, Op, DAG.getConstant(24, dl, SHVT));      Tmp3 = DAG.getNode(ISD::AND, dl, VT, Op,                         DAG.getConstant(0xFF00, dl, VT)); | 
