//===-- NVPTX.h - Top-level interface for NVPTX representation --*- C++ -*-===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // // This file contains the entry points for global functions defined in // the LLVM NVPTX back-end. // //===----------------------------------------------------------------------===// #ifndef LLVM_LIB_TARGET_NVPTX_NVPTX_H #define LLVM_LIB_TARGET_NVPTX_NVPTX_H #include "llvm/CodeGen/ISDOpcodes.h" #include "llvm/IR/PassManager.h" #include "llvm/Pass.h" #include "llvm/Support/AtomicOrdering.h" #include "llvm/Support/CodeGen.h" #include "llvm/Target/TargetMachine.h" namespace llvm { class FunctionPass; class MachineFunctionPass; class NVPTXTargetMachine; class PassRegistry; namespace NVPTXCC { enum CondCodes { EQ, NE, LT, LE, GT, GE }; } FunctionPass *createNVPTXISelDag(NVPTXTargetMachine &TM, llvm::CodeGenOptLevel OptLevel); ModulePass *createNVPTXAssignValidGlobalNamesPass(); ModulePass *createGenericToNVVMLegacyPass(); ModulePass *createNVPTXCtorDtorLoweringLegacyPass(); FunctionPass *createNVVMIntrRangePass(); ModulePass *createNVVMReflectPass(unsigned int SmVersion); MachineFunctionPass *createNVPTXPrologEpilogPass(); MachineFunctionPass *createNVPTXReplaceImageHandlesPass(); FunctionPass *createNVPTXImageOptimizerPass(); FunctionPass *createNVPTXLowerArgsPass(); FunctionPass *createNVPTXLowerAllocaPass(); FunctionPass *createNVPTXLowerUnreachablePass(bool TrapUnreachable, bool NoTrapAfterNoreturn); FunctionPass *createNVPTXTagInvariantLoadsPass(); MachineFunctionPass *createNVPTXPeephole(); MachineFunctionPass *createNVPTXProxyRegErasurePass(); MachineFunctionPass *createNVPTXForwardParamsPass(); void initializeNVVMReflectLegacyPassPass(PassRegistry &); void initializeGenericToNVVMLegacyPassPass(PassRegistry &); void initializeNVPTXAllocaHoistingPass(PassRegistry &); void initializeNVPTXAsmPrinterPass(PassRegistry &); void initializeNVPTXAssignValidGlobalNamesPass(PassRegistry &); void initializeNVPTXAtomicLowerPass(PassRegistry &); void initializeNVPTXCtorDtorLoweringLegacyPass(PassRegistry &); void initializeNVPTXLowerAggrCopiesPass(PassRegistry &); void initializeNVPTXLowerAllocaPass(PassRegistry &); void initializeNVPTXLowerUnreachablePass(PassRegistry &); void initializeNVPTXCtorDtorLoweringLegacyPass(PassRegistry &); void initializeNVPTXLowerArgsLegacyPassPass(PassRegistry &); void initializeNVPTXProxyRegErasurePass(PassRegistry &); void initializeNVPTXForwardParamsPassPass(PassRegistry &); void initializeNVVMIntrRangePass(PassRegistry &); void initializeNVVMReflectPass(PassRegistry &); void initializeNVPTXAAWrapperPassPass(PassRegistry &); void initializeNVPTXExternalAAWrapperPass(PassRegistry &); void initializeNVPTXPeepholePass(PassRegistry &); void initializeNVPTXTagInvariantLoadLegacyPassPass(PassRegistry &); void initializeNVPTXPrologEpilogPassPass(PassRegistry &); struct NVVMIntrRangePass : PassInfoMixin { PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM); }; struct NVVMReflectPass : PassInfoMixin { NVVMReflectPass() : SmVersion(0) {} NVVMReflectPass(unsigned SmVersion) : SmVersion(SmVersion) {} PreservedAnalyses run(Module &F, ModuleAnalysisManager &AM); private: unsigned SmVersion; }; struct GenericToNVVMPass : PassInfoMixin { PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM); }; struct NVPTXCopyByValArgsPass : PassInfoMixin { PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM); }; struct NVPTXLowerArgsPass : PassInfoMixin { private: TargetMachine &TM; public: NVPTXLowerArgsPass(TargetMachine &TM) : TM(TM) {}; PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM); }; struct NVPTXTagInvariantLoadsPass : PassInfoMixin { PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM); }; namespace NVPTX { enum DrvInterface { NVCL, CUDA }; // A field inside TSFlags needs a shift and a mask. The usage is // always as follows : // ((TSFlags & fieldMask) >> fieldShift) // The enum keeps the mask, the shift, and all valid values of the // field in one place. enum VecInstType { VecInstTypeShift = 0, VecInstTypeMask = 0xF, VecNOP = 0, VecLoad = 1, VecStore = 2, VecBuild = 3, VecShuffle = 4, VecExtract = 5, VecInsert = 6, VecDest = 7, VecOther = 15 }; enum SimpleMove { SimpleMoveMask = 0x10, SimpleMoveShift = 4 }; enum LoadStore { isLoadMask = 0x20, isLoadShift = 5, isStoreMask = 0x40, isStoreShift = 6 }; // Extends LLVM AtomicOrdering with PTX Orderings: using OrderingUnderlyingType = unsigned int; enum Ordering : OrderingUnderlyingType { NotAtomic = (OrderingUnderlyingType) AtomicOrdering::NotAtomic, // PTX calls these: "Weak" // Unordered = 1, // NVPTX maps LLVM Unorderd to Relaxed Relaxed = (OrderingUnderlyingType)AtomicOrdering::Monotonic, // Consume = 3, // Unimplemented in LLVM; NVPTX would map to "Acquire" Acquire = (OrderingUnderlyingType)AtomicOrdering::Acquire, Release = (OrderingUnderlyingType)AtomicOrdering::Release, AcquireRelease = (OrderingUnderlyingType)AtomicOrdering::AcquireRelease, SequentiallyConsistent = (OrderingUnderlyingType)AtomicOrdering::SequentiallyConsistent, Volatile = SequentiallyConsistent + 1, RelaxedMMIO = Volatile + 1, }; using ScopeUnderlyingType = unsigned int; enum Scope : ScopeUnderlyingType { Thread = 0, Block = 1, Cluster = 2, Device = 3, System = 4, DefaultDevice = 5, // For SM < 70: denotes PTX op implicit/default .gpu scope LASTSCOPE = DefaultDevice }; using AddressSpaceUnderlyingType = unsigned int; enum AddressSpace : AddressSpaceUnderlyingType { Generic = 0, Global = 1, Shared = 3, Const = 4, Local = 5, SharedCluster = 7, // NVPTX Backend Private: Param = 101 }; namespace PTXLdStInstCode { enum FromType { Unsigned = 0, Signed, Float, Untyped }; } // namespace PTXLdStInstCode /// PTXCvtMode - Conversion code enumeration namespace PTXCvtMode { enum CvtMode { NONE = 0, RNI, RZI, RMI, RPI, RN, RZ, RM, RP, RNA, BASE_MASK = 0x0F, FTZ_FLAG = 0x10, SAT_FLAG = 0x20, RELU_FLAG = 0x40 }; } /// PTXCmpMode - Comparison mode enumeration namespace PTXCmpMode { enum CmpMode { EQ = 0, NE, LT, LE, GT, GE, EQU, NEU, LTU, LEU, GTU, GEU, NUM, // NAN is a MACRO NotANumber, }; } namespace PTXPrmtMode { enum PrmtMode { NONE, F4E, B4E, RC8, ECL, ECR, RC16, }; } enum class DivPrecisionLevel : unsigned { Approx = 0, Full = 1, IEEE754 = 2, IEEE754_NoFTZ = 3, }; } // namespace NVPTX void initializeNVPTXDAGToDAGISelLegacyPass(PassRegistry &); } // namespace llvm // Defines symbolic names for NVPTX registers. This defines a mapping from // register name to register number. #define GET_REGINFO_ENUM #include "NVPTXGenRegisterInfo.inc" // Defines symbolic names for the NVPTX instructions. #define GET_INSTRINFO_ENUM #define GET_INSTRINFO_MC_HELPER_DECLS #include "NVPTXGenInstrInfo.inc" #endif