Subversion Repositories QNX 8.QNX8 LLVM/Clang compiler suite

Rev

Blame | Last modification | View Log | Download | RSS feed

  1. //===- Cloning.h - Clone various parts of LLVM programs ---------*- C++ -*-===//
  2. //
  3. // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
  4. // See https://llvm.org/LICENSE.txt for license information.
  5. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  6. //
  7. //===----------------------------------------------------------------------===//
  8. //
  9. // This file defines various functions that are used to clone chunks of LLVM
  10. // code for various purposes.  This varies from copying whole modules into new
  11. // modules, to cloning functions with different arguments, to inlining
  12. // functions, to copying basic blocks to support loop unrolling or superblock
  13. // formation, etc.
  14. //
  15. //===----------------------------------------------------------------------===//
  16.  
  17. #ifndef LLVM_TRANSFORMS_UTILS_CLONING_H
  18. #define LLVM_TRANSFORMS_UTILS_CLONING_H
  19.  
  20. #include "llvm/ADT/SmallVector.h"
  21. #include "llvm/ADT/Twine.h"
  22. #include "llvm/Analysis/AssumptionCache.h"
  23. #include "llvm/Analysis/InlineCost.h"
  24. #include "llvm/IR/ValueHandle.h"
  25. #include "llvm/Transforms/Utils/ValueMapper.h"
  26. #include <functional>
  27. #include <memory>
  28. #include <vector>
  29.  
  30. namespace llvm {
  31.  
  32. class AAResults;
  33. class AllocaInst;
  34. class BasicBlock;
  35. class BlockFrequencyInfo;
  36. class CallGraph;
  37. class DebugInfoFinder;
  38. class DominatorTree;
  39. class Function;
  40. class Instruction;
  41. class Loop;
  42. class LoopInfo;
  43. class Module;
  44. class ProfileSummaryInfo;
  45. class ReturnInst;
  46. class DomTreeUpdater;
  47.  
  48. /// Return an exact copy of the specified module
  49. std::unique_ptr<Module> CloneModule(const Module &M);
  50. std::unique_ptr<Module> CloneModule(const Module &M, ValueToValueMapTy &VMap);
  51.  
  52. /// Return a copy of the specified module. The ShouldCloneDefinition function
  53. /// controls whether a specific GlobalValue's definition is cloned. If the
  54. /// function returns false, the module copy will contain an external reference
  55. /// in place of the global definition.
  56. std::unique_ptr<Module>
  57. CloneModule(const Module &M, ValueToValueMapTy &VMap,
  58.             function_ref<bool(const GlobalValue *)> ShouldCloneDefinition);
  59.  
  60. /// This struct can be used to capture information about code
  61. /// being cloned, while it is being cloned.
  62. struct ClonedCodeInfo {
  63.   /// This is set to true if the cloned code contains a normal call instruction.
  64.   bool ContainsCalls = false;
  65.  
  66.   /// This is set to true if there is memprof related metadata (memprof or
  67.   /// callsite metadata) in the cloned code.
  68.   bool ContainsMemProfMetadata = false;
  69.  
  70.   /// This is set to true if the cloned code contains a 'dynamic' alloca.
  71.   /// Dynamic allocas are allocas that are either not in the entry block or they
  72.   /// are in the entry block but are not a constant size.
  73.   bool ContainsDynamicAllocas = false;
  74.  
  75.   /// All cloned call sites that have operand bundles attached are appended to
  76.   /// this vector.  This vector may contain nulls or undefs if some of the
  77.   /// originally inserted callsites were DCE'ed after they were cloned.
  78.   std::vector<WeakTrackingVH> OperandBundleCallSites;
  79.  
  80.   /// Like VMap, but maps only unsimplified instructions. Values in the map
  81.   /// may be dangling, it is only intended to be used via isSimplified(), to
  82.   /// check whether the main VMap mapping involves simplification or not.
  83.   DenseMap<const Value *, const Value *> OrigVMap;
  84.  
  85.   ClonedCodeInfo() = default;
  86.  
  87.   bool isSimplified(const Value *From, const Value *To) const {
  88.     return OrigVMap.lookup(From) != To;
  89.   }
  90. };
  91.  
  92. /// Return a copy of the specified basic block, but without
  93. /// embedding the block into a particular function.  The block returned is an
  94. /// exact copy of the specified basic block, without any remapping having been
  95. /// performed.  Because of this, this is only suitable for applications where
  96. /// the basic block will be inserted into the same function that it was cloned
  97. /// from (loop unrolling would use this, for example).
  98. ///
  99. /// Also, note that this function makes a direct copy of the basic block, and
  100. /// can thus produce illegal LLVM code.  In particular, it will copy any PHI
  101. /// nodes from the original block, even though there are no predecessors for the
  102. /// newly cloned block (thus, phi nodes will have to be updated).  Also, this
  103. /// block will branch to the old successors of the original block: these
  104. /// successors will have to have any PHI nodes updated to account for the new
  105. /// incoming edges.
  106. ///
  107. /// The correlation between instructions in the source and result basic blocks
  108. /// is recorded in the VMap map.
  109. ///
  110. /// If you have a particular suffix you'd like to use to add to any cloned
  111. /// names, specify it as the optional third parameter.
  112. ///
  113. /// If you would like the basic block to be auto-inserted into the end of a
  114. /// function, you can specify it as the optional fourth parameter.
  115. ///
  116. /// If you would like to collect additional information about the cloned
  117. /// function, you can specify a ClonedCodeInfo object with the optional fifth
  118. /// parameter.
  119. BasicBlock *CloneBasicBlock(const BasicBlock *BB, ValueToValueMapTy &VMap,
  120.                             const Twine &NameSuffix = "", Function *F = nullptr,
  121.                             ClonedCodeInfo *CodeInfo = nullptr,
  122.                             DebugInfoFinder *DIFinder = nullptr);
  123.  
  124. /// Return a copy of the specified function and add it to that
  125. /// function's module.  Also, any references specified in the VMap are changed
  126. /// to refer to their mapped value instead of the original one.  If any of the
  127. /// arguments to the function are in the VMap, the arguments are deleted from
  128. /// the resultant function.  The VMap is updated to include mappings from all of
  129. /// the instructions and basicblocks in the function from their old to new
  130. /// values.  The final argument captures information about the cloned code if
  131. /// non-null.
  132. ///
  133. /// \pre VMap contains no non-identity GlobalValue mappings.
  134. ///
  135. Function *CloneFunction(Function *F, ValueToValueMapTy &VMap,
  136.                         ClonedCodeInfo *CodeInfo = nullptr);
  137.  
  138. enum class CloneFunctionChangeType {
  139.   LocalChangesOnly,
  140.   GlobalChanges,
  141.   DifferentModule,
  142.   ClonedModule,
  143. };
  144.  
  145. /// Clone OldFunc into NewFunc, transforming the old arguments into references
  146. /// to VMap values.  Note that if NewFunc already has basic blocks, the ones
  147. /// cloned into it will be added to the end of the function.  This function
  148. /// fills in a list of return instructions, and can optionally remap types
  149. /// and/or append the specified suffix to all values cloned.
  150. ///
  151. /// If \p Changes is \a CloneFunctionChangeType::LocalChangesOnly, VMap is
  152. /// required to contain no non-identity GlobalValue mappings. Otherwise,
  153. /// referenced metadata will be cloned.
  154. ///
  155. /// If \p Changes is less than \a CloneFunctionChangeType::DifferentModule
  156. /// indicating cloning into the same module (even if it's LocalChangesOnly), if
  157. /// debug info metadata transitively references a \a DISubprogram, it will be
  158. /// cloned, effectively upgrading \p Changes to GlobalChanges while suppressing
  159. /// cloning of types and compile units.
  160. ///
  161. /// If \p Changes is \a CloneFunctionChangeType::DifferentModule, the new
  162. /// module's \c !llvm.dbg.cu will get updated with any newly created compile
  163. /// units. (\a CloneFunctionChangeType::ClonedModule leaves that work for the
  164. /// caller.)
  165. ///
  166. /// FIXME: Consider simplifying this function by splitting out \a
  167. /// CloneFunctionMetadataInto() and expecting / updating callers to call it
  168. /// first when / how it's needed.
  169. void CloneFunctionInto(Function *NewFunc, const Function *OldFunc,
  170.                        ValueToValueMapTy &VMap, CloneFunctionChangeType Changes,
  171.                        SmallVectorImpl<ReturnInst *> &Returns,
  172.                        const char *NameSuffix = "",
  173.                        ClonedCodeInfo *CodeInfo = nullptr,
  174.                        ValueMapTypeRemapper *TypeMapper = nullptr,
  175.                        ValueMaterializer *Materializer = nullptr);
  176.  
  177. void CloneAndPruneIntoFromInst(Function *NewFunc, const Function *OldFunc,
  178.                                const Instruction *StartingInst,
  179.                                ValueToValueMapTy &VMap, bool ModuleLevelChanges,
  180.                                SmallVectorImpl<ReturnInst *> &Returns,
  181.                                const char *NameSuffix = "",
  182.                                ClonedCodeInfo *CodeInfo = nullptr);
  183.  
  184. /// This works exactly like CloneFunctionInto,
  185. /// except that it does some simple constant prop and DCE on the fly.  The
  186. /// effect of this is to copy significantly less code in cases where (for
  187. /// example) a function call with constant arguments is inlined, and those
  188. /// constant arguments cause a significant amount of code in the callee to be
  189. /// dead.  Since this doesn't produce an exactly copy of the input, it can't be
  190. /// used for things like CloneFunction or CloneModule.
  191. ///
  192. /// If ModuleLevelChanges is false, VMap contains no non-identity GlobalValue
  193. /// mappings.
  194. ///
  195. void CloneAndPruneFunctionInto(Function *NewFunc, const Function *OldFunc,
  196.                                ValueToValueMapTy &VMap, bool ModuleLevelChanges,
  197.                                SmallVectorImpl<ReturnInst*> &Returns,
  198.                                const char *NameSuffix = "",
  199.                                ClonedCodeInfo *CodeInfo = nullptr);
  200.  
  201. /// This class captures the data input to the InlineFunction call, and records
  202. /// the auxiliary results produced by it.
  203. class InlineFunctionInfo {
  204. public:
  205.   explicit InlineFunctionInfo(
  206.       CallGraph *cg = nullptr,
  207.       function_ref<AssumptionCache &(Function &)> GetAssumptionCache = nullptr,
  208.       ProfileSummaryInfo *PSI = nullptr,
  209.       BlockFrequencyInfo *CallerBFI = nullptr,
  210.       BlockFrequencyInfo *CalleeBFI = nullptr, bool UpdateProfile = true)
  211.       : CG(cg), GetAssumptionCache(GetAssumptionCache), PSI(PSI),
  212.         CallerBFI(CallerBFI), CalleeBFI(CalleeBFI),
  213.         UpdateProfile(UpdateProfile) {}
  214.  
  215.   /// If non-null, InlineFunction will update the callgraph to reflect the
  216.   /// changes it makes.
  217.   CallGraph *CG;
  218.   function_ref<AssumptionCache &(Function &)> GetAssumptionCache;
  219.   ProfileSummaryInfo *PSI;
  220.   BlockFrequencyInfo *CallerBFI, *CalleeBFI;
  221.  
  222.   /// InlineFunction fills this in with all static allocas that get copied into
  223.   /// the caller.
  224.   SmallVector<AllocaInst *, 4> StaticAllocas;
  225.  
  226.   /// InlineFunction fills this in with callsites that were inlined from the
  227.   /// callee. This is only filled in if CG is non-null.
  228.   SmallVector<WeakTrackingVH, 8> InlinedCalls;
  229.  
  230.   /// All of the new call sites inlined into the caller.
  231.   ///
  232.   /// 'InlineFunction' fills this in by scanning the inlined instructions, and
  233.   /// only if CG is null. If CG is non-null, instead the value handle
  234.   /// `InlinedCalls` above is used.
  235.   SmallVector<CallBase *, 8> InlinedCallSites;
  236.  
  237.   /// Update profile for callee as well as cloned version. We need to do this
  238.   /// for regular inlining, but not for inlining from sample profile loader.
  239.   bool UpdateProfile;
  240.  
  241.   void reset() {
  242.     StaticAllocas.clear();
  243.     InlinedCalls.clear();
  244.     InlinedCallSites.clear();
  245.   }
  246. };
  247.  
  248. /// This function inlines the called function into the basic
  249. /// block of the caller.  This returns false if it is not possible to inline
  250. /// this call.  The program is still in a well defined state if this occurs
  251. /// though.
  252. ///
  253. /// Note that this only does one level of inlining.  For example, if the
  254. /// instruction 'call B' is inlined, and 'B' calls 'C', then the call to 'C' now
  255. /// exists in the instruction stream.  Similarly this will inline a recursive
  256. /// function by one level.
  257. ///
  258. /// Note that while this routine is allowed to cleanup and optimize the
  259. /// *inlined* code to minimize the actual inserted code, it must not delete
  260. /// code in the caller as users of this routine may have pointers to
  261. /// instructions in the caller that need to remain stable.
  262. ///
  263. /// If ForwardVarArgsTo is passed, inlining a function with varargs is allowed
  264. /// and all varargs at the callsite will be passed to any calls to
  265. /// ForwardVarArgsTo. The caller of InlineFunction has to make sure any varargs
  266. /// are only used by ForwardVarArgsTo.
  267. ///
  268. /// The callee's function attributes are merged into the callers' if
  269. /// MergeAttributes is set to true.
  270. InlineResult InlineFunction(CallBase &CB, InlineFunctionInfo &IFI,
  271.                             bool MergeAttributes = false,
  272.                             AAResults *CalleeAAR = nullptr,
  273.                             bool InsertLifetime = true,
  274.                             Function *ForwardVarArgsTo = nullptr);
  275.  
  276. /// Clones a loop \p OrigLoop.  Returns the loop and the blocks in \p
  277. /// Blocks.
  278. ///
  279. /// Updates LoopInfo and DominatorTree assuming the loop is dominated by block
  280. /// \p LoopDomBB.  Insert the new blocks before block specified in \p Before.
  281. /// Note: Only innermost loops are supported.
  282. Loop *cloneLoopWithPreheader(BasicBlock *Before, BasicBlock *LoopDomBB,
  283.                              Loop *OrigLoop, ValueToValueMapTy &VMap,
  284.                              const Twine &NameSuffix, LoopInfo *LI,
  285.                              DominatorTree *DT,
  286.                              SmallVectorImpl<BasicBlock *> &Blocks);
  287.  
  288. /// Remaps instructions in \p Blocks using the mapping in \p VMap.
  289. void remapInstructionsInBlocks(const SmallVectorImpl<BasicBlock *> &Blocks,
  290.                                ValueToValueMapTy &VMap);
  291.  
  292. /// Split edge between BB and PredBB and duplicate all non-Phi instructions
  293. /// from BB between its beginning and the StopAt instruction into the split
  294. /// block. Phi nodes are not duplicated, but their uses are handled correctly:
  295. /// we replace them with the uses of corresponding Phi inputs. ValueMapping
  296. /// is used to map the original instructions from BB to their newly-created
  297. /// copies. Returns the split block.
  298. BasicBlock *DuplicateInstructionsInSplitBetween(BasicBlock *BB,
  299.                                                 BasicBlock *PredBB,
  300.                                                 Instruction *StopAt,
  301.                                                 ValueToValueMapTy &ValueMapping,
  302.                                                 DomTreeUpdater &DTU);
  303.  
  304. /// Updates profile information by adjusting the entry count by adding
  305. /// EntryDelta then scaling callsite information by the new count divided by the
  306. /// old count. VMap is used during inlinng to also update the new clone
  307. void updateProfileCallee(
  308.     Function *Callee, int64_t EntryDelta,
  309.     const ValueMap<const Value *, WeakTrackingVH> *VMap = nullptr);
  310.  
  311. /// Find the 'llvm.experimental.noalias.scope.decl' intrinsics in the specified
  312. /// basic blocks and extract their scope. These are candidates for duplication
  313. /// when cloning.
  314. void identifyNoAliasScopesToClone(
  315.     ArrayRef<BasicBlock *> BBs, SmallVectorImpl<MDNode *> &NoAliasDeclScopes);
  316.  
  317. /// Find the 'llvm.experimental.noalias.scope.decl' intrinsics in the specified
  318. /// instruction range and extract their scope. These are candidates for
  319. /// duplication when cloning.
  320. void identifyNoAliasScopesToClone(
  321.     BasicBlock::iterator Start, BasicBlock::iterator End,
  322.     SmallVectorImpl<MDNode *> &NoAliasDeclScopes);
  323.  
  324. /// Duplicate the specified list of noalias decl scopes.
  325. /// The 'Ext' string is added as an extension to the name.
  326. /// Afterwards, the ClonedScopes contains the mapping of the original scope
  327. /// MDNode onto the cloned scope.
  328. /// Be aware that the cloned scopes are still part of the original scope domain.
  329. void cloneNoAliasScopes(
  330.     ArrayRef<MDNode *> NoAliasDeclScopes,
  331.     DenseMap<MDNode *, MDNode *> &ClonedScopes,
  332.     StringRef Ext, LLVMContext &Context);
  333.  
  334. /// Adapt the metadata for the specified instruction according to the
  335. /// provided mapping. This is normally used after cloning an instruction, when
  336. /// some noalias scopes needed to be cloned.
  337. void adaptNoAliasScopes(
  338.     llvm::Instruction *I, const DenseMap<MDNode *, MDNode *> &ClonedScopes,
  339.     LLVMContext &Context);
  340.  
  341. /// Clone the specified noalias decl scopes. Then adapt all instructions in the
  342. /// NewBlocks basicblocks to the cloned versions.
  343. /// 'Ext' will be added to the duplicate scope names.
  344. void cloneAndAdaptNoAliasScopes(ArrayRef<MDNode *> NoAliasDeclScopes,
  345.                                 ArrayRef<BasicBlock *> NewBlocks,
  346.                                 LLVMContext &Context, StringRef Ext);
  347.  
  348. /// Clone the specified noalias decl scopes. Then adapt all instructions in the
  349. /// [IStart, IEnd] (IEnd included !) range to the cloned versions. 'Ext' will be
  350. /// added to the duplicate scope names.
  351. void cloneAndAdaptNoAliasScopes(ArrayRef<MDNode *> NoAliasDeclScopes,
  352.                                 Instruction *IStart, Instruction *IEnd,
  353.                                 LLVMContext &Context, StringRef Ext);
  354. } // end namespace llvm
  355.  
  356. #endif // LLVM_TRANSFORMS_UTILS_CLONING_H
  357.