Home | History | Annotate | Line # | Download | only in Analysis
      1 //===- llvm/Analysis/MemoryDependenceAnalysis.h - Memory Deps ---*- C++ -*-===//
      2 //
      3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
      4 // See https://llvm.org/LICENSE.txt for license information.
      5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
      6 //
      7 //===----------------------------------------------------------------------===//
      8 //
      9 // This file defines the MemoryDependenceAnalysis analysis pass.
     10 //
     11 //===----------------------------------------------------------------------===//
     12 
     13 #ifndef LLVM_ANALYSIS_MEMORYDEPENDENCEANALYSIS_H
     14 #define LLVM_ANALYSIS_MEMORYDEPENDENCEANALYSIS_H
     15 
     16 #include "llvm/ADT/DenseMap.h"
     17 #include "llvm/ADT/Optional.h"
     18 #include "llvm/ADT/PointerEmbeddedInt.h"
     19 #include "llvm/ADT/PointerIntPair.h"
     20 #include "llvm/ADT/PointerSumType.h"
     21 #include "llvm/ADT/SmallPtrSet.h"
     22 #include "llvm/Analysis/MemoryLocation.h"
     23 #include "llvm/IR/BasicBlock.h"
     24 #include "llvm/IR/Metadata.h"
     25 #include "llvm/IR/PassManager.h"
     26 #include "llvm/IR/PredIteratorCache.h"
     27 #include "llvm/IR/ValueHandle.h"
     28 #include "llvm/Pass.h"
     29 #include "llvm/Support/ErrorHandling.h"
     30 #include <cassert>
     31 #include <cstdint>
     32 #include <utility>
     33 #include <vector>
     34 
     35 namespace llvm {
     36 
     37 class AAResults;
     38 class AssumptionCache;
     39 class BatchAAResults;
     40 class DominatorTree;
     41 class Function;
     42 class Instruction;
     43 class LoadInst;
     44 class PHITransAddr;
     45 class TargetLibraryInfo;
     46 class PhiValues;
     47 class Value;
     48 
     49 /// A memory dependence query can return one of three different answers.
     50 class MemDepResult {
     51   enum DepType {
     52     /// Clients of MemDep never see this.
     53     ///
     54     /// Entries with this marker occur in a LocalDeps map or NonLocalDeps map
     55     /// when the instruction they previously referenced was removed from
     56     /// MemDep.  In either case, the entry may include an instruction pointer.
     57     /// If so, the pointer is an instruction in the block where scanning can
     58     /// start from, saving some work.
     59     ///
     60     /// In a default-constructed MemDepResult object, the type will be Invalid
     61     /// and the instruction pointer will be null.
     62     Invalid = 0,
     63 
     64     /// This is a dependence on the specified instruction which clobbers the
     65     /// desired value.  The pointer member of the MemDepResult pair holds the
     66     /// instruction that clobbers the memory.  For example, this occurs when we
     67     /// see a may-aliased store to the memory location we care about.
     68     ///
     69     /// There are several cases that may be interesting here:
     70     ///   1. Loads are clobbered by may-alias stores.
     71     ///   2. Loads are considered clobbered by partially-aliased loads.  The
     72     ///      client may choose to analyze deeper into these cases.
     73     Clobber,
     74 
     75     /// This is a dependence on the specified instruction which defines or
     76     /// produces the desired memory location.  The pointer member of the
     77     /// MemDepResult pair holds the instruction that defines the memory.
     78     ///
     79     /// Cases of interest:
     80     ///   1. This could be a load or store for dependence queries on
     81     ///      load/store.  The value loaded or stored is the produced value.
     82     ///      Note that the pointer operand may be different than that of the
     83     ///      queried pointer due to must aliases and phi translation. Note
     84     ///      that the def may not be the same type as the query, the pointers
     85     ///      may just be must aliases.
     86     ///   2. For loads and stores, this could be an allocation instruction. In
     87     ///      this case, the load is loading an undef value or a store is the
     88     ///      first store to (that part of) the allocation.
     89     ///   3. Dependence queries on calls return Def only when they are readonly
     90     ///      calls or memory use intrinsics with identical callees and no
     91     ///      intervening clobbers.  No validation is done that the operands to
     92     ///      the calls are the same.
     93     Def,
     94 
     95     /// This marker indicates that the query has no known dependency in the
     96     /// specified block.
     97     ///
     98     /// More detailed state info is encoded in the upper part of the pair (i.e.
     99     /// the Instruction*)
    100     Other
    101   };
    102 
    103   /// If DepType is "Other", the upper part of the sum type is an encoding of
    104   /// the following more detailed type information.
    105   enum OtherType {
    106     /// This marker indicates that the query has no dependency in the specified
    107     /// block.
    108     ///
    109     /// To find out more, the client should query other predecessor blocks.
    110     NonLocal = 1,
    111     /// This marker indicates that the query has no dependency in the specified
    112     /// function.
    113     NonFuncLocal,
    114     /// This marker indicates that the query dependency is unknown.
    115     Unknown
    116   };
    117 
    118   using ValueTy = PointerSumType<
    119       DepType, PointerSumTypeMember<Invalid, Instruction *>,
    120       PointerSumTypeMember<Clobber, Instruction *>,
    121       PointerSumTypeMember<Def, Instruction *>,
    122       PointerSumTypeMember<Other, PointerEmbeddedInt<OtherType, 3>>>;
    123   ValueTy Value;
    124 
    125   explicit MemDepResult(ValueTy V) : Value(V) {}
    126 
    127 public:
    128   MemDepResult() = default;
    129 
    130   /// get methods: These are static ctor methods for creating various
    131   /// MemDepResult kinds.
    132   static MemDepResult getDef(Instruction *Inst) {
    133     assert(Inst && "Def requires inst");
    134     return MemDepResult(ValueTy::create<Def>(Inst));
    135   }
    136   static MemDepResult getClobber(Instruction *Inst) {
    137     assert(Inst && "Clobber requires inst");
    138     return MemDepResult(ValueTy::create<Clobber>(Inst));
    139   }
    140   static MemDepResult getNonLocal() {
    141     return MemDepResult(ValueTy::create<Other>(NonLocal));
    142   }
    143   static MemDepResult getNonFuncLocal() {
    144     return MemDepResult(ValueTy::create<Other>(NonFuncLocal));
    145   }
    146   static MemDepResult getUnknown() {
    147     return MemDepResult(ValueTy::create<Other>(Unknown));
    148   }
    149 
    150   /// Tests if this MemDepResult represents a query that is an instruction
    151   /// clobber dependency.
    152   bool isClobber() const { return Value.is<Clobber>(); }
    153 
    154   /// Tests if this MemDepResult represents a query that is an instruction
    155   /// definition dependency.
    156   bool isDef() const { return Value.is<Def>(); }
    157 
    158   /// Tests if this MemDepResult represents a query that is transparent to the
    159   /// start of the block, but where a non-local hasn't been done.
    160   bool isNonLocal() const {
    161     return Value.is<Other>() && Value.cast<Other>() == NonLocal;
    162   }
    163 
    164   /// Tests if this MemDepResult represents a query that is transparent to the
    165   /// start of the function.
    166   bool isNonFuncLocal() const {
    167     return Value.is<Other>() && Value.cast<Other>() == NonFuncLocal;
    168   }
    169 
    170   /// Tests if this MemDepResult represents a query which cannot and/or will
    171   /// not be computed.
    172   bool isUnknown() const {
    173     return Value.is<Other>() && Value.cast<Other>() == Unknown;
    174   }
    175 
    176   /// If this is a normal dependency, returns the instruction that is depended
    177   /// on.  Otherwise, returns null.
    178   Instruction *getInst() const {
    179     switch (Value.getTag()) {
    180     case Invalid:
    181       return Value.cast<Invalid>();
    182     case Clobber:
    183       return Value.cast<Clobber>();
    184     case Def:
    185       return Value.cast<Def>();
    186     case Other:
    187       return nullptr;
    188     }
    189     llvm_unreachable("Unknown discriminant!");
    190   }
    191 
    192   bool operator==(const MemDepResult &M) const { return Value == M.Value; }
    193   bool operator!=(const MemDepResult &M) const { return Value != M.Value; }
    194   bool operator<(const MemDepResult &M) const { return Value < M.Value; }
    195   bool operator>(const MemDepResult &M) const { return Value > M.Value; }
    196 
    197 private:
    198   friend class MemoryDependenceResults;
    199 
    200   /// Tests if this is a MemDepResult in its dirty/invalid. state.
    201   bool isDirty() const { return Value.is<Invalid>(); }
    202 
    203   static MemDepResult getDirty(Instruction *Inst) {
    204     return MemDepResult(ValueTy::create<Invalid>(Inst));
    205   }
    206 };
    207 
    208 /// This is an entry in the NonLocalDepInfo cache.
    209 ///
    210 /// For each BasicBlock (the BB entry) it keeps a MemDepResult.
    211 class NonLocalDepEntry {
    212   BasicBlock *BB;
    213   MemDepResult Result;
    214 
    215 public:
    216   NonLocalDepEntry(BasicBlock *bb, MemDepResult result)
    217       : BB(bb), Result(result) {}
    218 
    219   // This is used for searches.
    220   NonLocalDepEntry(BasicBlock *bb) : BB(bb) {}
    221 
    222   // BB is the sort key, it can't be changed.
    223   BasicBlock *getBB() const { return BB; }
    224 
    225   void setResult(const MemDepResult &R) { Result = R; }
    226 
    227   const MemDepResult &getResult() const { return Result; }
    228 
    229   bool operator<(const NonLocalDepEntry &RHS) const { return BB < RHS.BB; }
    230 };
    231 
    232 /// This is a result from a NonLocal dependence query.
    233 ///
    234 /// For each BasicBlock (the BB entry) it keeps a MemDepResult and the
    235 /// (potentially phi translated) address that was live in the block.
    236 class NonLocalDepResult {
    237   NonLocalDepEntry Entry;
    238   Value *Address;
    239 
    240 public:
    241   NonLocalDepResult(BasicBlock *bb, MemDepResult result, Value *address)
    242       : Entry(bb, result), Address(address) {}
    243 
    244   // BB is the sort key, it can't be changed.
    245   BasicBlock *getBB() const { return Entry.getBB(); }
    246 
    247   void setResult(const MemDepResult &R, Value *Addr) {
    248     Entry.setResult(R);
    249     Address = Addr;
    250   }
    251 
    252   const MemDepResult &getResult() const { return Entry.getResult(); }
    253 
    254   /// Returns the address of this pointer in this block.
    255   ///
    256   /// This can be different than the address queried for the non-local result
    257   /// because of phi translation.  This returns null if the address was not
    258   /// available in a block (i.e. because phi translation failed) or if this is
    259   /// a cached result and that address was deleted.
    260   ///
    261   /// The address is always null for a non-local 'call' dependence.
    262   Value *getAddress() const { return Address; }
    263 };
    264 
    265 /// Provides a lazy, caching interface for making common memory aliasing
    266 /// information queries, backed by LLVM's alias analysis passes.
    267 ///
    268 /// The dependency information returned is somewhat unusual, but is pragmatic.
    269 /// If queried about a store or call that might modify memory, the analysis
    270 /// will return the instruction[s] that may either load from that memory or
    271 /// store to it.  If queried with a load or call that can never modify memory,
    272 /// the analysis will return calls and stores that might modify the pointer,
    273 /// but generally does not return loads unless a) they are volatile, or
    274 /// b) they load from *must-aliased* pointers.  Returning a dependence on
    275 /// must-alias'd pointers instead of all pointers interacts well with the
    276 /// internal caching mechanism.
    277 class MemoryDependenceResults {
    278   // A map from instructions to their dependency.
    279   using LocalDepMapType = DenseMap<Instruction *, MemDepResult>;
    280   LocalDepMapType LocalDeps;
    281 
    282 public:
    283   using NonLocalDepInfo = std::vector<NonLocalDepEntry>;
    284 
    285 private:
    286   /// A pair<Value*, bool> where the bool is true if the dependence is a read
    287   /// only dependence, false if read/write.
    288   using ValueIsLoadPair = PointerIntPair<const Value *, 1, bool>;
    289 
    290   /// This pair is used when caching information for a block.
    291   ///
    292   /// If the pointer is null, the cache value is not a full query that starts
    293   /// at the specified block.  If non-null, the bool indicates whether or not
    294   /// the contents of the block was skipped.
    295   using BBSkipFirstBlockPair = PointerIntPair<BasicBlock *, 1, bool>;
    296 
    297   /// This record is the information kept for each (value, is load) pair.
    298   struct NonLocalPointerInfo {
    299     /// The pair of the block and the skip-first-block flag.
    300     BBSkipFirstBlockPair Pair;
    301     /// The results of the query for each relevant block.
    302     NonLocalDepInfo NonLocalDeps;
    303     /// The maximum size of the dereferences of the pointer.
    304     ///
    305     /// May be UnknownSize if the sizes are unknown.
    306     LocationSize Size = LocationSize::afterPointer();
    307     /// The AA tags associated with dereferences of the pointer.
    308     ///
    309     /// The members may be null if there are no tags or conflicting tags.
    310     AAMDNodes AATags;
    311 
    312     NonLocalPointerInfo() = default;
    313   };
    314 
    315   /// Cache storing single nonlocal def for the instruction.
    316   /// It is set when nonlocal def would be found in function returning only
    317   /// local dependencies.
    318   DenseMap<AssertingVH<const Value>, NonLocalDepResult> NonLocalDefsCache;
    319   using ReverseNonLocalDefsCacheTy =
    320     DenseMap<Instruction *, SmallPtrSet<const Value*, 4>>;
    321   ReverseNonLocalDefsCacheTy ReverseNonLocalDefsCache;
    322 
    323   /// This map stores the cached results of doing a pointer lookup at the
    324   /// bottom of a block.
    325   ///
    326   /// The key of this map is the pointer+isload bit, the value is a list of
    327   /// <bb->result> mappings.
    328   using CachedNonLocalPointerInfo =
    329       DenseMap<ValueIsLoadPair, NonLocalPointerInfo>;
    330   CachedNonLocalPointerInfo NonLocalPointerDeps;
    331 
    332   // A map from instructions to their non-local pointer dependencies.
    333   using ReverseNonLocalPtrDepTy =
    334       DenseMap<Instruction *, SmallPtrSet<ValueIsLoadPair, 4>>;
    335   ReverseNonLocalPtrDepTy ReverseNonLocalPtrDeps;
    336 
    337   /// This is the instruction we keep for each cached access that we have for
    338   /// an instruction.
    339   ///
    340   /// The pointer is an owning pointer and the bool indicates whether we have
    341   /// any dirty bits in the set.
    342   using PerInstNLInfo = std::pair<NonLocalDepInfo, bool>;
    343 
    344   // A map from instructions to their non-local dependencies.
    345   using NonLocalDepMapType = DenseMap<Instruction *, PerInstNLInfo>;
    346 
    347   NonLocalDepMapType NonLocalDeps;
    348 
    349   // A reverse mapping from dependencies to the dependees.  This is
    350   // used when removing instructions to keep the cache coherent.
    351   using ReverseDepMapType =
    352       DenseMap<Instruction *, SmallPtrSet<Instruction *, 4>>;
    353   ReverseDepMapType ReverseLocalDeps;
    354 
    355   // A reverse mapping from dependencies to the non-local dependees.
    356   ReverseDepMapType ReverseNonLocalDeps;
    357 
    358   /// Current AA implementation, just a cache.
    359   AAResults &AA;
    360   AssumptionCache &AC;
    361   const TargetLibraryInfo &TLI;
    362   DominatorTree &DT;
    363   PhiValues &PV;
    364   PredIteratorCache PredCache;
    365 
    366   unsigned DefaultBlockScanLimit;
    367 
    368   /// Offsets to dependant clobber loads.
    369   using ClobberOffsetsMapType = DenseMap<LoadInst *, int32_t>;
    370   ClobberOffsetsMapType ClobberOffsets;
    371 
    372 public:
    373   MemoryDependenceResults(AAResults &AA, AssumptionCache &AC,
    374                           const TargetLibraryInfo &TLI, DominatorTree &DT,
    375                           PhiValues &PV, unsigned DefaultBlockScanLimit)
    376       : AA(AA), AC(AC), TLI(TLI), DT(DT), PV(PV),
    377         DefaultBlockScanLimit(DefaultBlockScanLimit) {}
    378 
    379   /// Handle invalidation in the new PM.
    380   bool invalidate(Function &F, const PreservedAnalyses &PA,
    381                   FunctionAnalysisManager::Invalidator &Inv);
    382 
    383   /// Some methods limit the number of instructions they will examine.
    384   /// The return value of this method is the default limit that will be
    385   /// used if no limit is explicitly passed in.
    386   unsigned getDefaultBlockScanLimit() const;
    387 
    388   /// Returns the instruction on which a memory operation depends.
    389   ///
    390   /// See the class comment for more details. It is illegal to call this on
    391   /// non-memory instructions.
    392   MemDepResult getDependency(Instruction *QueryInst);
    393 
    394   /// Perform a full dependency query for the specified call, returning the set
    395   /// of blocks that the value is potentially live across.
    396   ///
    397   /// The returned set of results will include a "NonLocal" result for all
    398   /// blocks where the value is live across.
    399   ///
    400   /// This method assumes the instruction returns a "NonLocal" dependency
    401   /// within its own block.
    402   ///
    403   /// This returns a reference to an internal data structure that may be
    404   /// invalidated on the next non-local query or when an instruction is
    405   /// removed.  Clients must copy this data if they want it around longer than
    406   /// that.
    407   const NonLocalDepInfo &getNonLocalCallDependency(CallBase *QueryCall);
    408 
    409   /// Perform a full dependency query for an access to the QueryInst's
    410   /// specified memory location, returning the set of instructions that either
    411   /// define or clobber the value.
    412   ///
    413   /// Warning: For a volatile query instruction, the dependencies will be
    414   /// accurate, and thus usable for reordering, but it is never legal to
    415   /// remove the query instruction.
    416   ///
    417   /// This method assumes the pointer has a "NonLocal" dependency within
    418   /// QueryInst's parent basic block.
    419   void getNonLocalPointerDependency(Instruction *QueryInst,
    420                                     SmallVectorImpl<NonLocalDepResult> &Result);
    421 
    422   /// Removes an instruction from the dependence analysis, updating the
    423   /// dependence of instructions that previously depended on it.
    424   void removeInstruction(Instruction *InstToRemove);
    425 
    426   /// Invalidates cached information about the specified pointer, because it
    427   /// may be too conservative in memdep.
    428   ///
    429   /// This is an optional call that can be used when the client detects an
    430   /// equivalence between the pointer and some other value and replaces the
    431   /// other value with ptr. This can make Ptr available in more places that
    432   /// cached info does not necessarily keep.
    433   void invalidateCachedPointerInfo(Value *Ptr);
    434 
    435   /// Clears the PredIteratorCache info.
    436   ///
    437   /// This needs to be done when the CFG changes, e.g., due to splitting
    438   /// critical edges.
    439   void invalidateCachedPredecessors();
    440 
    441   /// Returns the instruction on which a memory location depends.
    442   ///
    443   /// If isLoad is true, this routine ignores may-aliases with read-only
    444   /// operations.  If isLoad is false, this routine ignores may-aliases
    445   /// with reads from read-only locations. If possible, pass the query
    446   /// instruction as well; this function may take advantage of the metadata
    447   /// annotated to the query instruction to refine the result. \p Limit
    448   /// can be used to set the maximum number of instructions that will be
    449   /// examined to find the pointer dependency. On return, it will be set to
    450   /// the number of instructions left to examine. If a null pointer is passed
    451   /// in, the limit will default to the value of -memdep-block-scan-limit.
    452   ///
    453   /// Note that this is an uncached query, and thus may be inefficient.
    454   MemDepResult getPointerDependencyFrom(const MemoryLocation &Loc, bool isLoad,
    455                                         BasicBlock::iterator ScanIt,
    456                                         BasicBlock *BB,
    457                                         Instruction *QueryInst = nullptr,
    458                                         unsigned *Limit = nullptr);
    459 
    460   MemDepResult getPointerDependencyFrom(const MemoryLocation &Loc, bool isLoad,
    461                                         BasicBlock::iterator ScanIt,
    462                                         BasicBlock *BB,
    463                                         Instruction *QueryInst,
    464                                         unsigned *Limit,
    465                                         BatchAAResults &BatchAA);
    466 
    467   MemDepResult
    468   getSimplePointerDependencyFrom(const MemoryLocation &MemLoc, bool isLoad,
    469                                  BasicBlock::iterator ScanIt, BasicBlock *BB,
    470                                  Instruction *QueryInst, unsigned *Limit,
    471                                  BatchAAResults &BatchAA);
    472 
    473   /// This analysis looks for other loads and stores with invariant.group
    474   /// metadata and the same pointer operand. Returns Unknown if it does not
    475   /// find anything, and Def if it can be assumed that 2 instructions load or
    476   /// store the same value and NonLocal which indicate that non-local Def was
    477   /// found, which can be retrieved by calling getNonLocalPointerDependency
    478   /// with the same queried instruction.
    479   MemDepResult getInvariantGroupPointerDependency(LoadInst *LI, BasicBlock *BB);
    480 
    481   /// Release memory in caches.
    482   void releaseMemory();
    483 
    484   /// Return the clobber offset to dependent instruction.
    485   Optional<int32_t> getClobberOffset(LoadInst *DepInst) const {
    486     const auto Off = ClobberOffsets.find(DepInst);
    487     if (Off != ClobberOffsets.end())
    488       return Off->getSecond();
    489     return None;
    490   }
    491 
    492 private:
    493   MemDepResult getCallDependencyFrom(CallBase *Call, bool isReadOnlyCall,
    494                                      BasicBlock::iterator ScanIt,
    495                                      BasicBlock *BB);
    496   bool getNonLocalPointerDepFromBB(Instruction *QueryInst,
    497                                    const PHITransAddr &Pointer,
    498                                    const MemoryLocation &Loc, bool isLoad,
    499                                    BasicBlock *BB,
    500                                    SmallVectorImpl<NonLocalDepResult> &Result,
    501                                    DenseMap<BasicBlock *, Value *> &Visited,
    502                                    bool SkipFirstBlock = false,
    503                                    bool IsIncomplete = false);
    504   MemDepResult GetNonLocalInfoForBlock(Instruction *QueryInst,
    505                                        const MemoryLocation &Loc, bool isLoad,
    506                                        BasicBlock *BB, NonLocalDepInfo *Cache,
    507                                        unsigned NumSortedEntries,
    508                                        BatchAAResults &BatchAA);
    509 
    510   void RemoveCachedNonLocalPointerDependencies(ValueIsLoadPair P);
    511 
    512   void verifyRemoved(Instruction *Inst) const;
    513 };
    514 
    515 /// An analysis that produces \c MemoryDependenceResults for a function.
    516 ///
    517 /// This is essentially a no-op because the results are computed entirely
    518 /// lazily.
    519 class MemoryDependenceAnalysis
    520     : public AnalysisInfoMixin<MemoryDependenceAnalysis> {
    521   friend AnalysisInfoMixin<MemoryDependenceAnalysis>;
    522 
    523   static AnalysisKey Key;
    524 
    525   unsigned DefaultBlockScanLimit;
    526 
    527 public:
    528   using Result = MemoryDependenceResults;
    529 
    530   MemoryDependenceAnalysis();
    531   MemoryDependenceAnalysis(unsigned DefaultBlockScanLimit) : DefaultBlockScanLimit(DefaultBlockScanLimit) { }
    532 
    533   MemoryDependenceResults run(Function &F, FunctionAnalysisManager &AM);
    534 };
    535 
    536 /// A wrapper analysis pass for the legacy pass manager that exposes a \c
    537 /// MemoryDepnedenceResults instance.
    538 class MemoryDependenceWrapperPass : public FunctionPass {
    539   Optional<MemoryDependenceResults> MemDep;
    540 
    541 public:
    542   static char ID;
    543 
    544   MemoryDependenceWrapperPass();
    545   ~MemoryDependenceWrapperPass() override;
    546 
    547   /// Pass Implementation stuff.  This doesn't do any analysis eagerly.
    548   bool runOnFunction(Function &) override;
    549 
    550   /// Clean up memory in between runs
    551   void releaseMemory() override;
    552 
    553   /// Does not modify anything.  It uses Value Numbering and Alias Analysis.
    554   void getAnalysisUsage(AnalysisUsage &AU) const override;
    555 
    556   MemoryDependenceResults &getMemDep() { return *MemDep; }
    557 };
    558 
    559 } // end namespace llvm
    560 
    561 #endif // LLVM_ANALYSIS_MEMORYDEPENDENCEANALYSIS_H
    562