Home | History | Annotate | Line # | Download | only in Analysis
      1 //===- MemoryLocation.h - Memory location descriptions ----------*- C++ -*-===//
      2 //
      3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
      4 // See https://llvm.org/LICENSE.txt for license information.
      5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
      6 //
      7 //===----------------------------------------------------------------------===//
      8 /// \file
      9 /// This file provides utility analysis objects describing memory locations.
     10 /// These are used both by the Alias Analysis infrastructure and more
     11 /// specialized memory analysis layers.
     12 ///
     13 //===----------------------------------------------------------------------===//
     14 
     15 #ifndef LLVM_ANALYSIS_MEMORYLOCATION_H
     16 #define LLVM_ANALYSIS_MEMORYLOCATION_H
     17 
     18 #include "llvm/ADT/DenseMapInfo.h"
     19 #include "llvm/ADT/Optional.h"
     20 #include "llvm/IR/Metadata.h"
     21 #include "llvm/Support/TypeSize.h"
     22 
     23 namespace llvm {
     24 
     25 class CallBase;
     26 class Instruction;
     27 class LoadInst;
     28 class StoreInst;
     29 class MemTransferInst;
     30 class MemIntrinsic;
     31 class AtomicCmpXchgInst;
     32 class AtomicMemTransferInst;
     33 class AtomicMemIntrinsic;
     34 class AtomicRMWInst;
     35 class AnyMemTransferInst;
     36 class AnyMemIntrinsic;
     37 class TargetLibraryInfo;
     38 class VAArgInst;
     39 
     40 // Represents the size of a MemoryLocation. Logically, it's an
     41 // Optional<uint63_t> that also carries a bit to represent whether the integer
     42 // it contains, N, is 'precise'. Precise, in this context, means that we know
     43 // that the area of storage referenced by the given MemoryLocation must be
     44 // precisely N bytes. An imprecise value is formed as the union of two or more
     45 // precise values, and can conservatively represent all of the values unioned
     46 // into it. Importantly, imprecise values are an *upper-bound* on the size of a
     47 // MemoryLocation.
     48 //
     49 // Concretely, a precise MemoryLocation is (%p, 4) in
     50 // store i32 0, i32* %p
     51 //
     52 // Since we know that %p must be at least 4 bytes large at this point.
     53 // Otherwise, we have UB. An example of an imprecise MemoryLocation is (%p, 4)
     54 // at the memcpy in
     55 //
     56 //   %n = select i1 %foo, i64 1, i64 4
     57 //   call void @llvm.memcpy.p0i8.p0i8.i64(i8* %p, i8* %baz, i64 %n, i32 1,
     58 //                                        i1 false)
     59 //
     60 // ...Since we'll copy *up to* 4 bytes into %p, but we can't guarantee that
     61 // we'll ever actually do so.
     62 //
     63 // If asked to represent a pathologically large value, this will degrade to
     64 // None.
     65 class LocationSize {
     66   enum : uint64_t {
     67     BeforeOrAfterPointer = ~uint64_t(0),
     68     AfterPointer = BeforeOrAfterPointer - 1,
     69     MapEmpty = BeforeOrAfterPointer - 2,
     70     MapTombstone = BeforeOrAfterPointer - 3,
     71     ImpreciseBit = uint64_t(1) << 63,
     72 
     73     // The maximum value we can represent without falling back to 'unknown'.
     74     MaxValue = (MapTombstone - 1) & ~ImpreciseBit,
     75   };
     76 
     77   uint64_t Value;
     78 
     79   // Hack to support implicit construction. This should disappear when the
     80   // public LocationSize ctor goes away.
     81   enum DirectConstruction { Direct };
     82 
     83   constexpr LocationSize(uint64_t Raw, DirectConstruction): Value(Raw) {}
     84 
     85   static_assert(AfterPointer & ImpreciseBit,
     86                 "AfterPointer is imprecise by definition.");
     87   static_assert(BeforeOrAfterPointer & ImpreciseBit,
     88                 "BeforeOrAfterPointer is imprecise by definition.");
     89 
     90 public:
     91   // FIXME: Migrate all users to construct via either `precise` or `upperBound`,
     92   // to make it more obvious at the callsite the kind of size that they're
     93   // providing.
     94   //
     95   // Since the overwhelming majority of users of this provide precise values,
     96   // this assumes the provided value is precise.
     97   constexpr LocationSize(uint64_t Raw)
     98       : Value(Raw > MaxValue ? AfterPointer : Raw) {}
     99 
    100   static LocationSize precise(uint64_t Value) { return LocationSize(Value); }
    101   static LocationSize precise(TypeSize Value) {
    102     if (Value.isScalable())
    103       return afterPointer();
    104     return precise(Value.getFixedSize());
    105   }
    106 
    107   static LocationSize upperBound(uint64_t Value) {
    108     // You can't go lower than 0, so give a precise result.
    109     if (LLVM_UNLIKELY(Value == 0))
    110       return precise(0);
    111     if (LLVM_UNLIKELY(Value > MaxValue))
    112       return afterPointer();
    113     return LocationSize(Value | ImpreciseBit, Direct);
    114   }
    115   static LocationSize upperBound(TypeSize Value) {
    116     if (Value.isScalable())
    117       return afterPointer();
    118     return upperBound(Value.getFixedSize());
    119   }
    120 
    121   /// Any location after the base pointer (but still within the underlying
    122   /// object).
    123   constexpr static LocationSize afterPointer() {
    124     return LocationSize(AfterPointer, Direct);
    125   }
    126 
    127   /// Any location before or after the base pointer (but still within the
    128   /// underlying object).
    129   constexpr static LocationSize beforeOrAfterPointer() {
    130     return LocationSize(BeforeOrAfterPointer, Direct);
    131   }
    132 
    133   // Sentinel values, generally used for maps.
    134   constexpr static LocationSize mapTombstone() {
    135     return LocationSize(MapTombstone, Direct);
    136   }
    137   constexpr static LocationSize mapEmpty() {
    138     return LocationSize(MapEmpty, Direct);
    139   }
    140 
    141   // Returns a LocationSize that can correctly represent either `*this` or
    142   // `Other`.
    143   LocationSize unionWith(LocationSize Other) const {
    144     if (Other == *this)
    145       return *this;
    146 
    147     if (Value == BeforeOrAfterPointer || Other.Value == BeforeOrAfterPointer)
    148       return beforeOrAfterPointer();
    149     if (Value == AfterPointer || Other.Value == AfterPointer)
    150       return afterPointer();
    151 
    152     return upperBound(std::max(getValue(), Other.getValue()));
    153   }
    154 
    155   bool hasValue() const {
    156     return Value != AfterPointer && Value != BeforeOrAfterPointer;
    157   }
    158   uint64_t getValue() const {
    159     assert(hasValue() && "Getting value from an unknown LocationSize!");
    160     return Value & ~ImpreciseBit;
    161   }
    162 
    163   // Returns whether or not this value is precise. Note that if a value is
    164   // precise, it's guaranteed to not be unknown.
    165   bool isPrecise() const {
    166     return (Value & ImpreciseBit) == 0;
    167   }
    168 
    169   // Convenience method to check if this LocationSize's value is 0.
    170   bool isZero() const { return hasValue() && getValue() == 0; }
    171 
    172   /// Whether accesses before the base pointer are possible.
    173   bool mayBeBeforePointer() const { return Value == BeforeOrAfterPointer; }
    174 
    175   bool operator==(const LocationSize &Other) const {
    176     return Value == Other.Value;
    177   }
    178 
    179   bool operator!=(const LocationSize &Other) const {
    180     return !(*this == Other);
    181   }
    182 
    183   // Ordering operators are not provided, since it's unclear if there's only one
    184   // reasonable way to compare:
    185   // - values that don't exist against values that do, and
    186   // - precise values to imprecise values
    187 
    188   void print(raw_ostream &OS) const;
    189 
    190   // Returns an opaque value that represents this LocationSize. Cannot be
    191   // reliably converted back into a LocationSize.
    192   uint64_t toRaw() const { return Value; }
    193 };
    194 
    195 inline raw_ostream &operator<<(raw_ostream &OS, LocationSize Size) {
    196   Size.print(OS);
    197   return OS;
    198 }
    199 
    200 /// Representation for a specific memory location.
    201 ///
    202 /// This abstraction can be used to represent a specific location in memory.
    203 /// The goal of the location is to represent enough information to describe
    204 /// abstract aliasing, modification, and reference behaviors of whatever
    205 /// value(s) are stored in memory at the particular location.
    206 ///
    207 /// The primary user of this interface is LLVM's Alias Analysis, but other
    208 /// memory analyses such as MemoryDependence can use it as well.
    209 class MemoryLocation {
    210 public:
    211   /// UnknownSize - This is a special value which can be used with the
    212   /// size arguments in alias queries to indicate that the caller does not
    213   /// know the sizes of the potential memory references.
    214   enum : uint64_t { UnknownSize = ~UINT64_C(0) };
    215 
    216   /// The address of the start of the location.
    217   const Value *Ptr;
    218 
    219   /// The maximum size of the location, in address-units, or
    220   /// UnknownSize if the size is not known.
    221   ///
    222   /// Note that an unknown size does not mean the pointer aliases the entire
    223   /// virtual address space, because there are restrictions on stepping out of
    224   /// one object and into another. See
    225   /// http://llvm.org/docs/LangRef.html#pointeraliasing
    226   LocationSize Size;
    227 
    228   /// The metadata nodes which describes the aliasing of the location (each
    229   /// member is null if that kind of information is unavailable).
    230   AAMDNodes AATags;
    231 
    232   void print(raw_ostream &OS) const { OS << *Ptr << " " << Size << "\n"; }
    233 
    234   /// Return a location with information about the memory reference by the given
    235   /// instruction.
    236   static MemoryLocation get(const LoadInst *LI);
    237   static MemoryLocation get(const StoreInst *SI);
    238   static MemoryLocation get(const VAArgInst *VI);
    239   static MemoryLocation get(const AtomicCmpXchgInst *CXI);
    240   static MemoryLocation get(const AtomicRMWInst *RMWI);
    241   static MemoryLocation get(const Instruction *Inst) {
    242     return *MemoryLocation::getOrNone(Inst);
    243   }
    244   static Optional<MemoryLocation> getOrNone(const Instruction *Inst);
    245 
    246   /// Return a location representing the source of a memory transfer.
    247   static MemoryLocation getForSource(const MemTransferInst *MTI);
    248   static MemoryLocation getForSource(const AtomicMemTransferInst *MTI);
    249   static MemoryLocation getForSource(const AnyMemTransferInst *MTI);
    250 
    251   /// Return a location representing the destination of a memory set or
    252   /// transfer.
    253   static MemoryLocation getForDest(const MemIntrinsic *MI);
    254   static MemoryLocation getForDest(const AtomicMemIntrinsic *MI);
    255   static MemoryLocation getForDest(const AnyMemIntrinsic *MI);
    256 
    257   /// Return a location representing a particular argument of a call.
    258   static MemoryLocation getForArgument(const CallBase *Call, unsigned ArgIdx,
    259                                        const TargetLibraryInfo *TLI);
    260   static MemoryLocation getForArgument(const CallBase *Call, unsigned ArgIdx,
    261                                        const TargetLibraryInfo &TLI) {
    262     return getForArgument(Call, ArgIdx, &TLI);
    263   }
    264 
    265   /// Return a location that may access any location after Ptr, while remaining
    266   /// within the underlying object.
    267   static MemoryLocation getAfter(const Value *Ptr,
    268                                  const AAMDNodes &AATags = AAMDNodes()) {
    269     return MemoryLocation(Ptr, LocationSize::afterPointer(), AATags);
    270   }
    271 
    272   /// Return a location that may access any location before or after Ptr, while
    273   /// remaining within the underlying object.
    274   static MemoryLocation
    275   getBeforeOrAfter(const Value *Ptr, const AAMDNodes &AATags = AAMDNodes()) {
    276     return MemoryLocation(Ptr, LocationSize::beforeOrAfterPointer(), AATags);
    277   }
    278 
    279   // Return the exact size if the exact size is known at compiletime,
    280   // otherwise return MemoryLocation::UnknownSize.
    281   static uint64_t getSizeOrUnknown(const TypeSize &T) {
    282     return T.isScalable() ? UnknownSize : T.getFixedSize();
    283   }
    284 
    285   MemoryLocation()
    286       : Ptr(nullptr), Size(LocationSize::beforeOrAfterPointer()), AATags() {}
    287 
    288   explicit MemoryLocation(const Value *Ptr, LocationSize Size,
    289                           const AAMDNodes &AATags = AAMDNodes())
    290       : Ptr(Ptr), Size(Size), AATags(AATags) {}
    291 
    292   MemoryLocation getWithNewPtr(const Value *NewPtr) const {
    293     MemoryLocation Copy(*this);
    294     Copy.Ptr = NewPtr;
    295     return Copy;
    296   }
    297 
    298   MemoryLocation getWithNewSize(LocationSize NewSize) const {
    299     MemoryLocation Copy(*this);
    300     Copy.Size = NewSize;
    301     return Copy;
    302   }
    303 
    304   MemoryLocation getWithoutAATags() const {
    305     MemoryLocation Copy(*this);
    306     Copy.AATags = AAMDNodes();
    307     return Copy;
    308   }
    309 
    310   bool operator==(const MemoryLocation &Other) const {
    311     return Ptr == Other.Ptr && Size == Other.Size && AATags == Other.AATags;
    312   }
    313 };
    314 
    315 // Specialize DenseMapInfo.
    316 template <> struct DenseMapInfo<LocationSize> {
    317   static inline LocationSize getEmptyKey() {
    318     return LocationSize::mapEmpty();
    319   }
    320   static inline LocationSize getTombstoneKey() {
    321     return LocationSize::mapTombstone();
    322   }
    323   static unsigned getHashValue(const LocationSize &Val) {
    324     return DenseMapInfo<uint64_t>::getHashValue(Val.toRaw());
    325   }
    326   static bool isEqual(const LocationSize &LHS, const LocationSize &RHS) {
    327     return LHS == RHS;
    328   }
    329 };
    330 
    331 template <> struct DenseMapInfo<MemoryLocation> {
    332   static inline MemoryLocation getEmptyKey() {
    333     return MemoryLocation(DenseMapInfo<const Value *>::getEmptyKey(),
    334                           DenseMapInfo<LocationSize>::getEmptyKey());
    335   }
    336   static inline MemoryLocation getTombstoneKey() {
    337     return MemoryLocation(DenseMapInfo<const Value *>::getTombstoneKey(),
    338                           DenseMapInfo<LocationSize>::getTombstoneKey());
    339   }
    340   static unsigned getHashValue(const MemoryLocation &Val) {
    341     return DenseMapInfo<const Value *>::getHashValue(Val.Ptr) ^
    342            DenseMapInfo<LocationSize>::getHashValue(Val.Size) ^
    343            DenseMapInfo<AAMDNodes>::getHashValue(Val.AATags);
    344   }
    345   static bool isEqual(const MemoryLocation &LHS, const MemoryLocation &RHS) {
    346     return LHS == RHS;
    347   }
    348 };
    349 }
    350 
    351 #endif
    352