Home | History | Annotate | Line # | Download | only in Analysis
      1 //===- TypeBasedAliasAnalysis.cpp - Type-Based Alias Analysis -------------===//
      2 //
      3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
      4 // See https://llvm.org/LICENSE.txt for license information.
      5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
      6 //
      7 //===----------------------------------------------------------------------===//
      8 //
      9 // This file defines the TypeBasedAliasAnalysis pass, which implements
     10 // metadata-based TBAA.
     11 //
     12 // In LLVM IR, memory does not have types, so LLVM's own type system is not
     13 // suitable for doing TBAA. Instead, metadata is added to the IR to describe
     14 // a type system of a higher level language. This can be used to implement
     15 // typical C/C++ TBAA, but it can also be used to implement custom alias
     16 // analysis behavior for other languages.
     17 //
     18 // We now support two types of metadata format: scalar TBAA and struct-path
     19 // aware TBAA. After all testing cases are upgraded to use struct-path aware
     20 // TBAA and we can auto-upgrade existing bc files, the support for scalar TBAA
     21 // can be dropped.
     22 //
     23 // The scalar TBAA metadata format is very simple. TBAA MDNodes have up to
     24 // three fields, e.g.:
     25 //   !0 = !{ !"an example type tree" }
     26 //   !1 = !{ !"int", !0 }
     27 //   !2 = !{ !"float", !0 }
     28 //   !3 = !{ !"const float", !2, i64 1 }
     29 //
     30 // The first field is an identity field. It can be any value, usually
     31 // an MDString, which uniquely identifies the type. The most important
     32 // name in the tree is the name of the root node. Two trees with
     33 // different root node names are entirely disjoint, even if they
     34 // have leaves with common names.
     35 //
     36 // The second field identifies the type's parent node in the tree, or
     37 // is null or omitted for a root node. A type is considered to alias
     38 // all of its descendants and all of its ancestors in the tree. Also,
     39 // a type is considered to alias all types in other trees, so that
     40 // bitcode produced from multiple front-ends is handled conservatively.
     41 //
     42 // If the third field is present, it's an integer which if equal to 1
     43 // indicates that the type is "constant" (meaning pointsToConstantMemory
     44 // should return true; see
     45 // http://llvm.org/docs/AliasAnalysis.html#OtherItfs).
     46 //
     47 // With struct-path aware TBAA, the MDNodes attached to an instruction using
     48 // "!tbaa" are called path tag nodes.
     49 //
     50 // The path tag node has 4 fields with the last field being optional.
     51 //
     52 // The first field is the base type node, it can be a struct type node
     53 // or a scalar type node. The second field is the access type node, it
     54 // must be a scalar type node. The third field is the offset into the base type.
     55 // The last field has the same meaning as the last field of our scalar TBAA:
     56 // it's an integer which if equal to 1 indicates that the access is "constant".
     57 //
     58 // The struct type node has a name and a list of pairs, one pair for each member
     59 // of the struct. The first element of each pair is a type node (a struct type
     60 // node or a scalar type node), specifying the type of the member, the second
     61 // element of each pair is the offset of the member.
     62 //
     63 // Given an example
     64 // typedef struct {
     65 //   short s;
     66 // } A;
     67 // typedef struct {
     68 //   uint16_t s;
     69 //   A a;
     70 // } B;
     71 //
     72 // For an access to B.a.s, we attach !5 (a path tag node) to the load/store
     73 // instruction. The base type is !4 (struct B), the access type is !2 (scalar
     74 // type short) and the offset is 4.
     75 //
     76 // !0 = !{!"Simple C/C++ TBAA"}
     77 // !1 = !{!"omnipotent char", !0} // Scalar type node
     78 // !2 = !{!"short", !1}           // Scalar type node
     79 // !3 = !{!"A", !2, i64 0}        // Struct type node
     80 // !4 = !{!"B", !2, i64 0, !3, i64 4}
     81 //                                                           // Struct type node
     82 // !5 = !{!4, !2, i64 4}          // Path tag node
     83 //
     84 // The struct type nodes and the scalar type nodes form a type DAG.
     85 //         Root (!0)
     86 //         char (!1)  -- edge to Root
     87 //         short (!2) -- edge to char
     88 //         A (!3) -- edge with offset 0 to short
     89 //         B (!4) -- edge with offset 0 to short and edge with offset 4 to A
     90 //
     91 // To check if two tags (tagX and tagY) can alias, we start from the base type
     92 // of tagX, follow the edge with the correct offset in the type DAG and adjust
     93 // the offset until we reach the base type of tagY or until we reach the Root
     94 // node.
     95 // If we reach the base type of tagY, compare the adjusted offset with
     96 // offset of tagY, return Alias if the offsets are the same, return NoAlias
     97 // otherwise.
     98 // If we reach the Root node, perform the above starting from base type of tagY
     99 // to see if we reach base type of tagX.
    100 //
    101 // If they have different roots, they're part of different potentially
    102 // unrelated type systems, so we return Alias to be conservative.
    103 // If neither node is an ancestor of the other and they have the same root,
    104 // then we say NoAlias.
    105 //
    106 //===----------------------------------------------------------------------===//
    107 
    108 #include "llvm/Analysis/TypeBasedAliasAnalysis.h"
    109 #include "llvm/ADT/SetVector.h"
    110 #include "llvm/Analysis/AliasAnalysis.h"
    111 #include "llvm/Analysis/MemoryLocation.h"
    112 #include "llvm/IR/Constants.h"
    113 #include "llvm/IR/DerivedTypes.h"
    114 #include "llvm/IR/InstrTypes.h"
    115 #include "llvm/IR/Instruction.h"
    116 #include "llvm/IR/LLVMContext.h"
    117 #include "llvm/IR/Metadata.h"
    118 #include "llvm/InitializePasses.h"
    119 #include "llvm/Pass.h"
    120 #include "llvm/Support/Casting.h"
    121 #include "llvm/Support/CommandLine.h"
    122 #include "llvm/Support/ErrorHandling.h"
    123 #include <cassert>
    124 #include <cstdint>
    125 
    126 using namespace llvm;
    127 
    128 // A handy option for disabling TBAA functionality. The same effect can also be
    129 // achieved by stripping the !tbaa tags from IR, but this option is sometimes
    130 // more convenient.
    131 static cl::opt<bool> EnableTBAA("enable-tbaa", cl::init(true), cl::Hidden);
    132 
    133 namespace {
    134 
    135 /// isNewFormatTypeNode - Return true iff the given type node is in the new
    136 /// size-aware format.
    137 static bool isNewFormatTypeNode(const MDNode *N) {
    138   if (N->getNumOperands() < 3)
    139     return false;
    140   // In the old format the first operand is a string.
    141   if (!isa<MDNode>(N->getOperand(0)))
    142     return false;
    143   return true;
    144 }
    145 
    146 /// This is a simple wrapper around an MDNode which provides a higher-level
    147 /// interface by hiding the details of how alias analysis information is encoded
    148 /// in its operands.
    149 template<typename MDNodeTy>
    150 class TBAANodeImpl {
    151   MDNodeTy *Node = nullptr;
    152 
    153 public:
    154   TBAANodeImpl() = default;
    155   explicit TBAANodeImpl(MDNodeTy *N) : Node(N) {}
    156 
    157   /// getNode - Get the MDNode for this TBAANode.
    158   MDNodeTy *getNode() const { return Node; }
    159 
    160   /// isNewFormat - Return true iff the wrapped type node is in the new
    161   /// size-aware format.
    162   bool isNewFormat() const { return isNewFormatTypeNode(Node); }
    163 
    164   /// getParent - Get this TBAANode's Alias tree parent.
    165   TBAANodeImpl<MDNodeTy> getParent() const {
    166     if (isNewFormat())
    167       return TBAANodeImpl(cast<MDNodeTy>(Node->getOperand(0)));
    168 
    169     if (Node->getNumOperands() < 2)
    170       return TBAANodeImpl<MDNodeTy>();
    171     MDNodeTy *P = dyn_cast_or_null<MDNodeTy>(Node->getOperand(1));
    172     if (!P)
    173       return TBAANodeImpl<MDNodeTy>();
    174     // Ok, this node has a valid parent. Return it.
    175     return TBAANodeImpl<MDNodeTy>(P);
    176   }
    177 
    178   /// Test if this TBAANode represents a type for objects which are
    179   /// not modified (by any means) in the context where this
    180   /// AliasAnalysis is relevant.
    181   bool isTypeImmutable() const {
    182     if (Node->getNumOperands() < 3)
    183       return false;
    184     ConstantInt *CI = mdconst::dyn_extract<ConstantInt>(Node->getOperand(2));
    185     if (!CI)
    186       return false;
    187     return CI->getValue()[0];
    188   }
    189 };
    190 
    191 /// \name Specializations of \c TBAANodeImpl for const and non const qualified
    192 /// \c MDNode.
    193 /// @{
    194 using TBAANode = TBAANodeImpl<const MDNode>;
    195 using MutableTBAANode = TBAANodeImpl<MDNode>;
    196 /// @}
    197 
    198 /// This is a simple wrapper around an MDNode which provides a
    199 /// higher-level interface by hiding the details of how alias analysis
    200 /// information is encoded in its operands.
    201 template<typename MDNodeTy>
    202 class TBAAStructTagNodeImpl {
    203   /// This node should be created with createTBAAAccessTag().
    204   MDNodeTy *Node;
    205 
    206 public:
    207   explicit TBAAStructTagNodeImpl(MDNodeTy *N) : Node(N) {}
    208 
    209   /// Get the MDNode for this TBAAStructTagNode.
    210   MDNodeTy *getNode() const { return Node; }
    211 
    212   /// isNewFormat - Return true iff the wrapped access tag is in the new
    213   /// size-aware format.
    214   bool isNewFormat() const {
    215     if (Node->getNumOperands() < 4)
    216       return false;
    217     if (MDNodeTy *AccessType = getAccessType())
    218       if (!TBAANodeImpl<MDNodeTy>(AccessType).isNewFormat())
    219         return false;
    220     return true;
    221   }
    222 
    223   MDNodeTy *getBaseType() const {
    224     return dyn_cast_or_null<MDNode>(Node->getOperand(0));
    225   }
    226 
    227   MDNodeTy *getAccessType() const {
    228     return dyn_cast_or_null<MDNode>(Node->getOperand(1));
    229   }
    230 
    231   uint64_t getOffset() const {
    232     return mdconst::extract<ConstantInt>(Node->getOperand(2))->getZExtValue();
    233   }
    234 
    235   uint64_t getSize() const {
    236     if (!isNewFormat())
    237       return UINT64_MAX;
    238     return mdconst::extract<ConstantInt>(Node->getOperand(3))->getZExtValue();
    239   }
    240 
    241   /// Test if this TBAAStructTagNode represents a type for objects
    242   /// which are not modified (by any means) in the context where this
    243   /// AliasAnalysis is relevant.
    244   bool isTypeImmutable() const {
    245     unsigned OpNo = isNewFormat() ? 4 : 3;
    246     if (Node->getNumOperands() < OpNo + 1)
    247       return false;
    248     ConstantInt *CI = mdconst::dyn_extract<ConstantInt>(Node->getOperand(OpNo));
    249     if (!CI)
    250       return false;
    251     return CI->getValue()[0];
    252   }
    253 };
    254 
    255 /// \name Specializations of \c TBAAStructTagNodeImpl for const and non const
    256 /// qualified \c MDNods.
    257 /// @{
    258 using TBAAStructTagNode = TBAAStructTagNodeImpl<const MDNode>;
    259 using MutableTBAAStructTagNode = TBAAStructTagNodeImpl<MDNode>;
    260 /// @}
    261 
    262 /// This is a simple wrapper around an MDNode which provides a
    263 /// higher-level interface by hiding the details of how alias analysis
    264 /// information is encoded in its operands.
    265 class TBAAStructTypeNode {
    266   /// This node should be created with createTBAATypeNode().
    267   const MDNode *Node = nullptr;
    268 
    269 public:
    270   TBAAStructTypeNode() = default;
    271   explicit TBAAStructTypeNode(const MDNode *N) : Node(N) {}
    272 
    273   /// Get the MDNode for this TBAAStructTypeNode.
    274   const MDNode *getNode() const { return Node; }
    275 
    276   /// isNewFormat - Return true iff the wrapped type node is in the new
    277   /// size-aware format.
    278   bool isNewFormat() const { return isNewFormatTypeNode(Node); }
    279 
    280   bool operator==(const TBAAStructTypeNode &Other) const {
    281     return getNode() == Other.getNode();
    282   }
    283 
    284   /// getId - Return type identifier.
    285   Metadata *getId() const {
    286     return Node->getOperand(isNewFormat() ? 2 : 0);
    287   }
    288 
    289   unsigned getNumFields() const {
    290     unsigned FirstFieldOpNo = isNewFormat() ? 3 : 1;
    291     unsigned NumOpsPerField = isNewFormat() ? 3 : 2;
    292     return (getNode()->getNumOperands() - FirstFieldOpNo) / NumOpsPerField;
    293   }
    294 
    295   TBAAStructTypeNode getFieldType(unsigned FieldIndex) const {
    296     unsigned FirstFieldOpNo = isNewFormat() ? 3 : 1;
    297     unsigned NumOpsPerField = isNewFormat() ? 3 : 2;
    298     unsigned OpIndex = FirstFieldOpNo + FieldIndex * NumOpsPerField;
    299     auto *TypeNode = cast<MDNode>(getNode()->getOperand(OpIndex));
    300     return TBAAStructTypeNode(TypeNode);
    301   }
    302 
    303   /// Get this TBAAStructTypeNode's field in the type DAG with
    304   /// given offset. Update the offset to be relative to the field type.
    305   TBAAStructTypeNode getField(uint64_t &Offset) const {
    306     bool NewFormat = isNewFormat();
    307     if (NewFormat) {
    308       // New-format root and scalar type nodes have no fields.
    309       if (Node->getNumOperands() < 6)
    310         return TBAAStructTypeNode();
    311     } else {
    312       // Parent can be omitted for the root node.
    313       if (Node->getNumOperands() < 2)
    314         return TBAAStructTypeNode();
    315 
    316       // Fast path for a scalar type node and a struct type node with a single
    317       // field.
    318       if (Node->getNumOperands() <= 3) {
    319         uint64_t Cur = Node->getNumOperands() == 2
    320                            ? 0
    321                            : mdconst::extract<ConstantInt>(Node->getOperand(2))
    322                                  ->getZExtValue();
    323         Offset -= Cur;
    324         MDNode *P = dyn_cast_or_null<MDNode>(Node->getOperand(1));
    325         if (!P)
    326           return TBAAStructTypeNode();
    327         return TBAAStructTypeNode(P);
    328       }
    329     }
    330 
    331     // Assume the offsets are in order. We return the previous field if
    332     // the current offset is bigger than the given offset.
    333     unsigned FirstFieldOpNo = NewFormat ? 3 : 1;
    334     unsigned NumOpsPerField = NewFormat ? 3 : 2;
    335     unsigned TheIdx = 0;
    336     for (unsigned Idx = FirstFieldOpNo; Idx < Node->getNumOperands();
    337          Idx += NumOpsPerField) {
    338       uint64_t Cur = mdconst::extract<ConstantInt>(Node->getOperand(Idx + 1))
    339                          ->getZExtValue();
    340       if (Cur > Offset) {
    341         assert(Idx >= FirstFieldOpNo + NumOpsPerField &&
    342                "TBAAStructTypeNode::getField should have an offset match!");
    343         TheIdx = Idx - NumOpsPerField;
    344         break;
    345       }
    346     }
    347     // Move along the last field.
    348     if (TheIdx == 0)
    349       TheIdx = Node->getNumOperands() - NumOpsPerField;
    350     uint64_t Cur = mdconst::extract<ConstantInt>(Node->getOperand(TheIdx + 1))
    351                        ->getZExtValue();
    352     Offset -= Cur;
    353     MDNode *P = dyn_cast_or_null<MDNode>(Node->getOperand(TheIdx));
    354     if (!P)
    355       return TBAAStructTypeNode();
    356     return TBAAStructTypeNode(P);
    357   }
    358 };
    359 
    360 } // end anonymous namespace
    361 
    362 /// Check the first operand of the tbaa tag node, if it is a MDNode, we treat
    363 /// it as struct-path aware TBAA format, otherwise, we treat it as scalar TBAA
    364 /// format.
    365 static bool isStructPathTBAA(const MDNode *MD) {
    366   // Anonymous TBAA root starts with a MDNode and dragonegg uses it as
    367   // a TBAA tag.
    368   return isa<MDNode>(MD->getOperand(0)) && MD->getNumOperands() >= 3;
    369 }
    370 
    371 AliasResult TypeBasedAAResult::alias(const MemoryLocation &LocA,
    372                                      const MemoryLocation &LocB,
    373                                      AAQueryInfo &AAQI) {
    374   if (!EnableTBAA)
    375     return AAResultBase::alias(LocA, LocB, AAQI);
    376 
    377   // If accesses may alias, chain to the next AliasAnalysis.
    378   if (Aliases(LocA.AATags.TBAA, LocB.AATags.TBAA))
    379     return AAResultBase::alias(LocA, LocB, AAQI);
    380 
    381   // Otherwise return a definitive result.
    382   return AliasResult::NoAlias;
    383 }
    384 
    385 bool TypeBasedAAResult::pointsToConstantMemory(const MemoryLocation &Loc,
    386                                                AAQueryInfo &AAQI,
    387                                                bool OrLocal) {
    388   if (!EnableTBAA)
    389     return AAResultBase::pointsToConstantMemory(Loc, AAQI, OrLocal);
    390 
    391   const MDNode *M = Loc.AATags.TBAA;
    392   if (!M)
    393     return AAResultBase::pointsToConstantMemory(Loc, AAQI, OrLocal);
    394 
    395   // If this is an "immutable" type, we can assume the pointer is pointing
    396   // to constant memory.
    397   if ((!isStructPathTBAA(M) && TBAANode(M).isTypeImmutable()) ||
    398       (isStructPathTBAA(M) && TBAAStructTagNode(M).isTypeImmutable()))
    399     return true;
    400 
    401   return AAResultBase::pointsToConstantMemory(Loc, AAQI, OrLocal);
    402 }
    403 
    404 FunctionModRefBehavior
    405 TypeBasedAAResult::getModRefBehavior(const CallBase *Call) {
    406   if (!EnableTBAA)
    407     return AAResultBase::getModRefBehavior(Call);
    408 
    409   FunctionModRefBehavior Min = FMRB_UnknownModRefBehavior;
    410 
    411   // If this is an "immutable" type, we can assume the call doesn't write
    412   // to memory.
    413   if (const MDNode *M = Call->getMetadata(LLVMContext::MD_tbaa))
    414     if ((!isStructPathTBAA(M) && TBAANode(M).isTypeImmutable()) ||
    415         (isStructPathTBAA(M) && TBAAStructTagNode(M).isTypeImmutable()))
    416       Min = FMRB_OnlyReadsMemory;
    417 
    418   return FunctionModRefBehavior(AAResultBase::getModRefBehavior(Call) & Min);
    419 }
    420 
    421 FunctionModRefBehavior TypeBasedAAResult::getModRefBehavior(const Function *F) {
    422   // Functions don't have metadata. Just chain to the next implementation.
    423   return AAResultBase::getModRefBehavior(F);
    424 }
    425 
    426 ModRefInfo TypeBasedAAResult::getModRefInfo(const CallBase *Call,
    427                                             const MemoryLocation &Loc,
    428                                             AAQueryInfo &AAQI) {
    429   if (!EnableTBAA)
    430     return AAResultBase::getModRefInfo(Call, Loc, AAQI);
    431 
    432   if (const MDNode *L = Loc.AATags.TBAA)
    433     if (const MDNode *M = Call->getMetadata(LLVMContext::MD_tbaa))
    434       if (!Aliases(L, M))
    435         return ModRefInfo::NoModRef;
    436 
    437   return AAResultBase::getModRefInfo(Call, Loc, AAQI);
    438 }
    439 
    440 ModRefInfo TypeBasedAAResult::getModRefInfo(const CallBase *Call1,
    441                                             const CallBase *Call2,
    442                                             AAQueryInfo &AAQI) {
    443   if (!EnableTBAA)
    444     return AAResultBase::getModRefInfo(Call1, Call2, AAQI);
    445 
    446   if (const MDNode *M1 = Call1->getMetadata(LLVMContext::MD_tbaa))
    447     if (const MDNode *M2 = Call2->getMetadata(LLVMContext::MD_tbaa))
    448       if (!Aliases(M1, M2))
    449         return ModRefInfo::NoModRef;
    450 
    451   return AAResultBase::getModRefInfo(Call1, Call2, AAQI);
    452 }
    453 
    454 bool MDNode::isTBAAVtableAccess() const {
    455   if (!isStructPathTBAA(this)) {
    456     if (getNumOperands() < 1)
    457       return false;
    458     if (MDString *Tag1 = dyn_cast<MDString>(getOperand(0))) {
    459       if (Tag1->getString() == "vtable pointer")
    460         return true;
    461     }
    462     return false;
    463   }
    464 
    465   // For struct-path aware TBAA, we use the access type of the tag.
    466   TBAAStructTagNode Tag(this);
    467   TBAAStructTypeNode AccessType(Tag.getAccessType());
    468   if(auto *Id = dyn_cast<MDString>(AccessType.getId()))
    469     if (Id->getString() == "vtable pointer")
    470       return true;
    471   return false;
    472 }
    473 
    474 static bool matchAccessTags(const MDNode *A, const MDNode *B,
    475                             const MDNode **GenericTag = nullptr);
    476 
    477 MDNode *MDNode::getMostGenericTBAA(MDNode *A, MDNode *B) {
    478   const MDNode *GenericTag;
    479   matchAccessTags(A, B, &GenericTag);
    480   return const_cast<MDNode*>(GenericTag);
    481 }
    482 
    483 static const MDNode *getLeastCommonType(const MDNode *A, const MDNode *B) {
    484   if (!A || !B)
    485     return nullptr;
    486 
    487   if (A == B)
    488     return A;
    489 
    490   SmallSetVector<const MDNode *, 4> PathA;
    491   TBAANode TA(A);
    492   while (TA.getNode()) {
    493     if (PathA.count(TA.getNode()))
    494       report_fatal_error("Cycle found in TBAA metadata.");
    495     PathA.insert(TA.getNode());
    496     TA = TA.getParent();
    497   }
    498 
    499   SmallSetVector<const MDNode *, 4> PathB;
    500   TBAANode TB(B);
    501   while (TB.getNode()) {
    502     if (PathB.count(TB.getNode()))
    503       report_fatal_error("Cycle found in TBAA metadata.");
    504     PathB.insert(TB.getNode());
    505     TB = TB.getParent();
    506   }
    507 
    508   int IA = PathA.size() - 1;
    509   int IB = PathB.size() - 1;
    510 
    511   const MDNode *Ret = nullptr;
    512   while (IA >= 0 && IB >= 0) {
    513     if (PathA[IA] == PathB[IB])
    514       Ret = PathA[IA];
    515     else
    516       break;
    517     --IA;
    518     --IB;
    519   }
    520 
    521   return Ret;
    522 }
    523 
    524 void Instruction::getAAMetadata(AAMDNodes &N, bool Merge) const {
    525   if (Merge) {
    526     N.TBAA =
    527         MDNode::getMostGenericTBAA(N.TBAA, getMetadata(LLVMContext::MD_tbaa));
    528     N.TBAAStruct = nullptr;
    529     N.Scope = MDNode::getMostGenericAliasScope(
    530         N.Scope, getMetadata(LLVMContext::MD_alias_scope));
    531     N.NoAlias =
    532         MDNode::intersect(N.NoAlias, getMetadata(LLVMContext::MD_noalias));
    533   } else {
    534     N.TBAA = getMetadata(LLVMContext::MD_tbaa);
    535     N.TBAAStruct = getMetadata(LLVMContext::MD_tbaa_struct);
    536     N.Scope = getMetadata(LLVMContext::MD_alias_scope);
    537     N.NoAlias = getMetadata(LLVMContext::MD_noalias);
    538   }
    539 }
    540 
    541 static const MDNode *createAccessTag(const MDNode *AccessType) {
    542   // If there is no access type or the access type is the root node, then
    543   // we don't have any useful access tag to return.
    544   if (!AccessType || AccessType->getNumOperands() < 2)
    545     return nullptr;
    546 
    547   Type *Int64 = IntegerType::get(AccessType->getContext(), 64);
    548   auto *OffsetNode = ConstantAsMetadata::get(ConstantInt::get(Int64, 0));
    549 
    550   if (TBAAStructTypeNode(AccessType).isNewFormat()) {
    551     // TODO: Take access ranges into account when matching access tags and
    552     // fix this code to generate actual access sizes for generic tags.
    553     uint64_t AccessSize = UINT64_MAX;
    554     auto *SizeNode =
    555         ConstantAsMetadata::get(ConstantInt::get(Int64, AccessSize));
    556     Metadata *Ops[] = {const_cast<MDNode*>(AccessType),
    557                        const_cast<MDNode*>(AccessType),
    558                        OffsetNode, SizeNode};
    559     return MDNode::get(AccessType->getContext(), Ops);
    560   }
    561 
    562   Metadata *Ops[] = {const_cast<MDNode*>(AccessType),
    563                      const_cast<MDNode*>(AccessType),
    564                      OffsetNode};
    565   return MDNode::get(AccessType->getContext(), Ops);
    566 }
    567 
    568 static bool hasField(TBAAStructTypeNode BaseType,
    569                      TBAAStructTypeNode FieldType) {
    570   for (unsigned I = 0, E = BaseType.getNumFields(); I != E; ++I) {
    571     TBAAStructTypeNode T = BaseType.getFieldType(I);
    572     if (T == FieldType || hasField(T, FieldType))
    573       return true;
    574   }
    575   return false;
    576 }
    577 
    578 /// Return true if for two given accesses, one of the accessed objects may be a
    579 /// subobject of the other. The \p BaseTag and \p SubobjectTag parameters
    580 /// describe the accesses to the base object and the subobject respectively.
    581 /// \p CommonType must be the metadata node describing the common type of the
    582 /// accessed objects. On return, \p MayAlias is set to true iff these accesses
    583 /// may alias and \p Generic, if not null, points to the most generic access
    584 /// tag for the given two.
    585 static bool mayBeAccessToSubobjectOf(TBAAStructTagNode BaseTag,
    586                                      TBAAStructTagNode SubobjectTag,
    587                                      const MDNode *CommonType,
    588                                      const MDNode **GenericTag,
    589                                      bool &MayAlias) {
    590   // If the base object is of the least common type, then this may be an access
    591   // to its subobject.
    592   if (BaseTag.getAccessType() == BaseTag.getBaseType() &&
    593       BaseTag.getAccessType() == CommonType) {
    594     if (GenericTag)
    595       *GenericTag = createAccessTag(CommonType);
    596     MayAlias = true;
    597     return true;
    598   }
    599 
    600   // If the access to the base object is through a field of the subobject's
    601   // type, then this may be an access to that field. To check for that we start
    602   // from the base type, follow the edge with the correct offset in the type DAG
    603   // and adjust the offset until we reach the field type or until we reach the
    604   // access type.
    605   bool NewFormat = BaseTag.isNewFormat();
    606   TBAAStructTypeNode BaseType(BaseTag.getBaseType());
    607   uint64_t OffsetInBase = BaseTag.getOffset();
    608 
    609   for (;;) {
    610     // In the old format there is no distinction between fields and parent
    611     // types, so in this case we consider all nodes up to the root.
    612     if (!BaseType.getNode()) {
    613       assert(!NewFormat && "Did not see access type in access path!");
    614       break;
    615     }
    616 
    617     if (BaseType.getNode() == SubobjectTag.getBaseType()) {
    618       bool SameMemberAccess = OffsetInBase == SubobjectTag.getOffset();
    619       if (GenericTag) {
    620         *GenericTag = SameMemberAccess ? SubobjectTag.getNode() :
    621                                          createAccessTag(CommonType);
    622       }
    623       MayAlias = SameMemberAccess;
    624       return true;
    625     }
    626 
    627     // With new-format nodes we stop at the access type.
    628     if (NewFormat && BaseType.getNode() == BaseTag.getAccessType())
    629       break;
    630 
    631     // Follow the edge with the correct offset. Offset will be adjusted to
    632     // be relative to the field type.
    633     BaseType = BaseType.getField(OffsetInBase);
    634   }
    635 
    636   // If the base object has a direct or indirect field of the subobject's type,
    637   // then this may be an access to that field. We need this to check now that
    638   // we support aggregates as access types.
    639   if (NewFormat) {
    640     // TBAAStructTypeNode BaseAccessType(BaseTag.getAccessType());
    641     TBAAStructTypeNode FieldType(SubobjectTag.getBaseType());
    642     if (hasField(BaseType, FieldType)) {
    643       if (GenericTag)
    644         *GenericTag = createAccessTag(CommonType);
    645       MayAlias = true;
    646       return true;
    647     }
    648   }
    649 
    650   return false;
    651 }
    652 
    653 /// matchTags - Return true if the given couple of accesses are allowed to
    654 /// overlap. If \arg GenericTag is not null, then on return it points to the
    655 /// most generic access descriptor for the given two.
    656 static bool matchAccessTags(const MDNode *A, const MDNode *B,
    657                             const MDNode **GenericTag) {
    658   if (A == B) {
    659     if (GenericTag)
    660       *GenericTag = A;
    661     return true;
    662   }
    663 
    664   // Accesses with no TBAA information may alias with any other accesses.
    665   if (!A || !B) {
    666     if (GenericTag)
    667       *GenericTag = nullptr;
    668     return true;
    669   }
    670 
    671   // Verify that both input nodes are struct-path aware.  Auto-upgrade should
    672   // have taken care of this.
    673   assert(isStructPathTBAA(A) && "Access A is not struct-path aware!");
    674   assert(isStructPathTBAA(B) && "Access B is not struct-path aware!");
    675 
    676   TBAAStructTagNode TagA(A), TagB(B);
    677   const MDNode *CommonType = getLeastCommonType(TagA.getAccessType(),
    678                                                 TagB.getAccessType());
    679 
    680   // If the final access types have different roots, they're part of different
    681   // potentially unrelated type systems, so we must be conservative.
    682   if (!CommonType) {
    683     if (GenericTag)
    684       *GenericTag = nullptr;
    685     return true;
    686   }
    687 
    688   // If one of the accessed objects may be a subobject of the other, then such
    689   // accesses may alias.
    690   bool MayAlias;
    691   if (mayBeAccessToSubobjectOf(/* BaseTag= */ TagA, /* SubobjectTag= */ TagB,
    692                                CommonType, GenericTag, MayAlias) ||
    693       mayBeAccessToSubobjectOf(/* BaseTag= */ TagB, /* SubobjectTag= */ TagA,
    694                                CommonType, GenericTag, MayAlias))
    695     return MayAlias;
    696 
    697   // Otherwise, we've proved there's no alias.
    698   if (GenericTag)
    699     *GenericTag = createAccessTag(CommonType);
    700   return false;
    701 }
    702 
    703 /// Aliases - Test whether the access represented by tag A may alias the
    704 /// access represented by tag B.
    705 bool TypeBasedAAResult::Aliases(const MDNode *A, const MDNode *B) const {
    706   return matchAccessTags(A, B);
    707 }
    708 
    709 AnalysisKey TypeBasedAA::Key;
    710 
    711 TypeBasedAAResult TypeBasedAA::run(Function &F, FunctionAnalysisManager &AM) {
    712   return TypeBasedAAResult();
    713 }
    714 
    715 char TypeBasedAAWrapperPass::ID = 0;
    716 INITIALIZE_PASS(TypeBasedAAWrapperPass, "tbaa", "Type-Based Alias Analysis",
    717                 false, true)
    718 
    719 ImmutablePass *llvm::createTypeBasedAAWrapperPass() {
    720   return new TypeBasedAAWrapperPass();
    721 }
    722 
    723 TypeBasedAAWrapperPass::TypeBasedAAWrapperPass() : ImmutablePass(ID) {
    724   initializeTypeBasedAAWrapperPassPass(*PassRegistry::getPassRegistry());
    725 }
    726 
    727 bool TypeBasedAAWrapperPass::doInitialization(Module &M) {
    728   Result.reset(new TypeBasedAAResult());
    729   return false;
    730 }
    731 
    732 bool TypeBasedAAWrapperPass::doFinalization(Module &M) {
    733   Result.reset();
    734   return false;
    735 }
    736 
    737 void TypeBasedAAWrapperPass::getAnalysisUsage(AnalysisUsage &AU) const {
    738   AU.setPreservesAll();
    739 }
    740 
    741 MDNode *AAMDNodes::ShiftTBAA(MDNode *MD, size_t Offset) {
    742   // Fast path if there's no offset
    743   if (Offset == 0)
    744     return MD;
    745   // Fast path if there's no path tbaa node (and thus scalar)
    746   if (!isStructPathTBAA(MD))
    747     return MD;
    748 
    749   // The correct behavior here is to add the offset into the TBAA
    750   // struct node offset. The base type, however may not have defined
    751   // a type at this additional offset, resulting in errors. Since
    752   // this method is only used within a given load/store access
    753   // the offset provided is only used to subdivide the previous load
    754   // maintaining the validity of the previous TBAA.
    755   //
    756   // This, however, should be revisited in the future.
    757   return MD;
    758 }
    759 
    760 MDNode *AAMDNodes::ShiftTBAAStruct(MDNode *MD, size_t Offset) {
    761   // Fast path if there's no offset
    762   if (Offset == 0)
    763     return MD;
    764   SmallVector<Metadata *, 3> Sub;
    765   for (size_t i = 0, size = MD->getNumOperands(); i < size; i += 3) {
    766     ConstantInt *InnerOffset = mdconst::extract<ConstantInt>(MD->getOperand(i));
    767     ConstantInt *InnerSize =
    768         mdconst::extract<ConstantInt>(MD->getOperand(i + 1));
    769     // Don't include any triples that aren't in bounds
    770     if (InnerOffset->getZExtValue() + InnerSize->getZExtValue() <= Offset)
    771       continue;
    772 
    773     uint64_t NewSize = InnerSize->getZExtValue();
    774     uint64_t NewOffset = InnerOffset->getZExtValue() - Offset;
    775     if (InnerOffset->getZExtValue() < Offset) {
    776       NewOffset = 0;
    777       NewSize -= Offset - InnerOffset->getZExtValue();
    778     }
    779 
    780     // Shift the offset of the triple
    781     Sub.push_back(ConstantAsMetadata::get(
    782         ConstantInt::get(InnerOffset->getType(), NewOffset)));
    783     Sub.push_back(ConstantAsMetadata::get(
    784         ConstantInt::get(InnerSize->getType(), NewSize)));
    785     Sub.push_back(MD->getOperand(i + 2));
    786   }
    787   return MDNode::get(MD->getContext(), Sub);
    788 }
    789