Home | History | Annotate | Line # | Download | only in IPO
      1 //===- LowerTypeTests.cpp - type metadata lowering pass -------------------===//
      2 //
      3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
      4 // See https://llvm.org/LICENSE.txt for license information.
      5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
      6 //
      7 //===----------------------------------------------------------------------===//
      8 //
      9 // This pass lowers type metadata and calls to the llvm.type.test intrinsic.
     10 // It also ensures that globals are properly laid out for the
     11 // llvm.icall.branch.funnel intrinsic.
     12 // See http://llvm.org/docs/TypeMetadata.html for more information.
     13 //
     14 //===----------------------------------------------------------------------===//
     15 
     16 #include "llvm/Transforms/IPO/LowerTypeTests.h"
     17 #include "llvm/ADT/APInt.h"
     18 #include "llvm/ADT/ArrayRef.h"
     19 #include "llvm/ADT/DenseMap.h"
     20 #include "llvm/ADT/EquivalenceClasses.h"
     21 #include "llvm/ADT/PointerUnion.h"
     22 #include "llvm/ADT/SetVector.h"
     23 #include "llvm/ADT/SmallVector.h"
     24 #include "llvm/ADT/Statistic.h"
     25 #include "llvm/ADT/StringRef.h"
     26 #include "llvm/ADT/TinyPtrVector.h"
     27 #include "llvm/ADT/Triple.h"
     28 #include "llvm/Analysis/TypeMetadataUtils.h"
     29 #include "llvm/Analysis/ValueTracking.h"
     30 #include "llvm/IR/Attributes.h"
     31 #include "llvm/IR/BasicBlock.h"
     32 #include "llvm/IR/Constant.h"
     33 #include "llvm/IR/Constants.h"
     34 #include "llvm/IR/DataLayout.h"
     35 #include "llvm/IR/DerivedTypes.h"
     36 #include "llvm/IR/Function.h"
     37 #include "llvm/IR/GlobalAlias.h"
     38 #include "llvm/IR/GlobalObject.h"
     39 #include "llvm/IR/GlobalValue.h"
     40 #include "llvm/IR/GlobalVariable.h"
     41 #include "llvm/IR/IRBuilder.h"
     42 #include "llvm/IR/InlineAsm.h"
     43 #include "llvm/IR/Instruction.h"
     44 #include "llvm/IR/Instructions.h"
     45 #include "llvm/IR/Intrinsics.h"
     46 #include "llvm/IR/LLVMContext.h"
     47 #include "llvm/IR/Metadata.h"
     48 #include "llvm/IR/Module.h"
     49 #include "llvm/IR/ModuleSummaryIndex.h"
     50 #include "llvm/IR/ModuleSummaryIndexYAML.h"
     51 #include "llvm/IR/Operator.h"
     52 #include "llvm/IR/PassManager.h"
     53 #include "llvm/IR/Type.h"
     54 #include "llvm/IR/Use.h"
     55 #include "llvm/IR/User.h"
     56 #include "llvm/IR/Value.h"
     57 #include "llvm/InitializePasses.h"
     58 #include "llvm/Pass.h"
     59 #include "llvm/Support/Allocator.h"
     60 #include "llvm/Support/Casting.h"
     61 #include "llvm/Support/CommandLine.h"
     62 #include "llvm/Support/Debug.h"
     63 #include "llvm/Support/Error.h"
     64 #include "llvm/Support/ErrorHandling.h"
     65 #include "llvm/Support/FileSystem.h"
     66 #include "llvm/Support/MathExtras.h"
     67 #include "llvm/Support/MemoryBuffer.h"
     68 #include "llvm/Support/TrailingObjects.h"
     69 #include "llvm/Support/YAMLTraits.h"
     70 #include "llvm/Support/raw_ostream.h"
     71 #include "llvm/Transforms/IPO.h"
     72 #include "llvm/Transforms/Utils/BasicBlockUtils.h"
     73 #include "llvm/Transforms/Utils/ModuleUtils.h"
     74 #include <algorithm>
     75 #include <cassert>
     76 #include <cstdint>
     77 #include <memory>
     78 #include <set>
     79 #include <string>
     80 #include <system_error>
     81 #include <utility>
     82 #include <vector>
     83 
     84 using namespace llvm;
     85 using namespace lowertypetests;
     86 
     87 #define DEBUG_TYPE "lowertypetests"
     88 
     89 STATISTIC(ByteArraySizeBits, "Byte array size in bits");
     90 STATISTIC(ByteArraySizeBytes, "Byte array size in bytes");
     91 STATISTIC(NumByteArraysCreated, "Number of byte arrays created");
     92 STATISTIC(NumTypeTestCallsLowered, "Number of type test calls lowered");
     93 STATISTIC(NumTypeIdDisjointSets, "Number of disjoint sets of type identifiers");
     94 
     95 static cl::opt<bool> AvoidReuse(
     96     "lowertypetests-avoid-reuse",
     97     cl::desc("Try to avoid reuse of byte array addresses using aliases"),
     98     cl::Hidden, cl::init(true));
     99 
    100 static cl::opt<PassSummaryAction> ClSummaryAction(
    101     "lowertypetests-summary-action",
    102     cl::desc("What to do with the summary when running this pass"),
    103     cl::values(clEnumValN(PassSummaryAction::None, "none", "Do nothing"),
    104                clEnumValN(PassSummaryAction::Import, "import",
    105                           "Import typeid resolutions from summary and globals"),
    106                clEnumValN(PassSummaryAction::Export, "export",
    107                           "Export typeid resolutions to summary and globals")),
    108     cl::Hidden);
    109 
    110 static cl::opt<std::string> ClReadSummary(
    111     "lowertypetests-read-summary",
    112     cl::desc("Read summary from given YAML file before running pass"),
    113     cl::Hidden);
    114 
    115 static cl::opt<std::string> ClWriteSummary(
    116     "lowertypetests-write-summary",
    117     cl::desc("Write summary to given YAML file after running pass"),
    118     cl::Hidden);
    119 
    120 bool BitSetInfo::containsGlobalOffset(uint64_t Offset) const {
    121   if (Offset < ByteOffset)
    122     return false;
    123 
    124   if ((Offset - ByteOffset) % (uint64_t(1) << AlignLog2) != 0)
    125     return false;
    126 
    127   uint64_t BitOffset = (Offset - ByteOffset) >> AlignLog2;
    128   if (BitOffset >= BitSize)
    129     return false;
    130 
    131   return Bits.count(BitOffset);
    132 }
    133 
    134 void BitSetInfo::print(raw_ostream &OS) const {
    135   OS << "offset " << ByteOffset << " size " << BitSize << " align "
    136      << (1 << AlignLog2);
    137 
    138   if (isAllOnes()) {
    139     OS << " all-ones\n";
    140     return;
    141   }
    142 
    143   OS << " { ";
    144   for (uint64_t B : Bits)
    145     OS << B << ' ';
    146   OS << "}\n";
    147 }
    148 
    149 BitSetInfo BitSetBuilder::build() {
    150   if (Min > Max)
    151     Min = 0;
    152 
    153   // Normalize each offset against the minimum observed offset, and compute
    154   // the bitwise OR of each of the offsets. The number of trailing zeros
    155   // in the mask gives us the log2 of the alignment of all offsets, which
    156   // allows us to compress the bitset by only storing one bit per aligned
    157   // address.
    158   uint64_t Mask = 0;
    159   for (uint64_t &Offset : Offsets) {
    160     Offset -= Min;
    161     Mask |= Offset;
    162   }
    163 
    164   BitSetInfo BSI;
    165   BSI.ByteOffset = Min;
    166 
    167   BSI.AlignLog2 = 0;
    168   if (Mask != 0)
    169     BSI.AlignLog2 = countTrailingZeros(Mask, ZB_Undefined);
    170 
    171   // Build the compressed bitset while normalizing the offsets against the
    172   // computed alignment.
    173   BSI.BitSize = ((Max - Min) >> BSI.AlignLog2) + 1;
    174   for (uint64_t Offset : Offsets) {
    175     Offset >>= BSI.AlignLog2;
    176     BSI.Bits.insert(Offset);
    177   }
    178 
    179   return BSI;
    180 }
    181 
    182 void GlobalLayoutBuilder::addFragment(const std::set<uint64_t> &F) {
    183   // Create a new fragment to hold the layout for F.
    184   Fragments.emplace_back();
    185   std::vector<uint64_t> &Fragment = Fragments.back();
    186   uint64_t FragmentIndex = Fragments.size() - 1;
    187 
    188   for (auto ObjIndex : F) {
    189     uint64_t OldFragmentIndex = FragmentMap[ObjIndex];
    190     if (OldFragmentIndex == 0) {
    191       // We haven't seen this object index before, so just add it to the current
    192       // fragment.
    193       Fragment.push_back(ObjIndex);
    194     } else {
    195       // This index belongs to an existing fragment. Copy the elements of the
    196       // old fragment into this one and clear the old fragment. We don't update
    197       // the fragment map just yet, this ensures that any further references to
    198       // indices from the old fragment in this fragment do not insert any more
    199       // indices.
    200       std::vector<uint64_t> &OldFragment = Fragments[OldFragmentIndex];
    201       llvm::append_range(Fragment, OldFragment);
    202       OldFragment.clear();
    203     }
    204   }
    205 
    206   // Update the fragment map to point our object indices to this fragment.
    207   for (uint64_t ObjIndex : Fragment)
    208     FragmentMap[ObjIndex] = FragmentIndex;
    209 }
    210 
    211 void ByteArrayBuilder::allocate(const std::set<uint64_t> &Bits,
    212                                 uint64_t BitSize, uint64_t &AllocByteOffset,
    213                                 uint8_t &AllocMask) {
    214   // Find the smallest current allocation.
    215   unsigned Bit = 0;
    216   for (unsigned I = 1; I != BitsPerByte; ++I)
    217     if (BitAllocs[I] < BitAllocs[Bit])
    218       Bit = I;
    219 
    220   AllocByteOffset = BitAllocs[Bit];
    221 
    222   // Add our size to it.
    223   unsigned ReqSize = AllocByteOffset + BitSize;
    224   BitAllocs[Bit] = ReqSize;
    225   if (Bytes.size() < ReqSize)
    226     Bytes.resize(ReqSize);
    227 
    228   // Set our bits.
    229   AllocMask = 1 << Bit;
    230   for (uint64_t B : Bits)
    231     Bytes[AllocByteOffset + B] |= AllocMask;
    232 }
    233 
    234 bool lowertypetests::isJumpTableCanonical(Function *F) {
    235   if (F->isDeclarationForLinker())
    236     return false;
    237   auto *CI = mdconst::extract_or_null<ConstantInt>(
    238       F->getParent()->getModuleFlag("CFI Canonical Jump Tables"));
    239   if (!CI || CI->getZExtValue() != 0)
    240     return true;
    241   return F->hasFnAttribute("cfi-canonical-jump-table");
    242 }
    243 
    244 namespace {
    245 
    246 struct ByteArrayInfo {
    247   std::set<uint64_t> Bits;
    248   uint64_t BitSize;
    249   GlobalVariable *ByteArray;
    250   GlobalVariable *MaskGlobal;
    251   uint8_t *MaskPtr = nullptr;
    252 };
    253 
    254 /// A POD-like structure that we use to store a global reference together with
    255 /// its metadata types. In this pass we frequently need to query the set of
    256 /// metadata types referenced by a global, which at the IR level is an expensive
    257 /// operation involving a map lookup; this data structure helps to reduce the
    258 /// number of times we need to do this lookup.
    259 class GlobalTypeMember final : TrailingObjects<GlobalTypeMember, MDNode *> {
    260   friend TrailingObjects;
    261 
    262   GlobalObject *GO;
    263   size_t NTypes;
    264 
    265   // For functions: true if the jump table is canonical. This essentially means
    266   // whether the canonical address (i.e. the symbol table entry) of the function
    267   // is provided by the local jump table. This is normally the same as whether
    268   // the function is defined locally, but if canonical jump tables are disabled
    269   // by the user then the jump table never provides a canonical definition.
    270   bool IsJumpTableCanonical;
    271 
    272   // For functions: true if this function is either defined or used in a thinlto
    273   // module and its jumptable entry needs to be exported to thinlto backends.
    274   bool IsExported;
    275 
    276   size_t numTrailingObjects(OverloadToken<MDNode *>) const { return NTypes; }
    277 
    278 public:
    279   static GlobalTypeMember *create(BumpPtrAllocator &Alloc, GlobalObject *GO,
    280                                   bool IsJumpTableCanonical, bool IsExported,
    281                                   ArrayRef<MDNode *> Types) {
    282     auto *GTM = static_cast<GlobalTypeMember *>(Alloc.Allocate(
    283         totalSizeToAlloc<MDNode *>(Types.size()), alignof(GlobalTypeMember)));
    284     GTM->GO = GO;
    285     GTM->NTypes = Types.size();
    286     GTM->IsJumpTableCanonical = IsJumpTableCanonical;
    287     GTM->IsExported = IsExported;
    288     std::uninitialized_copy(Types.begin(), Types.end(),
    289                             GTM->getTrailingObjects<MDNode *>());
    290     return GTM;
    291   }
    292 
    293   GlobalObject *getGlobal() const {
    294     return GO;
    295   }
    296 
    297   bool isJumpTableCanonical() const {
    298     return IsJumpTableCanonical;
    299   }
    300 
    301   bool isExported() const {
    302     return IsExported;
    303   }
    304 
    305   ArrayRef<MDNode *> types() const {
    306     return makeArrayRef(getTrailingObjects<MDNode *>(), NTypes);
    307   }
    308 };
    309 
    310 struct ICallBranchFunnel final
    311     : TrailingObjects<ICallBranchFunnel, GlobalTypeMember *> {
    312   static ICallBranchFunnel *create(BumpPtrAllocator &Alloc, CallInst *CI,
    313                                    ArrayRef<GlobalTypeMember *> Targets,
    314                                    unsigned UniqueId) {
    315     auto *Call = static_cast<ICallBranchFunnel *>(
    316         Alloc.Allocate(totalSizeToAlloc<GlobalTypeMember *>(Targets.size()),
    317                        alignof(ICallBranchFunnel)));
    318     Call->CI = CI;
    319     Call->UniqueId = UniqueId;
    320     Call->NTargets = Targets.size();
    321     std::uninitialized_copy(Targets.begin(), Targets.end(),
    322                             Call->getTrailingObjects<GlobalTypeMember *>());
    323     return Call;
    324   }
    325 
    326   CallInst *CI;
    327   ArrayRef<GlobalTypeMember *> targets() const {
    328     return makeArrayRef(getTrailingObjects<GlobalTypeMember *>(), NTargets);
    329   }
    330 
    331   unsigned UniqueId;
    332 
    333 private:
    334   size_t NTargets;
    335 };
    336 
    337 struct ScopedSaveAliaseesAndUsed {
    338   Module &M;
    339   SmallVector<GlobalValue *, 4> Used, CompilerUsed;
    340   std::vector<std::pair<GlobalIndirectSymbol *, Function *>> FunctionAliases;
    341 
    342   ScopedSaveAliaseesAndUsed(Module &M) : M(M) {
    343     // The users of this class want to replace all function references except
    344     // for aliases and llvm.used/llvm.compiler.used with references to a jump
    345     // table. We avoid replacing aliases in order to avoid introducing a double
    346     // indirection (or an alias pointing to a declaration in ThinLTO mode), and
    347     // we avoid replacing llvm.used/llvm.compiler.used because these global
    348     // variables describe properties of the global, not the jump table (besides,
    349     // offseted references to the jump table in llvm.used are invalid).
    350     // Unfortunately, LLVM doesn't have a "RAUW except for these (possibly
    351     // indirect) users", so what we do is save the list of globals referenced by
    352     // llvm.used/llvm.compiler.used and aliases, erase the used lists, let RAUW
    353     // replace the aliasees and then set them back to their original values at
    354     // the end.
    355     if (GlobalVariable *GV = collectUsedGlobalVariables(M, Used, false))
    356       GV->eraseFromParent();
    357     if (GlobalVariable *GV = collectUsedGlobalVariables(M, CompilerUsed, true))
    358       GV->eraseFromParent();
    359 
    360     for (auto &GIS : concat<GlobalIndirectSymbol>(M.aliases(), M.ifuncs())) {
    361       // FIXME: This should look past all aliases not just interposable ones,
    362       // see discussion on D65118.
    363       if (auto *F =
    364               dyn_cast<Function>(GIS.getIndirectSymbol()->stripPointerCasts()))
    365         FunctionAliases.push_back({&GIS, F});
    366     }
    367   }
    368 
    369   ~ScopedSaveAliaseesAndUsed() {
    370     appendToUsed(M, Used);
    371     appendToCompilerUsed(M, CompilerUsed);
    372 
    373     for (auto P : FunctionAliases)
    374       P.first->setIndirectSymbol(
    375           ConstantExpr::getBitCast(P.second, P.first->getType()));
    376   }
    377 };
    378 
    379 class LowerTypeTestsModule {
    380   Module &M;
    381 
    382   ModuleSummaryIndex *ExportSummary;
    383   const ModuleSummaryIndex *ImportSummary;
    384   // Set when the client has invoked this to simply drop all type test assume
    385   // sequences.
    386   bool DropTypeTests;
    387 
    388   Triple::ArchType Arch;
    389   Triple::OSType OS;
    390   Triple::ObjectFormatType ObjectFormat;
    391 
    392   IntegerType *Int1Ty = Type::getInt1Ty(M.getContext());
    393   IntegerType *Int8Ty = Type::getInt8Ty(M.getContext());
    394   PointerType *Int8PtrTy = Type::getInt8PtrTy(M.getContext());
    395   ArrayType *Int8Arr0Ty = ArrayType::get(Type::getInt8Ty(M.getContext()), 0);
    396   IntegerType *Int32Ty = Type::getInt32Ty(M.getContext());
    397   PointerType *Int32PtrTy = PointerType::getUnqual(Int32Ty);
    398   IntegerType *Int64Ty = Type::getInt64Ty(M.getContext());
    399   IntegerType *IntPtrTy = M.getDataLayout().getIntPtrType(M.getContext(), 0);
    400 
    401   // Indirect function call index assignment counter for WebAssembly
    402   uint64_t IndirectIndex = 1;
    403 
    404   // Mapping from type identifiers to the call sites that test them, as well as
    405   // whether the type identifier needs to be exported to ThinLTO backends as
    406   // part of the regular LTO phase of the ThinLTO pipeline (see exportTypeId).
    407   struct TypeIdUserInfo {
    408     std::vector<CallInst *> CallSites;
    409     bool IsExported = false;
    410   };
    411   DenseMap<Metadata *, TypeIdUserInfo> TypeIdUsers;
    412 
    413   /// This structure describes how to lower type tests for a particular type
    414   /// identifier. It is either built directly from the global analysis (during
    415   /// regular LTO or the regular LTO phase of ThinLTO), or indirectly using type
    416   /// identifier summaries and external symbol references (in ThinLTO backends).
    417   struct TypeIdLowering {
    418     TypeTestResolution::Kind TheKind = TypeTestResolution::Unsat;
    419 
    420     /// All except Unsat: the start address within the combined global.
    421     Constant *OffsetedGlobal;
    422 
    423     /// ByteArray, Inline, AllOnes: log2 of the required global alignment
    424     /// relative to the start address.
    425     Constant *AlignLog2;
    426 
    427     /// ByteArray, Inline, AllOnes: one less than the size of the memory region
    428     /// covering members of this type identifier as a multiple of 2^AlignLog2.
    429     Constant *SizeM1;
    430 
    431     /// ByteArray: the byte array to test the address against.
    432     Constant *TheByteArray;
    433 
    434     /// ByteArray: the bit mask to apply to bytes loaded from the byte array.
    435     Constant *BitMask;
    436 
    437     /// Inline: the bit mask to test the address against.
    438     Constant *InlineBits;
    439   };
    440 
    441   std::vector<ByteArrayInfo> ByteArrayInfos;
    442 
    443   Function *WeakInitializerFn = nullptr;
    444 
    445   bool shouldExportConstantsAsAbsoluteSymbols();
    446   uint8_t *exportTypeId(StringRef TypeId, const TypeIdLowering &TIL);
    447   TypeIdLowering importTypeId(StringRef TypeId);
    448   void importTypeTest(CallInst *CI);
    449   void importFunction(Function *F, bool isJumpTableCanonical,
    450                       std::vector<GlobalAlias *> &AliasesToErase);
    451 
    452   BitSetInfo
    453   buildBitSet(Metadata *TypeId,
    454               const DenseMap<GlobalTypeMember *, uint64_t> &GlobalLayout);
    455   ByteArrayInfo *createByteArray(BitSetInfo &BSI);
    456   void allocateByteArrays();
    457   Value *createBitSetTest(IRBuilder<> &B, const TypeIdLowering &TIL,
    458                           Value *BitOffset);
    459   void lowerTypeTestCalls(
    460       ArrayRef<Metadata *> TypeIds, Constant *CombinedGlobalAddr,
    461       const DenseMap<GlobalTypeMember *, uint64_t> &GlobalLayout);
    462   Value *lowerTypeTestCall(Metadata *TypeId, CallInst *CI,
    463                            const TypeIdLowering &TIL);
    464 
    465   void buildBitSetsFromGlobalVariables(ArrayRef<Metadata *> TypeIds,
    466                                        ArrayRef<GlobalTypeMember *> Globals);
    467   unsigned getJumpTableEntrySize();
    468   Type *getJumpTableEntryType();
    469   void createJumpTableEntry(raw_ostream &AsmOS, raw_ostream &ConstraintOS,
    470                             Triple::ArchType JumpTableArch,
    471                             SmallVectorImpl<Value *> &AsmArgs, Function *Dest);
    472   void verifyTypeMDNode(GlobalObject *GO, MDNode *Type);
    473   void buildBitSetsFromFunctions(ArrayRef<Metadata *> TypeIds,
    474                                  ArrayRef<GlobalTypeMember *> Functions);
    475   void buildBitSetsFromFunctionsNative(ArrayRef<Metadata *> TypeIds,
    476                                        ArrayRef<GlobalTypeMember *> Functions);
    477   void buildBitSetsFromFunctionsWASM(ArrayRef<Metadata *> TypeIds,
    478                                      ArrayRef<GlobalTypeMember *> Functions);
    479   void
    480   buildBitSetsFromDisjointSet(ArrayRef<Metadata *> TypeIds,
    481                               ArrayRef<GlobalTypeMember *> Globals,
    482                               ArrayRef<ICallBranchFunnel *> ICallBranchFunnels);
    483 
    484   void replaceWeakDeclarationWithJumpTablePtr(Function *F, Constant *JT,
    485                                               bool IsJumpTableCanonical);
    486   void moveInitializerToModuleConstructor(GlobalVariable *GV);
    487   void findGlobalVariableUsersOf(Constant *C,
    488                                  SmallSetVector<GlobalVariable *, 8> &Out);
    489 
    490   void createJumpTable(Function *F, ArrayRef<GlobalTypeMember *> Functions);
    491 
    492   /// replaceCfiUses - Go through the uses list for this definition
    493   /// and make each use point to "V" instead of "this" when the use is outside
    494   /// the block. 'This's use list is expected to have at least one element.
    495   /// Unlike replaceAllUsesWith this function skips blockaddr and direct call
    496   /// uses.
    497   void replaceCfiUses(Function *Old, Value *New, bool IsJumpTableCanonical);
    498 
    499   /// replaceDirectCalls - Go through the uses list for this definition and
    500   /// replace each use, which is a direct function call.
    501   void replaceDirectCalls(Value *Old, Value *New);
    502 
    503 public:
    504   LowerTypeTestsModule(Module &M, ModuleSummaryIndex *ExportSummary,
    505                        const ModuleSummaryIndex *ImportSummary,
    506                        bool DropTypeTests);
    507 
    508   bool lower();
    509 
    510   // Lower the module using the action and summary passed as command line
    511   // arguments. For testing purposes only.
    512   static bool runForTesting(Module &M);
    513 };
    514 
    515 struct LowerTypeTests : public ModulePass {
    516   static char ID;
    517 
    518   bool UseCommandLine = false;
    519 
    520   ModuleSummaryIndex *ExportSummary;
    521   const ModuleSummaryIndex *ImportSummary;
    522   bool DropTypeTests;
    523 
    524   LowerTypeTests() : ModulePass(ID), UseCommandLine(true) {
    525     initializeLowerTypeTestsPass(*PassRegistry::getPassRegistry());
    526   }
    527 
    528   LowerTypeTests(ModuleSummaryIndex *ExportSummary,
    529                  const ModuleSummaryIndex *ImportSummary, bool DropTypeTests)
    530       : ModulePass(ID), ExportSummary(ExportSummary),
    531         ImportSummary(ImportSummary), DropTypeTests(DropTypeTests) {
    532     initializeLowerTypeTestsPass(*PassRegistry::getPassRegistry());
    533   }
    534 
    535   bool runOnModule(Module &M) override {
    536     if (UseCommandLine)
    537       return LowerTypeTestsModule::runForTesting(M);
    538     return LowerTypeTestsModule(M, ExportSummary, ImportSummary, DropTypeTests)
    539         .lower();
    540   }
    541 };
    542 
    543 } // end anonymous namespace
    544 
    545 char LowerTypeTests::ID = 0;
    546 
    547 INITIALIZE_PASS(LowerTypeTests, "lowertypetests", "Lower type metadata", false,
    548                 false)
    549 
    550 ModulePass *
    551 llvm::createLowerTypeTestsPass(ModuleSummaryIndex *ExportSummary,
    552                                const ModuleSummaryIndex *ImportSummary,
    553                                bool DropTypeTests) {
    554   return new LowerTypeTests(ExportSummary, ImportSummary, DropTypeTests);
    555 }
    556 
    557 /// Build a bit set for TypeId using the object layouts in
    558 /// GlobalLayout.
    559 BitSetInfo LowerTypeTestsModule::buildBitSet(
    560     Metadata *TypeId,
    561     const DenseMap<GlobalTypeMember *, uint64_t> &GlobalLayout) {
    562   BitSetBuilder BSB;
    563 
    564   // Compute the byte offset of each address associated with this type
    565   // identifier.
    566   for (auto &GlobalAndOffset : GlobalLayout) {
    567     for (MDNode *Type : GlobalAndOffset.first->types()) {
    568       if (Type->getOperand(1) != TypeId)
    569         continue;
    570       uint64_t Offset =
    571           cast<ConstantInt>(
    572               cast<ConstantAsMetadata>(Type->getOperand(0))->getValue())
    573               ->getZExtValue();
    574       BSB.addOffset(GlobalAndOffset.second + Offset);
    575     }
    576   }
    577 
    578   return BSB.build();
    579 }
    580 
    581 /// Build a test that bit BitOffset mod sizeof(Bits)*8 is set in
    582 /// Bits. This pattern matches to the bt instruction on x86.
    583 static Value *createMaskedBitTest(IRBuilder<> &B, Value *Bits,
    584                                   Value *BitOffset) {
    585   auto BitsType = cast<IntegerType>(Bits->getType());
    586   unsigned BitWidth = BitsType->getBitWidth();
    587 
    588   BitOffset = B.CreateZExtOrTrunc(BitOffset, BitsType);
    589   Value *BitIndex =
    590       B.CreateAnd(BitOffset, ConstantInt::get(BitsType, BitWidth - 1));
    591   Value *BitMask = B.CreateShl(ConstantInt::get(BitsType, 1), BitIndex);
    592   Value *MaskedBits = B.CreateAnd(Bits, BitMask);
    593   return B.CreateICmpNE(MaskedBits, ConstantInt::get(BitsType, 0));
    594 }
    595 
    596 ByteArrayInfo *LowerTypeTestsModule::createByteArray(BitSetInfo &BSI) {
    597   // Create globals to stand in for byte arrays and masks. These never actually
    598   // get initialized, we RAUW and erase them later in allocateByteArrays() once
    599   // we know the offset and mask to use.
    600   auto ByteArrayGlobal = new GlobalVariable(
    601       M, Int8Ty, /*isConstant=*/true, GlobalValue::PrivateLinkage, nullptr);
    602   auto MaskGlobal = new GlobalVariable(M, Int8Ty, /*isConstant=*/true,
    603                                        GlobalValue::PrivateLinkage, nullptr);
    604 
    605   ByteArrayInfos.emplace_back();
    606   ByteArrayInfo *BAI = &ByteArrayInfos.back();
    607 
    608   BAI->Bits = BSI.Bits;
    609   BAI->BitSize = BSI.BitSize;
    610   BAI->ByteArray = ByteArrayGlobal;
    611   BAI->MaskGlobal = MaskGlobal;
    612   return BAI;
    613 }
    614 
    615 void LowerTypeTestsModule::allocateByteArrays() {
    616   llvm::stable_sort(ByteArrayInfos,
    617                     [](const ByteArrayInfo &BAI1, const ByteArrayInfo &BAI2) {
    618                       return BAI1.BitSize > BAI2.BitSize;
    619                     });
    620 
    621   std::vector<uint64_t> ByteArrayOffsets(ByteArrayInfos.size());
    622 
    623   ByteArrayBuilder BAB;
    624   for (unsigned I = 0; I != ByteArrayInfos.size(); ++I) {
    625     ByteArrayInfo *BAI = &ByteArrayInfos[I];
    626 
    627     uint8_t Mask;
    628     BAB.allocate(BAI->Bits, BAI->BitSize, ByteArrayOffsets[I], Mask);
    629 
    630     BAI->MaskGlobal->replaceAllUsesWith(
    631         ConstantExpr::getIntToPtr(ConstantInt::get(Int8Ty, Mask), Int8PtrTy));
    632     BAI->MaskGlobal->eraseFromParent();
    633     if (BAI->MaskPtr)
    634       *BAI->MaskPtr = Mask;
    635   }
    636 
    637   Constant *ByteArrayConst = ConstantDataArray::get(M.getContext(), BAB.Bytes);
    638   auto ByteArray =
    639       new GlobalVariable(M, ByteArrayConst->getType(), /*isConstant=*/true,
    640                          GlobalValue::PrivateLinkage, ByteArrayConst);
    641 
    642   for (unsigned I = 0; I != ByteArrayInfos.size(); ++I) {
    643     ByteArrayInfo *BAI = &ByteArrayInfos[I];
    644 
    645     Constant *Idxs[] = {ConstantInt::get(IntPtrTy, 0),
    646                         ConstantInt::get(IntPtrTy, ByteArrayOffsets[I])};
    647     Constant *GEP = ConstantExpr::getInBoundsGetElementPtr(
    648         ByteArrayConst->getType(), ByteArray, Idxs);
    649 
    650     // Create an alias instead of RAUW'ing the gep directly. On x86 this ensures
    651     // that the pc-relative displacement is folded into the lea instead of the
    652     // test instruction getting another displacement.
    653     GlobalAlias *Alias = GlobalAlias::create(
    654         Int8Ty, 0, GlobalValue::PrivateLinkage, "bits", GEP, &M);
    655     BAI->ByteArray->replaceAllUsesWith(Alias);
    656     BAI->ByteArray->eraseFromParent();
    657   }
    658 
    659   ByteArraySizeBits = BAB.BitAllocs[0] + BAB.BitAllocs[1] + BAB.BitAllocs[2] +
    660                       BAB.BitAllocs[3] + BAB.BitAllocs[4] + BAB.BitAllocs[5] +
    661                       BAB.BitAllocs[6] + BAB.BitAllocs[7];
    662   ByteArraySizeBytes = BAB.Bytes.size();
    663 }
    664 
    665 /// Build a test that bit BitOffset is set in the type identifier that was
    666 /// lowered to TIL, which must be either an Inline or a ByteArray.
    667 Value *LowerTypeTestsModule::createBitSetTest(IRBuilder<> &B,
    668                                               const TypeIdLowering &TIL,
    669                                               Value *BitOffset) {
    670   if (TIL.TheKind == TypeTestResolution::Inline) {
    671     // If the bit set is sufficiently small, we can avoid a load by bit testing
    672     // a constant.
    673     return createMaskedBitTest(B, TIL.InlineBits, BitOffset);
    674   } else {
    675     Constant *ByteArray = TIL.TheByteArray;
    676     if (AvoidReuse && !ImportSummary) {
    677       // Each use of the byte array uses a different alias. This makes the
    678       // backend less likely to reuse previously computed byte array addresses,
    679       // improving the security of the CFI mechanism based on this pass.
    680       // This won't work when importing because TheByteArray is external.
    681       ByteArray = GlobalAlias::create(Int8Ty, 0, GlobalValue::PrivateLinkage,
    682                                       "bits_use", ByteArray, &M);
    683     }
    684 
    685     Value *ByteAddr = B.CreateGEP(Int8Ty, ByteArray, BitOffset);
    686     Value *Byte = B.CreateLoad(Int8Ty, ByteAddr);
    687 
    688     Value *ByteAndMask =
    689         B.CreateAnd(Byte, ConstantExpr::getPtrToInt(TIL.BitMask, Int8Ty));
    690     return B.CreateICmpNE(ByteAndMask, ConstantInt::get(Int8Ty, 0));
    691   }
    692 }
    693 
    694 static bool isKnownTypeIdMember(Metadata *TypeId, const DataLayout &DL,
    695                                 Value *V, uint64_t COffset) {
    696   if (auto GV = dyn_cast<GlobalObject>(V)) {
    697     SmallVector<MDNode *, 2> Types;
    698     GV->getMetadata(LLVMContext::MD_type, Types);
    699     for (MDNode *Type : Types) {
    700       if (Type->getOperand(1) != TypeId)
    701         continue;
    702       uint64_t Offset =
    703           cast<ConstantInt>(
    704               cast<ConstantAsMetadata>(Type->getOperand(0))->getValue())
    705               ->getZExtValue();
    706       if (COffset == Offset)
    707         return true;
    708     }
    709     return false;
    710   }
    711 
    712   if (auto GEP = dyn_cast<GEPOperator>(V)) {
    713     APInt APOffset(DL.getPointerSizeInBits(0), 0);
    714     bool Result = GEP->accumulateConstantOffset(DL, APOffset);
    715     if (!Result)
    716       return false;
    717     COffset += APOffset.getZExtValue();
    718     return isKnownTypeIdMember(TypeId, DL, GEP->getPointerOperand(), COffset);
    719   }
    720 
    721   if (auto Op = dyn_cast<Operator>(V)) {
    722     if (Op->getOpcode() == Instruction::BitCast)
    723       return isKnownTypeIdMember(TypeId, DL, Op->getOperand(0), COffset);
    724 
    725     if (Op->getOpcode() == Instruction::Select)
    726       return isKnownTypeIdMember(TypeId, DL, Op->getOperand(1), COffset) &&
    727              isKnownTypeIdMember(TypeId, DL, Op->getOperand(2), COffset);
    728   }
    729 
    730   return false;
    731 }
    732 
    733 /// Lower a llvm.type.test call to its implementation. Returns the value to
    734 /// replace the call with.
    735 Value *LowerTypeTestsModule::lowerTypeTestCall(Metadata *TypeId, CallInst *CI,
    736                                                const TypeIdLowering &TIL) {
    737   // Delay lowering if the resolution is currently unknown.
    738   if (TIL.TheKind == TypeTestResolution::Unknown)
    739     return nullptr;
    740   if (TIL.TheKind == TypeTestResolution::Unsat)
    741     return ConstantInt::getFalse(M.getContext());
    742 
    743   Value *Ptr = CI->getArgOperand(0);
    744   const DataLayout &DL = M.getDataLayout();
    745   if (isKnownTypeIdMember(TypeId, DL, Ptr, 0))
    746     return ConstantInt::getTrue(M.getContext());
    747 
    748   BasicBlock *InitialBB = CI->getParent();
    749 
    750   IRBuilder<> B(CI);
    751 
    752   Value *PtrAsInt = B.CreatePtrToInt(Ptr, IntPtrTy);
    753 
    754   Constant *OffsetedGlobalAsInt =
    755       ConstantExpr::getPtrToInt(TIL.OffsetedGlobal, IntPtrTy);
    756   if (TIL.TheKind == TypeTestResolution::Single)
    757     return B.CreateICmpEQ(PtrAsInt, OffsetedGlobalAsInt);
    758 
    759   Value *PtrOffset = B.CreateSub(PtrAsInt, OffsetedGlobalAsInt);
    760 
    761   // We need to check that the offset both falls within our range and is
    762   // suitably aligned. We can check both properties at the same time by
    763   // performing a right rotate by log2(alignment) followed by an integer
    764   // comparison against the bitset size. The rotate will move the lower
    765   // order bits that need to be zero into the higher order bits of the
    766   // result, causing the comparison to fail if they are nonzero. The rotate
    767   // also conveniently gives us a bit offset to use during the load from
    768   // the bitset.
    769   Value *OffsetSHR =
    770       B.CreateLShr(PtrOffset, ConstantExpr::getZExt(TIL.AlignLog2, IntPtrTy));
    771   Value *OffsetSHL = B.CreateShl(
    772       PtrOffset, ConstantExpr::getZExt(
    773                      ConstantExpr::getSub(
    774                          ConstantInt::get(Int8Ty, DL.getPointerSizeInBits(0)),
    775                          TIL.AlignLog2),
    776                      IntPtrTy));
    777   Value *BitOffset = B.CreateOr(OffsetSHR, OffsetSHL);
    778 
    779   Value *OffsetInRange = B.CreateICmpULE(BitOffset, TIL.SizeM1);
    780 
    781   // If the bit set is all ones, testing against it is unnecessary.
    782   if (TIL.TheKind == TypeTestResolution::AllOnes)
    783     return OffsetInRange;
    784 
    785   // See if the intrinsic is used in the following common pattern:
    786   //   br(llvm.type.test(...), thenbb, elsebb)
    787   // where nothing happens between the type test and the br.
    788   // If so, create slightly simpler IR.
    789   if (CI->hasOneUse())
    790     if (auto *Br = dyn_cast<BranchInst>(*CI->user_begin()))
    791       if (CI->getNextNode() == Br) {
    792         BasicBlock *Then = InitialBB->splitBasicBlock(CI->getIterator());
    793         BasicBlock *Else = Br->getSuccessor(1);
    794         BranchInst *NewBr = BranchInst::Create(Then, Else, OffsetInRange);
    795         NewBr->setMetadata(LLVMContext::MD_prof,
    796                            Br->getMetadata(LLVMContext::MD_prof));
    797         ReplaceInstWithInst(InitialBB->getTerminator(), NewBr);
    798 
    799         // Update phis in Else resulting from InitialBB being split
    800         for (auto &Phi : Else->phis())
    801           Phi.addIncoming(Phi.getIncomingValueForBlock(Then), InitialBB);
    802 
    803         IRBuilder<> ThenB(CI);
    804         return createBitSetTest(ThenB, TIL, BitOffset);
    805       }
    806 
    807   IRBuilder<> ThenB(SplitBlockAndInsertIfThen(OffsetInRange, CI, false));
    808 
    809   // Now that we know that the offset is in range and aligned, load the
    810   // appropriate bit from the bitset.
    811   Value *Bit = createBitSetTest(ThenB, TIL, BitOffset);
    812 
    813   // The value we want is 0 if we came directly from the initial block
    814   // (having failed the range or alignment checks), or the loaded bit if
    815   // we came from the block in which we loaded it.
    816   B.SetInsertPoint(CI);
    817   PHINode *P = B.CreatePHI(Int1Ty, 2);
    818   P->addIncoming(ConstantInt::get(Int1Ty, 0), InitialBB);
    819   P->addIncoming(Bit, ThenB.GetInsertBlock());
    820   return P;
    821 }
    822 
    823 /// Given a disjoint set of type identifiers and globals, lay out the globals,
    824 /// build the bit sets and lower the llvm.type.test calls.
    825 void LowerTypeTestsModule::buildBitSetsFromGlobalVariables(
    826     ArrayRef<Metadata *> TypeIds, ArrayRef<GlobalTypeMember *> Globals) {
    827   // Build a new global with the combined contents of the referenced globals.
    828   // This global is a struct whose even-indexed elements contain the original
    829   // contents of the referenced globals and whose odd-indexed elements contain
    830   // any padding required to align the next element to the next power of 2 plus
    831   // any additional padding required to meet its alignment requirements.
    832   std::vector<Constant *> GlobalInits;
    833   const DataLayout &DL = M.getDataLayout();
    834   DenseMap<GlobalTypeMember *, uint64_t> GlobalLayout;
    835   Align MaxAlign;
    836   uint64_t CurOffset = 0;
    837   uint64_t DesiredPadding = 0;
    838   for (GlobalTypeMember *G : Globals) {
    839     auto *GV = cast<GlobalVariable>(G->getGlobal());
    840     Align Alignment =
    841         DL.getValueOrABITypeAlignment(GV->getAlign(), GV->getValueType());
    842     MaxAlign = std::max(MaxAlign, Alignment);
    843     uint64_t GVOffset = alignTo(CurOffset + DesiredPadding, Alignment);
    844     GlobalLayout[G] = GVOffset;
    845     if (GVOffset != 0) {
    846       uint64_t Padding = GVOffset - CurOffset;
    847       GlobalInits.push_back(
    848           ConstantAggregateZero::get(ArrayType::get(Int8Ty, Padding)));
    849     }
    850 
    851     GlobalInits.push_back(GV->getInitializer());
    852     uint64_t InitSize = DL.getTypeAllocSize(GV->getValueType());
    853     CurOffset = GVOffset + InitSize;
    854 
    855     // Compute the amount of padding that we'd like for the next element.
    856     DesiredPadding = NextPowerOf2(InitSize - 1) - InitSize;
    857 
    858     // Experiments of different caps with Chromium on both x64 and ARM64
    859     // have shown that the 32-byte cap generates the smallest binary on
    860     // both platforms while different caps yield similar performance.
    861     // (see https://lists.llvm.org/pipermail/llvm-dev/2018-July/124694.html)
    862     if (DesiredPadding > 32)
    863       DesiredPadding = alignTo(InitSize, 32) - InitSize;
    864   }
    865 
    866   Constant *NewInit = ConstantStruct::getAnon(M.getContext(), GlobalInits);
    867   auto *CombinedGlobal =
    868       new GlobalVariable(M, NewInit->getType(), /*isConstant=*/true,
    869                          GlobalValue::PrivateLinkage, NewInit);
    870   CombinedGlobal->setAlignment(MaxAlign);
    871 
    872   StructType *NewTy = cast<StructType>(NewInit->getType());
    873   lowerTypeTestCalls(TypeIds, CombinedGlobal, GlobalLayout);
    874 
    875   // Build aliases pointing to offsets into the combined global for each
    876   // global from which we built the combined global, and replace references
    877   // to the original globals with references to the aliases.
    878   for (unsigned I = 0; I != Globals.size(); ++I) {
    879     GlobalVariable *GV = cast<GlobalVariable>(Globals[I]->getGlobal());
    880 
    881     // Multiply by 2 to account for padding elements.
    882     Constant *CombinedGlobalIdxs[] = {ConstantInt::get(Int32Ty, 0),
    883                                       ConstantInt::get(Int32Ty, I * 2)};
    884     Constant *CombinedGlobalElemPtr = ConstantExpr::getGetElementPtr(
    885         NewInit->getType(), CombinedGlobal, CombinedGlobalIdxs);
    886     assert(GV->getType()->getAddressSpace() == 0);
    887     GlobalAlias *GAlias =
    888         GlobalAlias::create(NewTy->getElementType(I * 2), 0, GV->getLinkage(),
    889                             "", CombinedGlobalElemPtr, &M);
    890     GAlias->setVisibility(GV->getVisibility());
    891     GAlias->takeName(GV);
    892     GV->replaceAllUsesWith(GAlias);
    893     GV->eraseFromParent();
    894   }
    895 }
    896 
    897 bool LowerTypeTestsModule::shouldExportConstantsAsAbsoluteSymbols() {
    898   return (Arch == Triple::x86 || Arch == Triple::x86_64) &&
    899          ObjectFormat == Triple::ELF;
    900 }
    901 
    902 /// Export the given type identifier so that ThinLTO backends may import it.
    903 /// Type identifiers are exported by adding coarse-grained information about how
    904 /// to test the type identifier to the summary, and creating symbols in the
    905 /// object file (aliases and absolute symbols) containing fine-grained
    906 /// information about the type identifier.
    907 ///
    908 /// Returns a pointer to the location in which to store the bitmask, if
    909 /// applicable.
    910 uint8_t *LowerTypeTestsModule::exportTypeId(StringRef TypeId,
    911                                             const TypeIdLowering &TIL) {
    912   TypeTestResolution &TTRes =
    913       ExportSummary->getOrInsertTypeIdSummary(TypeId).TTRes;
    914   TTRes.TheKind = TIL.TheKind;
    915 
    916   auto ExportGlobal = [&](StringRef Name, Constant *C) {
    917     GlobalAlias *GA =
    918         GlobalAlias::create(Int8Ty, 0, GlobalValue::ExternalLinkage,
    919                             "__typeid_" + TypeId + "_" + Name, C, &M);
    920     GA->setVisibility(GlobalValue::HiddenVisibility);
    921   };
    922 
    923   auto ExportConstant = [&](StringRef Name, uint64_t &Storage, Constant *C) {
    924     if (shouldExportConstantsAsAbsoluteSymbols())
    925       ExportGlobal(Name, ConstantExpr::getIntToPtr(C, Int8PtrTy));
    926     else
    927       Storage = cast<ConstantInt>(C)->getZExtValue();
    928   };
    929 
    930   if (TIL.TheKind != TypeTestResolution::Unsat)
    931     ExportGlobal("global_addr", TIL.OffsetedGlobal);
    932 
    933   if (TIL.TheKind == TypeTestResolution::ByteArray ||
    934       TIL.TheKind == TypeTestResolution::Inline ||
    935       TIL.TheKind == TypeTestResolution::AllOnes) {
    936     ExportConstant("align", TTRes.AlignLog2, TIL.AlignLog2);
    937     ExportConstant("size_m1", TTRes.SizeM1, TIL.SizeM1);
    938 
    939     uint64_t BitSize = cast<ConstantInt>(TIL.SizeM1)->getZExtValue() + 1;
    940     if (TIL.TheKind == TypeTestResolution::Inline)
    941       TTRes.SizeM1BitWidth = (BitSize <= 32) ? 5 : 6;
    942     else
    943       TTRes.SizeM1BitWidth = (BitSize <= 128) ? 7 : 32;
    944   }
    945 
    946   if (TIL.TheKind == TypeTestResolution::ByteArray) {
    947     ExportGlobal("byte_array", TIL.TheByteArray);
    948     if (shouldExportConstantsAsAbsoluteSymbols())
    949       ExportGlobal("bit_mask", TIL.BitMask);
    950     else
    951       return &TTRes.BitMask;
    952   }
    953 
    954   if (TIL.TheKind == TypeTestResolution::Inline)
    955     ExportConstant("inline_bits", TTRes.InlineBits, TIL.InlineBits);
    956 
    957   return nullptr;
    958 }
    959 
    960 LowerTypeTestsModule::TypeIdLowering
    961 LowerTypeTestsModule::importTypeId(StringRef TypeId) {
    962   const TypeIdSummary *TidSummary = ImportSummary->getTypeIdSummary(TypeId);
    963   if (!TidSummary)
    964     return {}; // Unsat: no globals match this type id.
    965   const TypeTestResolution &TTRes = TidSummary->TTRes;
    966 
    967   TypeIdLowering TIL;
    968   TIL.TheKind = TTRes.TheKind;
    969 
    970   auto ImportGlobal = [&](StringRef Name) {
    971     // Give the global a type of length 0 so that it is not assumed not to alias
    972     // with any other global.
    973     Constant *C = M.getOrInsertGlobal(("__typeid_" + TypeId + "_" + Name).str(),
    974                                       Int8Arr0Ty);
    975     if (auto *GV = dyn_cast<GlobalVariable>(C))
    976       GV->setVisibility(GlobalValue::HiddenVisibility);
    977     C = ConstantExpr::getBitCast(C, Int8PtrTy);
    978     return C;
    979   };
    980 
    981   auto ImportConstant = [&](StringRef Name, uint64_t Const, unsigned AbsWidth,
    982                             Type *Ty) {
    983     if (!shouldExportConstantsAsAbsoluteSymbols()) {
    984       Constant *C =
    985           ConstantInt::get(isa<IntegerType>(Ty) ? Ty : Int64Ty, Const);
    986       if (!isa<IntegerType>(Ty))
    987         C = ConstantExpr::getIntToPtr(C, Ty);
    988       return C;
    989     }
    990 
    991     Constant *C = ImportGlobal(Name);
    992     auto *GV = cast<GlobalVariable>(C->stripPointerCasts());
    993     if (isa<IntegerType>(Ty))
    994       C = ConstantExpr::getPtrToInt(C, Ty);
    995     if (GV->getMetadata(LLVMContext::MD_absolute_symbol))
    996       return C;
    997 
    998     auto SetAbsRange = [&](uint64_t Min, uint64_t Max) {
    999       auto *MinC = ConstantAsMetadata::get(ConstantInt::get(IntPtrTy, Min));
   1000       auto *MaxC = ConstantAsMetadata::get(ConstantInt::get(IntPtrTy, Max));
   1001       GV->setMetadata(LLVMContext::MD_absolute_symbol,
   1002                       MDNode::get(M.getContext(), {MinC, MaxC}));
   1003     };
   1004     if (AbsWidth == IntPtrTy->getBitWidth())
   1005       SetAbsRange(~0ull, ~0ull); // Full set.
   1006     else
   1007       SetAbsRange(0, 1ull << AbsWidth);
   1008     return C;
   1009   };
   1010 
   1011   if (TIL.TheKind != TypeTestResolution::Unsat)
   1012     TIL.OffsetedGlobal = ImportGlobal("global_addr");
   1013 
   1014   if (TIL.TheKind == TypeTestResolution::ByteArray ||
   1015       TIL.TheKind == TypeTestResolution::Inline ||
   1016       TIL.TheKind == TypeTestResolution::AllOnes) {
   1017     TIL.AlignLog2 = ImportConstant("align", TTRes.AlignLog2, 8, Int8Ty);
   1018     TIL.SizeM1 =
   1019         ImportConstant("size_m1", TTRes.SizeM1, TTRes.SizeM1BitWidth, IntPtrTy);
   1020   }
   1021 
   1022   if (TIL.TheKind == TypeTestResolution::ByteArray) {
   1023     TIL.TheByteArray = ImportGlobal("byte_array");
   1024     TIL.BitMask = ImportConstant("bit_mask", TTRes.BitMask, 8, Int8PtrTy);
   1025   }
   1026 
   1027   if (TIL.TheKind == TypeTestResolution::Inline)
   1028     TIL.InlineBits = ImportConstant(
   1029         "inline_bits", TTRes.InlineBits, 1 << TTRes.SizeM1BitWidth,
   1030         TTRes.SizeM1BitWidth <= 5 ? Int32Ty : Int64Ty);
   1031 
   1032   return TIL;
   1033 }
   1034 
   1035 void LowerTypeTestsModule::importTypeTest(CallInst *CI) {
   1036   auto TypeIdMDVal = dyn_cast<MetadataAsValue>(CI->getArgOperand(1));
   1037   if (!TypeIdMDVal)
   1038     report_fatal_error("Second argument of llvm.type.test must be metadata");
   1039 
   1040   auto TypeIdStr = dyn_cast<MDString>(TypeIdMDVal->getMetadata());
   1041   // If this is a local unpromoted type, which doesn't have a metadata string,
   1042   // treat as Unknown and delay lowering, so that we can still utilize it for
   1043   // later optimizations.
   1044   if (!TypeIdStr)
   1045     return;
   1046 
   1047   TypeIdLowering TIL = importTypeId(TypeIdStr->getString());
   1048   Value *Lowered = lowerTypeTestCall(TypeIdStr, CI, TIL);
   1049   if (Lowered) {
   1050     CI->replaceAllUsesWith(Lowered);
   1051     CI->eraseFromParent();
   1052   }
   1053 }
   1054 
   1055 // ThinLTO backend: the function F has a jump table entry; update this module
   1056 // accordingly. isJumpTableCanonical describes the type of the jump table entry.
   1057 void LowerTypeTestsModule::importFunction(
   1058     Function *F, bool isJumpTableCanonical,
   1059     std::vector<GlobalAlias *> &AliasesToErase) {
   1060   assert(F->getType()->getAddressSpace() == 0);
   1061 
   1062   GlobalValue::VisibilityTypes Visibility = F->getVisibility();
   1063   std::string Name = std::string(F->getName());
   1064 
   1065   if (F->isDeclarationForLinker() && isJumpTableCanonical) {
   1066     // Non-dso_local functions may be overriden at run time,
   1067     // don't short curcuit them
   1068     if (F->isDSOLocal()) {
   1069       Function *RealF = Function::Create(F->getFunctionType(),
   1070                                          GlobalValue::ExternalLinkage,
   1071                                          F->getAddressSpace(),
   1072                                          Name + ".cfi", &M);
   1073       RealF->setVisibility(GlobalVariable::HiddenVisibility);
   1074       replaceDirectCalls(F, RealF);
   1075     }
   1076     return;
   1077   }
   1078 
   1079   Function *FDecl;
   1080   if (!isJumpTableCanonical) {
   1081     // Either a declaration of an external function or a reference to a locally
   1082     // defined jump table.
   1083     FDecl = Function::Create(F->getFunctionType(), GlobalValue::ExternalLinkage,
   1084                              F->getAddressSpace(), Name + ".cfi_jt", &M);
   1085     FDecl->setVisibility(GlobalValue::HiddenVisibility);
   1086   } else {
   1087     F->setName(Name + ".cfi");
   1088     F->setLinkage(GlobalValue::ExternalLinkage);
   1089     FDecl = Function::Create(F->getFunctionType(), GlobalValue::ExternalLinkage,
   1090                              F->getAddressSpace(), Name, &M);
   1091     FDecl->setVisibility(Visibility);
   1092     Visibility = GlobalValue::HiddenVisibility;
   1093 
   1094     // Delete aliases pointing to this function, they'll be re-created in the
   1095     // merged output. Don't do it yet though because ScopedSaveAliaseesAndUsed
   1096     // will want to reset the aliasees first.
   1097     for (auto &U : F->uses()) {
   1098       if (auto *A = dyn_cast<GlobalAlias>(U.getUser())) {
   1099         Function *AliasDecl = Function::Create(
   1100             F->getFunctionType(), GlobalValue::ExternalLinkage,
   1101             F->getAddressSpace(), "", &M);
   1102         AliasDecl->takeName(A);
   1103         A->replaceAllUsesWith(AliasDecl);
   1104         AliasesToErase.push_back(A);
   1105       }
   1106     }
   1107   }
   1108 
   1109   if (F->hasExternalWeakLinkage())
   1110     replaceWeakDeclarationWithJumpTablePtr(F, FDecl, isJumpTableCanonical);
   1111   else
   1112     replaceCfiUses(F, FDecl, isJumpTableCanonical);
   1113 
   1114   // Set visibility late because it's used in replaceCfiUses() to determine
   1115   // whether uses need to to be replaced.
   1116   F->setVisibility(Visibility);
   1117 }
   1118 
   1119 void LowerTypeTestsModule::lowerTypeTestCalls(
   1120     ArrayRef<Metadata *> TypeIds, Constant *CombinedGlobalAddr,
   1121     const DenseMap<GlobalTypeMember *, uint64_t> &GlobalLayout) {
   1122   CombinedGlobalAddr = ConstantExpr::getBitCast(CombinedGlobalAddr, Int8PtrTy);
   1123 
   1124   // For each type identifier in this disjoint set...
   1125   for (Metadata *TypeId : TypeIds) {
   1126     // Build the bitset.
   1127     BitSetInfo BSI = buildBitSet(TypeId, GlobalLayout);
   1128     LLVM_DEBUG({
   1129       if (auto MDS = dyn_cast<MDString>(TypeId))
   1130         dbgs() << MDS->getString() << ": ";
   1131       else
   1132         dbgs() << "<unnamed>: ";
   1133       BSI.print(dbgs());
   1134     });
   1135 
   1136     ByteArrayInfo *BAI = nullptr;
   1137     TypeIdLowering TIL;
   1138     TIL.OffsetedGlobal = ConstantExpr::getGetElementPtr(
   1139         Int8Ty, CombinedGlobalAddr, ConstantInt::get(IntPtrTy, BSI.ByteOffset)),
   1140     TIL.AlignLog2 = ConstantInt::get(Int8Ty, BSI.AlignLog2);
   1141     TIL.SizeM1 = ConstantInt::get(IntPtrTy, BSI.BitSize - 1);
   1142     if (BSI.isAllOnes()) {
   1143       TIL.TheKind = (BSI.BitSize == 1) ? TypeTestResolution::Single
   1144                                        : TypeTestResolution::AllOnes;
   1145     } else if (BSI.BitSize <= 64) {
   1146       TIL.TheKind = TypeTestResolution::Inline;
   1147       uint64_t InlineBits = 0;
   1148       for (auto Bit : BSI.Bits)
   1149         InlineBits |= uint64_t(1) << Bit;
   1150       if (InlineBits == 0)
   1151         TIL.TheKind = TypeTestResolution::Unsat;
   1152       else
   1153         TIL.InlineBits = ConstantInt::get(
   1154             (BSI.BitSize <= 32) ? Int32Ty : Int64Ty, InlineBits);
   1155     } else {
   1156       TIL.TheKind = TypeTestResolution::ByteArray;
   1157       ++NumByteArraysCreated;
   1158       BAI = createByteArray(BSI);
   1159       TIL.TheByteArray = BAI->ByteArray;
   1160       TIL.BitMask = BAI->MaskGlobal;
   1161     }
   1162 
   1163     TypeIdUserInfo &TIUI = TypeIdUsers[TypeId];
   1164 
   1165     if (TIUI.IsExported) {
   1166       uint8_t *MaskPtr = exportTypeId(cast<MDString>(TypeId)->getString(), TIL);
   1167       if (BAI)
   1168         BAI->MaskPtr = MaskPtr;
   1169     }
   1170 
   1171     // Lower each call to llvm.type.test for this type identifier.
   1172     for (CallInst *CI : TIUI.CallSites) {
   1173       ++NumTypeTestCallsLowered;
   1174       Value *Lowered = lowerTypeTestCall(TypeId, CI, TIL);
   1175       if (Lowered) {
   1176         CI->replaceAllUsesWith(Lowered);
   1177         CI->eraseFromParent();
   1178       }
   1179     }
   1180   }
   1181 }
   1182 
   1183 void LowerTypeTestsModule::verifyTypeMDNode(GlobalObject *GO, MDNode *Type) {
   1184   if (Type->getNumOperands() != 2)
   1185     report_fatal_error("All operands of type metadata must have 2 elements");
   1186 
   1187   if (GO->isThreadLocal())
   1188     report_fatal_error("Bit set element may not be thread-local");
   1189   if (isa<GlobalVariable>(GO) && GO->hasSection())
   1190     report_fatal_error(
   1191         "A member of a type identifier may not have an explicit section");
   1192 
   1193   // FIXME: We previously checked that global var member of a type identifier
   1194   // must be a definition, but the IR linker may leave type metadata on
   1195   // declarations. We should restore this check after fixing PR31759.
   1196 
   1197   auto OffsetConstMD = dyn_cast<ConstantAsMetadata>(Type->getOperand(0));
   1198   if (!OffsetConstMD)
   1199     report_fatal_error("Type offset must be a constant");
   1200   auto OffsetInt = dyn_cast<ConstantInt>(OffsetConstMD->getValue());
   1201   if (!OffsetInt)
   1202     report_fatal_error("Type offset must be an integer constant");
   1203 }
   1204 
   1205 static const unsigned kX86JumpTableEntrySize = 8;
   1206 static const unsigned kARMJumpTableEntrySize = 4;
   1207 static const unsigned kARMBTIJumpTableEntrySize = 8;
   1208 
   1209 unsigned LowerTypeTestsModule::getJumpTableEntrySize() {
   1210   switch (Arch) {
   1211     case Triple::x86:
   1212     case Triple::x86_64:
   1213       return kX86JumpTableEntrySize;
   1214     case Triple::arm:
   1215     case Triple::thumb:
   1216       return kARMJumpTableEntrySize;
   1217     case Triple::aarch64:
   1218       if (const auto *BTE = mdconst::extract_or_null<ConstantInt>(
   1219             M.getModuleFlag("branch-target-enforcement")))
   1220         if (BTE->getZExtValue())
   1221           return kARMBTIJumpTableEntrySize;
   1222       return kARMJumpTableEntrySize;
   1223     default:
   1224       report_fatal_error("Unsupported architecture for jump tables");
   1225   }
   1226 }
   1227 
   1228 // Create a jump table entry for the target. This consists of an instruction
   1229 // sequence containing a relative branch to Dest. Appends inline asm text,
   1230 // constraints and arguments to AsmOS, ConstraintOS and AsmArgs.
   1231 void LowerTypeTestsModule::createJumpTableEntry(
   1232     raw_ostream &AsmOS, raw_ostream &ConstraintOS,
   1233     Triple::ArchType JumpTableArch, SmallVectorImpl<Value *> &AsmArgs,
   1234     Function *Dest) {
   1235   unsigned ArgIndex = AsmArgs.size();
   1236 
   1237   if (JumpTableArch == Triple::x86 || JumpTableArch == Triple::x86_64) {
   1238     AsmOS << "jmp ${" << ArgIndex << ":c}@plt\n";
   1239     AsmOS << "int3\nint3\nint3\n";
   1240   } else if (JumpTableArch == Triple::arm) {
   1241     AsmOS << "b $" << ArgIndex << "\n";
   1242   } else if (JumpTableArch == Triple::aarch64) {
   1243     if (const auto *BTE = mdconst::extract_or_null<ConstantInt>(
   1244           Dest->getParent()->getModuleFlag("branch-target-enforcement")))
   1245       if (BTE->getZExtValue())
   1246         AsmOS << "bti c\n";
   1247     AsmOS << "b $" << ArgIndex << "\n";
   1248   } else if (JumpTableArch == Triple::thumb) {
   1249     AsmOS << "b.w $" << ArgIndex << "\n";
   1250   } else {
   1251     report_fatal_error("Unsupported architecture for jump tables");
   1252   }
   1253 
   1254   ConstraintOS << (ArgIndex > 0 ? ",s" : "s");
   1255   AsmArgs.push_back(Dest);
   1256 }
   1257 
   1258 Type *LowerTypeTestsModule::getJumpTableEntryType() {
   1259   return ArrayType::get(Int8Ty, getJumpTableEntrySize());
   1260 }
   1261 
   1262 /// Given a disjoint set of type identifiers and functions, build the bit sets
   1263 /// and lower the llvm.type.test calls, architecture dependently.
   1264 void LowerTypeTestsModule::buildBitSetsFromFunctions(
   1265     ArrayRef<Metadata *> TypeIds, ArrayRef<GlobalTypeMember *> Functions) {
   1266   if (Arch == Triple::x86 || Arch == Triple::x86_64 || Arch == Triple::arm ||
   1267       Arch == Triple::thumb || Arch == Triple::aarch64)
   1268     buildBitSetsFromFunctionsNative(TypeIds, Functions);
   1269   else if (Arch == Triple::wasm32 || Arch == Triple::wasm64)
   1270     buildBitSetsFromFunctionsWASM(TypeIds, Functions);
   1271   else
   1272     report_fatal_error("Unsupported architecture for jump tables");
   1273 }
   1274 
   1275 void LowerTypeTestsModule::moveInitializerToModuleConstructor(
   1276     GlobalVariable *GV) {
   1277   if (WeakInitializerFn == nullptr) {
   1278     WeakInitializerFn = Function::Create(
   1279         FunctionType::get(Type::getVoidTy(M.getContext()),
   1280                           /* IsVarArg */ false),
   1281         GlobalValue::InternalLinkage,
   1282         M.getDataLayout().getProgramAddressSpace(),
   1283         "__cfi_global_var_init", &M);
   1284     BasicBlock *BB =
   1285         BasicBlock::Create(M.getContext(), "entry", WeakInitializerFn);
   1286     ReturnInst::Create(M.getContext(), BB);
   1287     WeakInitializerFn->setSection(
   1288         ObjectFormat == Triple::MachO
   1289             ? "__TEXT,__StaticInit,regular,pure_instructions"
   1290             : ".text.startup");
   1291     // This code is equivalent to relocation application, and should run at the
   1292     // earliest possible time (i.e. with the highest priority).
   1293     appendToGlobalCtors(M, WeakInitializerFn, /* Priority */ 0);
   1294   }
   1295 
   1296   IRBuilder<> IRB(WeakInitializerFn->getEntryBlock().getTerminator());
   1297   GV->setConstant(false);
   1298   IRB.CreateAlignedStore(GV->getInitializer(), GV, GV->getAlign());
   1299   GV->setInitializer(Constant::getNullValue(GV->getValueType()));
   1300 }
   1301 
   1302 void LowerTypeTestsModule::findGlobalVariableUsersOf(
   1303     Constant *C, SmallSetVector<GlobalVariable *, 8> &Out) {
   1304   for (auto *U : C->users()){
   1305     if (auto *GV = dyn_cast<GlobalVariable>(U))
   1306       Out.insert(GV);
   1307     else if (auto *C2 = dyn_cast<Constant>(U))
   1308       findGlobalVariableUsersOf(C2, Out);
   1309   }
   1310 }
   1311 
   1312 // Replace all uses of F with (F ? JT : 0).
   1313 void LowerTypeTestsModule::replaceWeakDeclarationWithJumpTablePtr(
   1314     Function *F, Constant *JT, bool IsJumpTableCanonical) {
   1315   // The target expression can not appear in a constant initializer on most
   1316   // (all?) targets. Switch to a runtime initializer.
   1317   SmallSetVector<GlobalVariable *, 8> GlobalVarUsers;
   1318   findGlobalVariableUsersOf(F, GlobalVarUsers);
   1319   for (auto GV : GlobalVarUsers)
   1320     moveInitializerToModuleConstructor(GV);
   1321 
   1322   // Can not RAUW F with an expression that uses F. Replace with a temporary
   1323   // placeholder first.
   1324   Function *PlaceholderFn =
   1325       Function::Create(cast<FunctionType>(F->getValueType()),
   1326                        GlobalValue::ExternalWeakLinkage,
   1327                        F->getAddressSpace(), "", &M);
   1328   replaceCfiUses(F, PlaceholderFn, IsJumpTableCanonical);
   1329 
   1330   Constant *Target = ConstantExpr::getSelect(
   1331       ConstantExpr::getICmp(CmpInst::ICMP_NE, F,
   1332                             Constant::getNullValue(F->getType())),
   1333       JT, Constant::getNullValue(F->getType()));
   1334   PlaceholderFn->replaceAllUsesWith(Target);
   1335   PlaceholderFn->eraseFromParent();
   1336 }
   1337 
   1338 static bool isThumbFunction(Function *F, Triple::ArchType ModuleArch) {
   1339   Attribute TFAttr = F->getFnAttribute("target-features");
   1340   if (TFAttr.isValid()) {
   1341     SmallVector<StringRef, 6> Features;
   1342     TFAttr.getValueAsString().split(Features, ',');
   1343     for (StringRef Feature : Features) {
   1344       if (Feature == "-thumb-mode")
   1345         return false;
   1346       else if (Feature == "+thumb-mode")
   1347         return true;
   1348     }
   1349   }
   1350 
   1351   return ModuleArch == Triple::thumb;
   1352 }
   1353 
   1354 // Each jump table must be either ARM or Thumb as a whole for the bit-test math
   1355 // to work. Pick one that matches the majority of members to minimize interop
   1356 // veneers inserted by the linker.
   1357 static Triple::ArchType
   1358 selectJumpTableArmEncoding(ArrayRef<GlobalTypeMember *> Functions,
   1359                            Triple::ArchType ModuleArch) {
   1360   if (ModuleArch != Triple::arm && ModuleArch != Triple::thumb)
   1361     return ModuleArch;
   1362 
   1363   unsigned ArmCount = 0, ThumbCount = 0;
   1364   for (const auto GTM : Functions) {
   1365     if (!GTM->isJumpTableCanonical()) {
   1366       // PLT stubs are always ARM.
   1367       // FIXME: This is the wrong heuristic for non-canonical jump tables.
   1368       ++ArmCount;
   1369       continue;
   1370     }
   1371 
   1372     Function *F = cast<Function>(GTM->getGlobal());
   1373     ++(isThumbFunction(F, ModuleArch) ? ThumbCount : ArmCount);
   1374   }
   1375 
   1376   return ArmCount > ThumbCount ? Triple::arm : Triple::thumb;
   1377 }
   1378 
   1379 void LowerTypeTestsModule::createJumpTable(
   1380     Function *F, ArrayRef<GlobalTypeMember *> Functions) {
   1381   std::string AsmStr, ConstraintStr;
   1382   raw_string_ostream AsmOS(AsmStr), ConstraintOS(ConstraintStr);
   1383   SmallVector<Value *, 16> AsmArgs;
   1384   AsmArgs.reserve(Functions.size() * 2);
   1385 
   1386   Triple::ArchType JumpTableArch = selectJumpTableArmEncoding(Functions, Arch);
   1387 
   1388   for (unsigned I = 0; I != Functions.size(); ++I)
   1389     createJumpTableEntry(AsmOS, ConstraintOS, JumpTableArch, AsmArgs,
   1390                          cast<Function>(Functions[I]->getGlobal()));
   1391 
   1392   // Align the whole table by entry size.
   1393   F->setAlignment(Align(getJumpTableEntrySize()));
   1394   // Skip prologue.
   1395   // Disabled on win32 due to https://llvm.org/bugs/show_bug.cgi?id=28641#c3.
   1396   // Luckily, this function does not get any prologue even without the
   1397   // attribute.
   1398   if (OS != Triple::Win32)
   1399     F->addFnAttr(Attribute::Naked);
   1400   if (JumpTableArch == Triple::arm)
   1401     F->addFnAttr("target-features", "-thumb-mode");
   1402   if (JumpTableArch == Triple::thumb) {
   1403     F->addFnAttr("target-features", "+thumb-mode");
   1404     // Thumb jump table assembly needs Thumb2. The following attribute is added
   1405     // by Clang for -march=armv7.
   1406     F->addFnAttr("target-cpu", "cortex-a8");
   1407   }
   1408   if (JumpTableArch == Triple::aarch64) {
   1409     F->addFnAttr("branch-target-enforcement", "false");
   1410     F->addFnAttr("sign-return-address", "none");
   1411   }
   1412   // Make sure we don't emit .eh_frame for this function.
   1413   F->addFnAttr(Attribute::NoUnwind);
   1414 
   1415   BasicBlock *BB = BasicBlock::Create(M.getContext(), "entry", F);
   1416   IRBuilder<> IRB(BB);
   1417 
   1418   SmallVector<Type *, 16> ArgTypes;
   1419   ArgTypes.reserve(AsmArgs.size());
   1420   for (const auto &Arg : AsmArgs)
   1421     ArgTypes.push_back(Arg->getType());
   1422   InlineAsm *JumpTableAsm =
   1423       InlineAsm::get(FunctionType::get(IRB.getVoidTy(), ArgTypes, false),
   1424                      AsmOS.str(), ConstraintOS.str(),
   1425                      /*hasSideEffects=*/true);
   1426 
   1427   IRB.CreateCall(JumpTableAsm, AsmArgs);
   1428   IRB.CreateUnreachable();
   1429 }
   1430 
   1431 /// Given a disjoint set of type identifiers and functions, build a jump table
   1432 /// for the functions, build the bit sets and lower the llvm.type.test calls.
   1433 void LowerTypeTestsModule::buildBitSetsFromFunctionsNative(
   1434     ArrayRef<Metadata *> TypeIds, ArrayRef<GlobalTypeMember *> Functions) {
   1435   // Unlike the global bitset builder, the function bitset builder cannot
   1436   // re-arrange functions in a particular order and base its calculations on the
   1437   // layout of the functions' entry points, as we have no idea how large a
   1438   // particular function will end up being (the size could even depend on what
   1439   // this pass does!) Instead, we build a jump table, which is a block of code
   1440   // consisting of one branch instruction for each of the functions in the bit
   1441   // set that branches to the target function, and redirect any taken function
   1442   // addresses to the corresponding jump table entry. In the object file's
   1443   // symbol table, the symbols for the target functions also refer to the jump
   1444   // table entries, so that addresses taken outside the module will pass any
   1445   // verification done inside the module.
   1446   //
   1447   // In more concrete terms, suppose we have three functions f, g, h which are
   1448   // of the same type, and a function foo that returns their addresses:
   1449   //
   1450   // f:
   1451   // mov 0, %eax
   1452   // ret
   1453   //
   1454   // g:
   1455   // mov 1, %eax
   1456   // ret
   1457   //
   1458   // h:
   1459   // mov 2, %eax
   1460   // ret
   1461   //
   1462   // foo:
   1463   // mov f, %eax
   1464   // mov g, %edx
   1465   // mov h, %ecx
   1466   // ret
   1467   //
   1468   // We output the jump table as module-level inline asm string. The end result
   1469   // will (conceptually) look like this:
   1470   //
   1471   // f = .cfi.jumptable
   1472   // g = .cfi.jumptable + 4
   1473   // h = .cfi.jumptable + 8
   1474   // .cfi.jumptable:
   1475   // jmp f.cfi  ; 5 bytes
   1476   // int3       ; 1 byte
   1477   // int3       ; 1 byte
   1478   // int3       ; 1 byte
   1479   // jmp g.cfi  ; 5 bytes
   1480   // int3       ; 1 byte
   1481   // int3       ; 1 byte
   1482   // int3       ; 1 byte
   1483   // jmp h.cfi  ; 5 bytes
   1484   // int3       ; 1 byte
   1485   // int3       ; 1 byte
   1486   // int3       ; 1 byte
   1487   //
   1488   // f.cfi:
   1489   // mov 0, %eax
   1490   // ret
   1491   //
   1492   // g.cfi:
   1493   // mov 1, %eax
   1494   // ret
   1495   //
   1496   // h.cfi:
   1497   // mov 2, %eax
   1498   // ret
   1499   //
   1500   // foo:
   1501   // mov f, %eax
   1502   // mov g, %edx
   1503   // mov h, %ecx
   1504   // ret
   1505   //
   1506   // Because the addresses of f, g, h are evenly spaced at a power of 2, in the
   1507   // normal case the check can be carried out using the same kind of simple
   1508   // arithmetic that we normally use for globals.
   1509 
   1510   // FIXME: find a better way to represent the jumptable in the IR.
   1511   assert(!Functions.empty());
   1512 
   1513   // Build a simple layout based on the regular layout of jump tables.
   1514   DenseMap<GlobalTypeMember *, uint64_t> GlobalLayout;
   1515   unsigned EntrySize = getJumpTableEntrySize();
   1516   for (unsigned I = 0; I != Functions.size(); ++I)
   1517     GlobalLayout[Functions[I]] = I * EntrySize;
   1518 
   1519   Function *JumpTableFn =
   1520       Function::Create(FunctionType::get(Type::getVoidTy(M.getContext()),
   1521                                          /* IsVarArg */ false),
   1522                        GlobalValue::PrivateLinkage,
   1523                        M.getDataLayout().getProgramAddressSpace(),
   1524                        ".cfi.jumptable", &M);
   1525   ArrayType *JumpTableType =
   1526       ArrayType::get(getJumpTableEntryType(), Functions.size());
   1527   auto JumpTable =
   1528       ConstantExpr::getPointerCast(JumpTableFn, JumpTableType->getPointerTo(0));
   1529 
   1530   lowerTypeTestCalls(TypeIds, JumpTable, GlobalLayout);
   1531 
   1532   {
   1533     ScopedSaveAliaseesAndUsed S(M);
   1534 
   1535     // Build aliases pointing to offsets into the jump table, and replace
   1536     // references to the original functions with references to the aliases.
   1537     for (unsigned I = 0; I != Functions.size(); ++I) {
   1538       Function *F = cast<Function>(Functions[I]->getGlobal());
   1539       bool IsJumpTableCanonical = Functions[I]->isJumpTableCanonical();
   1540 
   1541       Constant *CombinedGlobalElemPtr = ConstantExpr::getBitCast(
   1542           ConstantExpr::getInBoundsGetElementPtr(
   1543               JumpTableType, JumpTable,
   1544               ArrayRef<Constant *>{ConstantInt::get(IntPtrTy, 0),
   1545                                    ConstantInt::get(IntPtrTy, I)}),
   1546           F->getType());
   1547       if (Functions[I]->isExported()) {
   1548         if (IsJumpTableCanonical) {
   1549           ExportSummary->cfiFunctionDefs().insert(std::string(F->getName()));
   1550         } else {
   1551           GlobalAlias *JtAlias = GlobalAlias::create(
   1552               F->getValueType(), 0, GlobalValue::ExternalLinkage,
   1553               F->getName() + ".cfi_jt", CombinedGlobalElemPtr, &M);
   1554           JtAlias->setVisibility(GlobalValue::HiddenVisibility);
   1555           ExportSummary->cfiFunctionDecls().insert(std::string(F->getName()));
   1556         }
   1557       }
   1558       if (!IsJumpTableCanonical) {
   1559         if (F->hasExternalWeakLinkage())
   1560           replaceWeakDeclarationWithJumpTablePtr(F, CombinedGlobalElemPtr,
   1561                                                  IsJumpTableCanonical);
   1562         else
   1563           replaceCfiUses(F, CombinedGlobalElemPtr, IsJumpTableCanonical);
   1564       } else {
   1565         assert(F->getType()->getAddressSpace() == 0);
   1566 
   1567         GlobalAlias *FAlias =
   1568             GlobalAlias::create(F->getValueType(), 0, F->getLinkage(), "",
   1569                                 CombinedGlobalElemPtr, &M);
   1570         FAlias->setVisibility(F->getVisibility());
   1571         FAlias->takeName(F);
   1572         if (FAlias->hasName())
   1573           F->setName(FAlias->getName() + ".cfi");
   1574         replaceCfiUses(F, FAlias, IsJumpTableCanonical);
   1575         if (!F->hasLocalLinkage())
   1576           F->setVisibility(GlobalVariable::HiddenVisibility);
   1577       }
   1578     }
   1579   }
   1580 
   1581   createJumpTable(JumpTableFn, Functions);
   1582 }
   1583 
   1584 /// Assign a dummy layout using an incrementing counter, tag each function
   1585 /// with its index represented as metadata, and lower each type test to an
   1586 /// integer range comparison. During generation of the indirect function call
   1587 /// table in the backend, it will assign the given indexes.
   1588 /// Note: Dynamic linking is not supported, as the WebAssembly ABI has not yet
   1589 /// been finalized.
   1590 void LowerTypeTestsModule::buildBitSetsFromFunctionsWASM(
   1591     ArrayRef<Metadata *> TypeIds, ArrayRef<GlobalTypeMember *> Functions) {
   1592   assert(!Functions.empty());
   1593 
   1594   // Build consecutive monotonic integer ranges for each call target set
   1595   DenseMap<GlobalTypeMember *, uint64_t> GlobalLayout;
   1596 
   1597   for (GlobalTypeMember *GTM : Functions) {
   1598     Function *F = cast<Function>(GTM->getGlobal());
   1599 
   1600     // Skip functions that are not address taken, to avoid bloating the table
   1601     if (!F->hasAddressTaken())
   1602       continue;
   1603 
   1604     // Store metadata with the index for each function
   1605     MDNode *MD = MDNode::get(F->getContext(),
   1606                              ArrayRef<Metadata *>(ConstantAsMetadata::get(
   1607                                  ConstantInt::get(Int64Ty, IndirectIndex))));
   1608     F->setMetadata("wasm.index", MD);
   1609 
   1610     // Assign the counter value
   1611     GlobalLayout[GTM] = IndirectIndex++;
   1612   }
   1613 
   1614   // The indirect function table index space starts at zero, so pass a NULL
   1615   // pointer as the subtracted "jump table" offset.
   1616   lowerTypeTestCalls(TypeIds, ConstantPointerNull::get(Int32PtrTy),
   1617                      GlobalLayout);
   1618 }
   1619 
   1620 void LowerTypeTestsModule::buildBitSetsFromDisjointSet(
   1621     ArrayRef<Metadata *> TypeIds, ArrayRef<GlobalTypeMember *> Globals,
   1622     ArrayRef<ICallBranchFunnel *> ICallBranchFunnels) {
   1623   DenseMap<Metadata *, uint64_t> TypeIdIndices;
   1624   for (unsigned I = 0; I != TypeIds.size(); ++I)
   1625     TypeIdIndices[TypeIds[I]] = I;
   1626 
   1627   // For each type identifier, build a set of indices that refer to members of
   1628   // the type identifier.
   1629   std::vector<std::set<uint64_t>> TypeMembers(TypeIds.size());
   1630   unsigned GlobalIndex = 0;
   1631   DenseMap<GlobalTypeMember *, uint64_t> GlobalIndices;
   1632   for (GlobalTypeMember *GTM : Globals) {
   1633     for (MDNode *Type : GTM->types()) {
   1634       // Type = { offset, type identifier }
   1635       auto I = TypeIdIndices.find(Type->getOperand(1));
   1636       if (I != TypeIdIndices.end())
   1637         TypeMembers[I->second].insert(GlobalIndex);
   1638     }
   1639     GlobalIndices[GTM] = GlobalIndex;
   1640     GlobalIndex++;
   1641   }
   1642 
   1643   for (ICallBranchFunnel *JT : ICallBranchFunnels) {
   1644     TypeMembers.emplace_back();
   1645     std::set<uint64_t> &TMSet = TypeMembers.back();
   1646     for (GlobalTypeMember *T : JT->targets())
   1647       TMSet.insert(GlobalIndices[T]);
   1648   }
   1649 
   1650   // Order the sets of indices by size. The GlobalLayoutBuilder works best
   1651   // when given small index sets first.
   1652   llvm::stable_sort(TypeMembers, [](const std::set<uint64_t> &O1,
   1653                                     const std::set<uint64_t> &O2) {
   1654     return O1.size() < O2.size();
   1655   });
   1656 
   1657   // Create a GlobalLayoutBuilder and provide it with index sets as layout
   1658   // fragments. The GlobalLayoutBuilder tries to lay out members of fragments as
   1659   // close together as possible.
   1660   GlobalLayoutBuilder GLB(Globals.size());
   1661   for (auto &&MemSet : TypeMembers)
   1662     GLB.addFragment(MemSet);
   1663 
   1664   // Build a vector of globals with the computed layout.
   1665   bool IsGlobalSet =
   1666       Globals.empty() || isa<GlobalVariable>(Globals[0]->getGlobal());
   1667   std::vector<GlobalTypeMember *> OrderedGTMs(Globals.size());
   1668   auto OGTMI = OrderedGTMs.begin();
   1669   for (auto &&F : GLB.Fragments) {
   1670     for (auto &&Offset : F) {
   1671       if (IsGlobalSet != isa<GlobalVariable>(Globals[Offset]->getGlobal()))
   1672         report_fatal_error("Type identifier may not contain both global "
   1673                            "variables and functions");
   1674       *OGTMI++ = Globals[Offset];
   1675     }
   1676   }
   1677 
   1678   // Build the bitsets from this disjoint set.
   1679   if (IsGlobalSet)
   1680     buildBitSetsFromGlobalVariables(TypeIds, OrderedGTMs);
   1681   else
   1682     buildBitSetsFromFunctions(TypeIds, OrderedGTMs);
   1683 }
   1684 
   1685 /// Lower all type tests in this module.
   1686 LowerTypeTestsModule::LowerTypeTestsModule(
   1687     Module &M, ModuleSummaryIndex *ExportSummary,
   1688     const ModuleSummaryIndex *ImportSummary, bool DropTypeTests)
   1689     : M(M), ExportSummary(ExportSummary), ImportSummary(ImportSummary),
   1690       DropTypeTests(DropTypeTests) {
   1691   assert(!(ExportSummary && ImportSummary));
   1692   Triple TargetTriple(M.getTargetTriple());
   1693   Arch = TargetTriple.getArch();
   1694   OS = TargetTriple.getOS();
   1695   ObjectFormat = TargetTriple.getObjectFormat();
   1696 }
   1697 
   1698 bool LowerTypeTestsModule::runForTesting(Module &M) {
   1699   ModuleSummaryIndex Summary(/*HaveGVs=*/false);
   1700 
   1701   // Handle the command-line summary arguments. This code is for testing
   1702   // purposes only, so we handle errors directly.
   1703   if (!ClReadSummary.empty()) {
   1704     ExitOnError ExitOnErr("-lowertypetests-read-summary: " + ClReadSummary +
   1705                           ": ");
   1706     auto ReadSummaryFile =
   1707         ExitOnErr(errorOrToExpected(MemoryBuffer::getFile(ClReadSummary)));
   1708 
   1709     yaml::Input In(ReadSummaryFile->getBuffer());
   1710     In >> Summary;
   1711     ExitOnErr(errorCodeToError(In.error()));
   1712   }
   1713 
   1714   bool Changed =
   1715       LowerTypeTestsModule(
   1716           M, ClSummaryAction == PassSummaryAction::Export ? &Summary : nullptr,
   1717           ClSummaryAction == PassSummaryAction::Import ? &Summary : nullptr,
   1718           /*DropTypeTests*/ false)
   1719           .lower();
   1720 
   1721   if (!ClWriteSummary.empty()) {
   1722     ExitOnError ExitOnErr("-lowertypetests-write-summary: " + ClWriteSummary +
   1723                           ": ");
   1724     std::error_code EC;
   1725     raw_fd_ostream OS(ClWriteSummary, EC, sys::fs::OF_TextWithCRLF);
   1726     ExitOnErr(errorCodeToError(EC));
   1727 
   1728     yaml::Output Out(OS);
   1729     Out << Summary;
   1730   }
   1731 
   1732   return Changed;
   1733 }
   1734 
   1735 static bool isDirectCall(Use& U) {
   1736   auto *Usr = dyn_cast<CallInst>(U.getUser());
   1737   if (Usr) {
   1738     auto *CB = dyn_cast<CallBase>(Usr);
   1739     if (CB && CB->isCallee(&U))
   1740       return true;
   1741   }
   1742   return false;
   1743 }
   1744 
   1745 void LowerTypeTestsModule::replaceCfiUses(Function *Old, Value *New,
   1746                                           bool IsJumpTableCanonical) {
   1747   SmallSetVector<Constant *, 4> Constants;
   1748   auto UI = Old->use_begin(), E = Old->use_end();
   1749   for (; UI != E;) {
   1750     Use &U = *UI;
   1751     ++UI;
   1752 
   1753     // Skip block addresses
   1754     if (isa<BlockAddress>(U.getUser()))
   1755       continue;
   1756 
   1757     // Skip direct calls to externally defined or non-dso_local functions
   1758     if (isDirectCall(U) && (Old->isDSOLocal() || !IsJumpTableCanonical))
   1759       continue;
   1760 
   1761     // Must handle Constants specially, we cannot call replaceUsesOfWith on a
   1762     // constant because they are uniqued.
   1763     if (auto *C = dyn_cast<Constant>(U.getUser())) {
   1764       if (!isa<GlobalValue>(C)) {
   1765         // Save unique users to avoid processing operand replacement
   1766         // more than once.
   1767         Constants.insert(C);
   1768         continue;
   1769       }
   1770     }
   1771 
   1772     U.set(New);
   1773   }
   1774 
   1775   // Process operand replacement of saved constants.
   1776   for (auto *C : Constants)
   1777     C->handleOperandChange(Old, New);
   1778 }
   1779 
   1780 void LowerTypeTestsModule::replaceDirectCalls(Value *Old, Value *New) {
   1781   Old->replaceUsesWithIf(New, [](Use &U) { return isDirectCall(U); });
   1782 }
   1783 
   1784 bool LowerTypeTestsModule::lower() {
   1785   Function *TypeTestFunc =
   1786       M.getFunction(Intrinsic::getName(Intrinsic::type_test));
   1787 
   1788   if (DropTypeTests && TypeTestFunc) {
   1789     for (auto UI = TypeTestFunc->use_begin(), UE = TypeTestFunc->use_end();
   1790          UI != UE;) {
   1791       auto *CI = cast<CallInst>((*UI++).getUser());
   1792       // Find and erase llvm.assume intrinsics for this llvm.type.test call.
   1793       for (auto CIU = CI->use_begin(), CIUE = CI->use_end(); CIU != CIUE;)
   1794         if (auto *Assume = dyn_cast<AssumeInst>((*CIU++).getUser()))
   1795           Assume->eraseFromParent();
   1796       CI->eraseFromParent();
   1797     }
   1798 
   1799     // We have deleted the type intrinsics, so we no longer have enough
   1800     // information to reason about the liveness of virtual function pointers
   1801     // in GlobalDCE.
   1802     for (GlobalVariable &GV : M.globals())
   1803       GV.eraseMetadata(LLVMContext::MD_vcall_visibility);
   1804 
   1805     return true;
   1806   }
   1807 
   1808   // If only some of the modules were split, we cannot correctly perform
   1809   // this transformation. We already checked for the presense of type tests
   1810   // with partially split modules during the thin link, and would have emitted
   1811   // an error if any were found, so here we can simply return.
   1812   if ((ExportSummary && ExportSummary->partiallySplitLTOUnits()) ||
   1813       (ImportSummary && ImportSummary->partiallySplitLTOUnits()))
   1814     return false;
   1815 
   1816   Function *ICallBranchFunnelFunc =
   1817       M.getFunction(Intrinsic::getName(Intrinsic::icall_branch_funnel));
   1818   if ((!TypeTestFunc || TypeTestFunc->use_empty()) &&
   1819       (!ICallBranchFunnelFunc || ICallBranchFunnelFunc->use_empty()) &&
   1820       !ExportSummary && !ImportSummary)
   1821     return false;
   1822 
   1823   if (ImportSummary) {
   1824     if (TypeTestFunc) {
   1825       for (auto UI = TypeTestFunc->use_begin(), UE = TypeTestFunc->use_end();
   1826            UI != UE;) {
   1827         auto *CI = cast<CallInst>((*UI++).getUser());
   1828         importTypeTest(CI);
   1829       }
   1830     }
   1831 
   1832     if (ICallBranchFunnelFunc && !ICallBranchFunnelFunc->use_empty())
   1833       report_fatal_error(
   1834           "unexpected call to llvm.icall.branch.funnel during import phase");
   1835 
   1836     SmallVector<Function *, 8> Defs;
   1837     SmallVector<Function *, 8> Decls;
   1838     for (auto &F : M) {
   1839       // CFI functions are either external, or promoted. A local function may
   1840       // have the same name, but it's not the one we are looking for.
   1841       if (F.hasLocalLinkage())
   1842         continue;
   1843       if (ImportSummary->cfiFunctionDefs().count(std::string(F.getName())))
   1844         Defs.push_back(&F);
   1845       else if (ImportSummary->cfiFunctionDecls().count(
   1846                    std::string(F.getName())))
   1847         Decls.push_back(&F);
   1848     }
   1849 
   1850     std::vector<GlobalAlias *> AliasesToErase;
   1851     {
   1852       ScopedSaveAliaseesAndUsed S(M);
   1853       for (auto F : Defs)
   1854         importFunction(F, /*isJumpTableCanonical*/ true, AliasesToErase);
   1855       for (auto F : Decls)
   1856         importFunction(F, /*isJumpTableCanonical*/ false, AliasesToErase);
   1857     }
   1858     for (GlobalAlias *GA : AliasesToErase)
   1859       GA->eraseFromParent();
   1860 
   1861     return true;
   1862   }
   1863 
   1864   // Equivalence class set containing type identifiers and the globals that
   1865   // reference them. This is used to partition the set of type identifiers in
   1866   // the module into disjoint sets.
   1867   using GlobalClassesTy = EquivalenceClasses<
   1868       PointerUnion<GlobalTypeMember *, Metadata *, ICallBranchFunnel *>>;
   1869   GlobalClassesTy GlobalClasses;
   1870 
   1871   // Verify the type metadata and build a few data structures to let us
   1872   // efficiently enumerate the type identifiers associated with a global:
   1873   // a list of GlobalTypeMembers (a GlobalObject stored alongside a vector
   1874   // of associated type metadata) and a mapping from type identifiers to their
   1875   // list of GlobalTypeMembers and last observed index in the list of globals.
   1876   // The indices will be used later to deterministically order the list of type
   1877   // identifiers.
   1878   BumpPtrAllocator Alloc;
   1879   struct TIInfo {
   1880     unsigned UniqueId;
   1881     std::vector<GlobalTypeMember *> RefGlobals;
   1882   };
   1883   DenseMap<Metadata *, TIInfo> TypeIdInfo;
   1884   unsigned CurUniqueId = 0;
   1885   SmallVector<MDNode *, 2> Types;
   1886 
   1887   // Cross-DSO CFI emits jumptable entries for exported functions as well as
   1888   // address taken functions in case they are address taken in other modules.
   1889   const bool CrossDsoCfi = M.getModuleFlag("Cross-DSO CFI") != nullptr;
   1890 
   1891   struct ExportedFunctionInfo {
   1892     CfiFunctionLinkage Linkage;
   1893     MDNode *FuncMD; // {name, linkage, type[, type...]}
   1894   };
   1895   DenseMap<StringRef, ExportedFunctionInfo> ExportedFunctions;
   1896   if (ExportSummary) {
   1897     // A set of all functions that are address taken by a live global object.
   1898     DenseSet<GlobalValue::GUID> AddressTaken;
   1899     for (auto &I : *ExportSummary)
   1900       for (auto &GVS : I.second.SummaryList)
   1901         if (GVS->isLive())
   1902           for (auto &Ref : GVS->refs())
   1903             AddressTaken.insert(Ref.getGUID());
   1904 
   1905     NamedMDNode *CfiFunctionsMD = M.getNamedMetadata("cfi.functions");
   1906     if (CfiFunctionsMD) {
   1907       for (auto FuncMD : CfiFunctionsMD->operands()) {
   1908         assert(FuncMD->getNumOperands() >= 2);
   1909         StringRef FunctionName =
   1910             cast<MDString>(FuncMD->getOperand(0))->getString();
   1911         CfiFunctionLinkage Linkage = static_cast<CfiFunctionLinkage>(
   1912             cast<ConstantAsMetadata>(FuncMD->getOperand(1))
   1913                 ->getValue()
   1914                 ->getUniqueInteger()
   1915                 .getZExtValue());
   1916         const GlobalValue::GUID GUID = GlobalValue::getGUID(
   1917                 GlobalValue::dropLLVMManglingEscape(FunctionName));
   1918         // Do not emit jumptable entries for functions that are not-live and
   1919         // have no live references (and are not exported with cross-DSO CFI.)
   1920         if (!ExportSummary->isGUIDLive(GUID))
   1921           continue;
   1922         if (!AddressTaken.count(GUID)) {
   1923           if (!CrossDsoCfi || Linkage != CFL_Definition)
   1924             continue;
   1925 
   1926           bool Exported = false;
   1927           if (auto VI = ExportSummary->getValueInfo(GUID))
   1928             for (auto &GVS : VI.getSummaryList())
   1929               if (GVS->isLive() && !GlobalValue::isLocalLinkage(GVS->linkage()))
   1930                 Exported = true;
   1931 
   1932           if (!Exported)
   1933             continue;
   1934         }
   1935         auto P = ExportedFunctions.insert({FunctionName, {Linkage, FuncMD}});
   1936         if (!P.second && P.first->second.Linkage != CFL_Definition)
   1937           P.first->second = {Linkage, FuncMD};
   1938       }
   1939 
   1940       for (const auto &P : ExportedFunctions) {
   1941         StringRef FunctionName = P.first;
   1942         CfiFunctionLinkage Linkage = P.second.Linkage;
   1943         MDNode *FuncMD = P.second.FuncMD;
   1944         Function *F = M.getFunction(FunctionName);
   1945         if (F && F->hasLocalLinkage()) {
   1946           // Locally defined function that happens to have the same name as a
   1947           // function defined in a ThinLTO module. Rename it to move it out of
   1948           // the way of the external reference that we're about to create.
   1949           // Note that setName will find a unique name for the function, so even
   1950           // if there is an existing function with the suffix there won't be a
   1951           // name collision.
   1952           F->setName(F->getName() + ".1");
   1953           F = nullptr;
   1954         }
   1955 
   1956         if (!F)
   1957           F = Function::Create(
   1958               FunctionType::get(Type::getVoidTy(M.getContext()), false),
   1959               GlobalVariable::ExternalLinkage,
   1960               M.getDataLayout().getProgramAddressSpace(), FunctionName, &M);
   1961 
   1962         // If the function is available_externally, remove its definition so
   1963         // that it is handled the same way as a declaration. Later we will try
   1964         // to create an alias using this function's linkage, which will fail if
   1965         // the linkage is available_externally. This will also result in us
   1966         // following the code path below to replace the type metadata.
   1967         if (F->hasAvailableExternallyLinkage()) {
   1968           F->setLinkage(GlobalValue::ExternalLinkage);
   1969           F->deleteBody();
   1970           F->setComdat(nullptr);
   1971           F->clearMetadata();
   1972         }
   1973 
   1974         // Update the linkage for extern_weak declarations when a definition
   1975         // exists.
   1976         if (Linkage == CFL_Definition && F->hasExternalWeakLinkage())
   1977           F->setLinkage(GlobalValue::ExternalLinkage);
   1978 
   1979         // If the function in the full LTO module is a declaration, replace its
   1980         // type metadata with the type metadata we found in cfi.functions. That
   1981         // metadata is presumed to be more accurate than the metadata attached
   1982         // to the declaration.
   1983         if (F->isDeclaration()) {
   1984           if (Linkage == CFL_WeakDeclaration)
   1985             F->setLinkage(GlobalValue::ExternalWeakLinkage);
   1986 
   1987           F->eraseMetadata(LLVMContext::MD_type);
   1988           for (unsigned I = 2; I < FuncMD->getNumOperands(); ++I)
   1989             F->addMetadata(LLVMContext::MD_type,
   1990                            *cast<MDNode>(FuncMD->getOperand(I).get()));
   1991         }
   1992       }
   1993     }
   1994   }
   1995 
   1996   DenseMap<GlobalObject *, GlobalTypeMember *> GlobalTypeMembers;
   1997   for (GlobalObject &GO : M.global_objects()) {
   1998     if (isa<GlobalVariable>(GO) && GO.isDeclarationForLinker())
   1999       continue;
   2000 
   2001     Types.clear();
   2002     GO.getMetadata(LLVMContext::MD_type, Types);
   2003 
   2004     bool IsJumpTableCanonical = false;
   2005     bool IsExported = false;
   2006     if (Function *F = dyn_cast<Function>(&GO)) {
   2007       IsJumpTableCanonical = isJumpTableCanonical(F);
   2008       if (ExportedFunctions.count(F->getName())) {
   2009         IsJumpTableCanonical |=
   2010             ExportedFunctions[F->getName()].Linkage == CFL_Definition;
   2011         IsExported = true;
   2012       // TODO: The logic here checks only that the function is address taken,
   2013       // not that the address takers are live. This can be updated to check
   2014       // their liveness and emit fewer jumptable entries once monolithic LTO
   2015       // builds also emit summaries.
   2016       } else if (!F->hasAddressTaken()) {
   2017         if (!CrossDsoCfi || !IsJumpTableCanonical || F->hasLocalLinkage())
   2018           continue;
   2019       }
   2020     }
   2021 
   2022     auto *GTM = GlobalTypeMember::create(Alloc, &GO, IsJumpTableCanonical,
   2023                                          IsExported, Types);
   2024     GlobalTypeMembers[&GO] = GTM;
   2025     for (MDNode *Type : Types) {
   2026       verifyTypeMDNode(&GO, Type);
   2027       auto &Info = TypeIdInfo[Type->getOperand(1)];
   2028       Info.UniqueId = ++CurUniqueId;
   2029       Info.RefGlobals.push_back(GTM);
   2030     }
   2031   }
   2032 
   2033   auto AddTypeIdUse = [&](Metadata *TypeId) -> TypeIdUserInfo & {
   2034     // Add the call site to the list of call sites for this type identifier. We
   2035     // also use TypeIdUsers to keep track of whether we have seen this type
   2036     // identifier before. If we have, we don't need to re-add the referenced
   2037     // globals to the equivalence class.
   2038     auto Ins = TypeIdUsers.insert({TypeId, {}});
   2039     if (Ins.second) {
   2040       // Add the type identifier to the equivalence class.
   2041       GlobalClassesTy::iterator GCI = GlobalClasses.insert(TypeId);
   2042       GlobalClassesTy::member_iterator CurSet = GlobalClasses.findLeader(GCI);
   2043 
   2044       // Add the referenced globals to the type identifier's equivalence class.
   2045       for (GlobalTypeMember *GTM : TypeIdInfo[TypeId].RefGlobals)
   2046         CurSet = GlobalClasses.unionSets(
   2047             CurSet, GlobalClasses.findLeader(GlobalClasses.insert(GTM)));
   2048     }
   2049 
   2050     return Ins.first->second;
   2051   };
   2052 
   2053   if (TypeTestFunc) {
   2054     for (const Use &U : TypeTestFunc->uses()) {
   2055       auto CI = cast<CallInst>(U.getUser());
   2056       // If this type test is only used by llvm.assume instructions, it
   2057       // was used for whole program devirtualization, and is being kept
   2058       // for use by other optimization passes. We do not need or want to
   2059       // lower it here. We also don't want to rewrite any associated globals
   2060       // unnecessarily. These will be removed by a subsequent LTT invocation
   2061       // with the DropTypeTests flag set.
   2062       bool OnlyAssumeUses = !CI->use_empty();
   2063       for (const Use &CIU : CI->uses()) {
   2064         if (isa<AssumeInst>(CIU.getUser()))
   2065           continue;
   2066         OnlyAssumeUses = false;
   2067         break;
   2068       }
   2069       if (OnlyAssumeUses)
   2070         continue;
   2071 
   2072       auto TypeIdMDVal = dyn_cast<MetadataAsValue>(CI->getArgOperand(1));
   2073       if (!TypeIdMDVal)
   2074         report_fatal_error("Second argument of llvm.type.test must be metadata");
   2075       auto TypeId = TypeIdMDVal->getMetadata();
   2076       AddTypeIdUse(TypeId).CallSites.push_back(CI);
   2077     }
   2078   }
   2079 
   2080   if (ICallBranchFunnelFunc) {
   2081     for (const Use &U : ICallBranchFunnelFunc->uses()) {
   2082       if (Arch != Triple::x86_64)
   2083         report_fatal_error(
   2084             "llvm.icall.branch.funnel not supported on this target");
   2085 
   2086       auto CI = cast<CallInst>(U.getUser());
   2087 
   2088       std::vector<GlobalTypeMember *> Targets;
   2089       if (CI->getNumArgOperands() % 2 != 1)
   2090         report_fatal_error("number of arguments should be odd");
   2091 
   2092       GlobalClassesTy::member_iterator CurSet;
   2093       for (unsigned I = 1; I != CI->getNumArgOperands(); I += 2) {
   2094         int64_t Offset;
   2095         auto *Base = dyn_cast<GlobalObject>(GetPointerBaseWithConstantOffset(
   2096             CI->getOperand(I), Offset, M.getDataLayout()));
   2097         if (!Base)
   2098           report_fatal_error(
   2099               "Expected branch funnel operand to be global value");
   2100 
   2101         GlobalTypeMember *GTM = GlobalTypeMembers[Base];
   2102         Targets.push_back(GTM);
   2103         GlobalClassesTy::member_iterator NewSet =
   2104             GlobalClasses.findLeader(GlobalClasses.insert(GTM));
   2105         if (I == 1)
   2106           CurSet = NewSet;
   2107         else
   2108           CurSet = GlobalClasses.unionSets(CurSet, NewSet);
   2109       }
   2110 
   2111       GlobalClasses.unionSets(
   2112           CurSet, GlobalClasses.findLeader(
   2113                       GlobalClasses.insert(ICallBranchFunnel::create(
   2114                           Alloc, CI, Targets, ++CurUniqueId))));
   2115     }
   2116   }
   2117 
   2118   if (ExportSummary) {
   2119     DenseMap<GlobalValue::GUID, TinyPtrVector<Metadata *>> MetadataByGUID;
   2120     for (auto &P : TypeIdInfo) {
   2121       if (auto *TypeId = dyn_cast<MDString>(P.first))
   2122         MetadataByGUID[GlobalValue::getGUID(TypeId->getString())].push_back(
   2123             TypeId);
   2124     }
   2125 
   2126     for (auto &P : *ExportSummary) {
   2127       for (auto &S : P.second.SummaryList) {
   2128         if (!ExportSummary->isGlobalValueLive(S.get()))
   2129           continue;
   2130         if (auto *FS = dyn_cast<FunctionSummary>(S->getBaseObject()))
   2131           for (GlobalValue::GUID G : FS->type_tests())
   2132             for (Metadata *MD : MetadataByGUID[G])
   2133               AddTypeIdUse(MD).IsExported = true;
   2134       }
   2135     }
   2136   }
   2137 
   2138   if (GlobalClasses.empty())
   2139     return false;
   2140 
   2141   // Build a list of disjoint sets ordered by their maximum global index for
   2142   // determinism.
   2143   std::vector<std::pair<GlobalClassesTy::iterator, unsigned>> Sets;
   2144   for (GlobalClassesTy::iterator I = GlobalClasses.begin(),
   2145                                  E = GlobalClasses.end();
   2146        I != E; ++I) {
   2147     if (!I->isLeader())
   2148       continue;
   2149     ++NumTypeIdDisjointSets;
   2150 
   2151     unsigned MaxUniqueId = 0;
   2152     for (GlobalClassesTy::member_iterator MI = GlobalClasses.member_begin(I);
   2153          MI != GlobalClasses.member_end(); ++MI) {
   2154       if (auto *MD = MI->dyn_cast<Metadata *>())
   2155         MaxUniqueId = std::max(MaxUniqueId, TypeIdInfo[MD].UniqueId);
   2156       else if (auto *BF = MI->dyn_cast<ICallBranchFunnel *>())
   2157         MaxUniqueId = std::max(MaxUniqueId, BF->UniqueId);
   2158     }
   2159     Sets.emplace_back(I, MaxUniqueId);
   2160   }
   2161   llvm::sort(Sets,
   2162              [](const std::pair<GlobalClassesTy::iterator, unsigned> &S1,
   2163                 const std::pair<GlobalClassesTy::iterator, unsigned> &S2) {
   2164                return S1.second < S2.second;
   2165              });
   2166 
   2167   // For each disjoint set we found...
   2168   for (const auto &S : Sets) {
   2169     // Build the list of type identifiers in this disjoint set.
   2170     std::vector<Metadata *> TypeIds;
   2171     std::vector<GlobalTypeMember *> Globals;
   2172     std::vector<ICallBranchFunnel *> ICallBranchFunnels;
   2173     for (GlobalClassesTy::member_iterator MI =
   2174              GlobalClasses.member_begin(S.first);
   2175          MI != GlobalClasses.member_end(); ++MI) {
   2176       if (MI->is<Metadata *>())
   2177         TypeIds.push_back(MI->get<Metadata *>());
   2178       else if (MI->is<GlobalTypeMember *>())
   2179         Globals.push_back(MI->get<GlobalTypeMember *>());
   2180       else
   2181         ICallBranchFunnels.push_back(MI->get<ICallBranchFunnel *>());
   2182     }
   2183 
   2184     // Order type identifiers by unique ID for determinism. This ordering is
   2185     // stable as there is a one-to-one mapping between metadata and unique IDs.
   2186     llvm::sort(TypeIds, [&](Metadata *M1, Metadata *M2) {
   2187       return TypeIdInfo[M1].UniqueId < TypeIdInfo[M2].UniqueId;
   2188     });
   2189 
   2190     // Same for the branch funnels.
   2191     llvm::sort(ICallBranchFunnels,
   2192                [&](ICallBranchFunnel *F1, ICallBranchFunnel *F2) {
   2193                  return F1->UniqueId < F2->UniqueId;
   2194                });
   2195 
   2196     // Build bitsets for this disjoint set.
   2197     buildBitSetsFromDisjointSet(TypeIds, Globals, ICallBranchFunnels);
   2198   }
   2199 
   2200   allocateByteArrays();
   2201 
   2202   // Parse alias data to replace stand-in function declarations for aliases
   2203   // with an alias to the intended target.
   2204   if (ExportSummary) {
   2205     if (NamedMDNode *AliasesMD = M.getNamedMetadata("aliases")) {
   2206       for (auto AliasMD : AliasesMD->operands()) {
   2207         assert(AliasMD->getNumOperands() >= 4);
   2208         StringRef AliasName =
   2209             cast<MDString>(AliasMD->getOperand(0))->getString();
   2210         StringRef Aliasee = cast<MDString>(AliasMD->getOperand(1))->getString();
   2211 
   2212         if (!ExportedFunctions.count(Aliasee) ||
   2213             ExportedFunctions[Aliasee].Linkage != CFL_Definition ||
   2214             !M.getNamedAlias(Aliasee))
   2215           continue;
   2216 
   2217         GlobalValue::VisibilityTypes Visibility =
   2218             static_cast<GlobalValue::VisibilityTypes>(
   2219                 cast<ConstantAsMetadata>(AliasMD->getOperand(2))
   2220                     ->getValue()
   2221                     ->getUniqueInteger()
   2222                     .getZExtValue());
   2223         bool Weak =
   2224             static_cast<bool>(cast<ConstantAsMetadata>(AliasMD->getOperand(3))
   2225                                   ->getValue()
   2226                                   ->getUniqueInteger()
   2227                                   .getZExtValue());
   2228 
   2229         auto *Alias = GlobalAlias::create("", M.getNamedAlias(Aliasee));
   2230         Alias->setVisibility(Visibility);
   2231         if (Weak)
   2232           Alias->setLinkage(GlobalValue::WeakAnyLinkage);
   2233 
   2234         if (auto *F = M.getFunction(AliasName)) {
   2235           Alias->takeName(F);
   2236           F->replaceAllUsesWith(Alias);
   2237           F->eraseFromParent();
   2238         } else {
   2239           Alias->setName(AliasName);
   2240         }
   2241       }
   2242     }
   2243   }
   2244 
   2245   // Emit .symver directives for exported functions, if they exist.
   2246   if (ExportSummary) {
   2247     if (NamedMDNode *SymversMD = M.getNamedMetadata("symvers")) {
   2248       for (auto Symver : SymversMD->operands()) {
   2249         assert(Symver->getNumOperands() >= 2);
   2250         StringRef SymbolName =
   2251             cast<MDString>(Symver->getOperand(0))->getString();
   2252         StringRef Alias = cast<MDString>(Symver->getOperand(1))->getString();
   2253 
   2254         if (!ExportedFunctions.count(SymbolName))
   2255           continue;
   2256 
   2257         M.appendModuleInlineAsm(
   2258             (llvm::Twine(".symver ") + SymbolName + ", " + Alias).str());
   2259       }
   2260     }
   2261   }
   2262 
   2263   return true;
   2264 }
   2265 
   2266 PreservedAnalyses LowerTypeTestsPass::run(Module &M,
   2267                                           ModuleAnalysisManager &AM) {
   2268   bool Changed;
   2269   if (UseCommandLine)
   2270     Changed = LowerTypeTestsModule::runForTesting(M);
   2271   else
   2272     Changed =
   2273         LowerTypeTestsModule(M, ExportSummary, ImportSummary, DropTypeTests)
   2274             .lower();
   2275   if (!Changed)
   2276     return PreservedAnalyses::all();
   2277   return PreservedAnalyses::none();
   2278 }
   2279