Home | History | Annotate | Line # | Download | only in Basic
      1 //===- SourceLocation.h - Compact identifier for Source Files ---*- C++ -*-===//
      2 //
      3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
      4 // See https://llvm.org/LICENSE.txt for license information.
      5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
      6 //
      7 //===----------------------------------------------------------------------===//
      8 //
      9 /// \file
     10 /// Defines the clang::SourceLocation class and associated facilities.
     11 //
     12 //===----------------------------------------------------------------------===//
     13 
     14 #ifndef LLVM_CLANG_BASIC_SOURCELOCATION_H
     15 #define LLVM_CLANG_BASIC_SOURCELOCATION_H
     16 
     17 #include "clang/Basic/LLVM.h"
     18 #include "llvm/ADT/StringRef.h"
     19 #include "llvm/Support/PointerLikeTypeTraits.h"
     20 #include <cassert>
     21 #include <cstdint>
     22 #include <string>
     23 #include <utility>
     24 
     25 namespace llvm {
     26 
     27 template <typename T> struct DenseMapInfo;
     28 
     29 class FoldingSetNodeID;
     30 template <typename T> struct FoldingSetTrait;
     31 
     32 } // namespace llvm
     33 
     34 namespace clang {
     35 
     36 class SourceManager;
     37 
     38 /// An opaque identifier used by SourceManager which refers to a
     39 /// source file (MemoryBuffer) along with its \#include path and \#line data.
     40 ///
class FileID {
  /// Mostly-opaque numeric handle: 0 means "invalid", positive values belong
  /// to this module, and values below -1 were loaded from another module.
  int ID = 0;

public:
  /// True when the handle is non-zero.
  bool isValid() const { return !isInvalid(); }
  /// True for the zero handle, which is what default construction produces.
  bool isInvalid() const { return ID == 0; }

  // All comparisons act directly on the underlying integer.
  bool operator==(const FileID &RHS) const { return ID == RHS.ID; }
  bool operator!=(const FileID &RHS) const { return ID != RHS.ID; }
  bool operator<(const FileID &RHS) const { return ID < RHS.ID; }
  bool operator>(const FileID &RHS) const { return ID > RHS.ID; }
  bool operator<=(const FileID &RHS) const { return ID <= RHS.ID; }
  bool operator>=(const FileID &RHS) const { return ID >= RHS.ID; }

  /// Returns the handle whose underlying value is -1.
  static FileID getSentinel() { return get(-1); }

  /// The hash is simply the underlying value converted to unsigned.
  unsigned getHashValue() const { return static_cast<unsigned>(ID); }

private:
  friend class ASTWriter;
  friend class ASTReader;
  friend class SourceManager;

  /// Builds a handle from a raw integer; reachable only by the friends above
  /// and by getSentinel().
  static FileID get(int V) {
    FileID Result;
    Result.ID = V;
    return Result;
  }

  /// Exposes the raw integer to the friend classes.
  int getOpaqueValue() const { return ID; }
};
     73 
     74 /// Encodes a location in the source. The SourceManager can decode this
     75 /// to get at the full include stack, line and column information.
     76 ///
     77 /// Technically, a source location is simply an offset into the manager's view
     78 /// of the input source, which is all input buffers (including macro
     79 /// expansions) concatenated in an effectively arbitrary order. The manager
     80 /// actually maintains two blocks of input buffers. One, starting at offset
     81 /// 0 and growing upwards, contains all buffers from this module. The other,
     82 /// starting at the highest possible offset and growing downwards, contains
     83 /// buffers of loaded modules.
     84 ///
     85 /// In addition, one bit of SourceLocation is used for quick access to the
     86 /// information whether the location is in a file or a macro expansion.
     87 ///
     88 /// It is important that this type remains small. It is currently 32 bits wide.
     89 class SourceLocation {
     90   friend class ASTReader;
     91   friend class ASTWriter;
     92   friend class SourceManager;
     93   friend struct llvm::FoldingSetTrait<SourceLocation>;
     94 
     95   unsigned ID = 0;
     96 
     97   enum : unsigned {
     98     MacroIDBit = 1U << 31
     99   };
    100 
    101 public:
    102   bool isFileID() const  { return (ID & MacroIDBit) == 0; }
    103   bool isMacroID() const { return (ID & MacroIDBit) != 0; }
    104 
    105   /// Return true if this is a valid SourceLocation object.
    106   ///
    107   /// Invalid SourceLocations are often used when events have no corresponding
    108   /// location in the source (e.g. a diagnostic is required for a command line
    109   /// option).
    110   bool isValid() const { return ID != 0; }
    111   bool isInvalid() const { return ID == 0; }
    112 
    113 private:
    114   /// Return the offset into the manager's global input view.
    115   unsigned getOffset() const {
    116     return ID & ~MacroIDBit;
    117   }
    118 
    119   static SourceLocation getFileLoc(unsigned ID) {
    120     assert((ID & MacroIDBit) == 0 && "Ran out of source locations!");
    121     SourceLocation L;
    122     L.ID = ID;
    123     return L;
    124   }
    125 
    126   static SourceLocation getMacroLoc(unsigned ID) {
    127     assert((ID & MacroIDBit) == 0 && "Ran out of source locations!");
    128     SourceLocation L;
    129     L.ID = MacroIDBit | ID;
    130     return L;
    131   }
    132 
    133 public:
    134   /// Return a source location with the specified offset from this
    135   /// SourceLocation.
    136   SourceLocation getLocWithOffset(int Offset) const {
    137     assert(((getOffset()+Offset) & MacroIDBit) == 0 && "offset overflow");
    138     SourceLocation L;
    139     L.ID = ID+Offset;
    140     return L;
    141   }
    142 
    143   /// When a SourceLocation itself cannot be used, this returns
    144   /// an (opaque) 32-bit integer encoding for it.
    145   ///
    146   /// This should only be passed to SourceLocation::getFromRawEncoding, it
    147   /// should not be inspected directly.
    148   unsigned getRawEncoding() const { return ID; }
    149 
    150   /// Turn a raw encoding of a SourceLocation object into
    151   /// a real SourceLocation.
    152   ///
    153   /// \see getRawEncoding.
    154   static SourceLocation getFromRawEncoding(unsigned Encoding) {
    155     SourceLocation X;
    156     X.ID = Encoding;
    157     return X;
    158   }
    159 
    160   /// When a SourceLocation itself cannot be used, this returns
    161   /// an (opaque) pointer encoding for it.
    162   ///
    163   /// This should only be passed to SourceLocation::getFromPtrEncoding, it
    164   /// should not be inspected directly.
    165   void* getPtrEncoding() const {
    166     // Double cast to avoid a warning "cast to pointer from integer of different
    167     // size".
    168     return (void*)(uintptr_t)getRawEncoding();
    169   }
    170 
    171   /// Turn a pointer encoding of a SourceLocation object back
    172   /// into a real SourceLocation.
    173   static SourceLocation getFromPtrEncoding(const void *Encoding) {
    174     return getFromRawEncoding((unsigned)(uintptr_t)Encoding);
    175   }
    176 
    177   static bool isPairOfFileLocations(SourceLocation Start, SourceLocation End) {
    178     return Start.isValid() && Start.isFileID() && End.isValid() &&
    179            End.isFileID();
    180   }
    181 
    182   unsigned getHashValue() const;
    183   void print(raw_ostream &OS, const SourceManager &SM) const;
    184   std::string printToString(const SourceManager &SM) const;
    185   void dump(const SourceManager &SM) const;
    186 };
    187 
    188 inline bool operator==(const SourceLocation &LHS, const SourceLocation &RHS) {
    189   return LHS.getRawEncoding() == RHS.getRawEncoding();
    190 }
    191 
    192 inline bool operator!=(const SourceLocation &LHS, const SourceLocation &RHS) {
    193   return !(LHS == RHS);
    194 }
    195 
    196 // Ordering is meaningful only if LHS and RHS have the same FileID!
    197 // Otherwise use SourceManager::isBeforeInTranslationUnit().
    198 inline bool operator<(const SourceLocation &LHS, const SourceLocation &RHS) {
    199   return LHS.getRawEncoding() < RHS.getRawEncoding();
    200 }
    201 inline bool operator>(const SourceLocation &LHS, const SourceLocation &RHS) {
    202   return LHS.getRawEncoding() > RHS.getRawEncoding();
    203 }
    204 inline bool operator<=(const SourceLocation &LHS, const SourceLocation &RHS) {
    205   return LHS.getRawEncoding() <= RHS.getRawEncoding();
    206 }
    207 inline bool operator>=(const SourceLocation &LHS, const SourceLocation &RHS) {
    208   return LHS.getRawEncoding() >= RHS.getRawEncoding();
    209 }
    210 
    211 /// A trivial tuple used to represent a source range.
    212 class SourceRange {
    213   SourceLocation B;
    214   SourceLocation E;
    215 
    216 public:
    217   SourceRange() = default;
    218   SourceRange(SourceLocation loc) : B(loc), E(loc) {}
    219   SourceRange(SourceLocation begin, SourceLocation end) : B(begin), E(end) {}
    220 
    221   SourceLocation getBegin() const { return B; }
    222   SourceLocation getEnd() const { return E; }
    223 
    224   void setBegin(SourceLocation b) { B = b; }
    225   void setEnd(SourceLocation e) { E = e; }
    226 
    227   bool isValid() const { return B.isValid() && E.isValid(); }
    228   bool isInvalid() const { return !isValid(); }
    229 
    230   bool operator==(const SourceRange &X) const {
    231     return B == X.B && E == X.E;
    232   }
    233 
    234   bool operator!=(const SourceRange &X) const {
    235     return B != X.B || E != X.E;
    236   }
    237 
    238   // Returns true iff other is wholly contained within this range.
    239   bool fullyContains(const SourceRange &other) const {
    240     return B <= other.B && E >= other.E;
    241   }
    242 
    243   void print(raw_ostream &OS, const SourceManager &SM) const;
    244   std::string printToString(const SourceManager &SM) const;
    245   void dump(const SourceManager &SM) const;
    246 };
    247 
    248 /// Represents a character-granular source range.
    249 ///
    250 /// The underlying SourceRange can either specify the starting/ending character
    251 /// of the range, or it can specify the start of the range and the start of the
    252 /// last token of the range (a "token range").  In the token range case, the
    253 /// size of the last token must be measured to determine the actual end of the
    254 /// range.
    255 class CharSourceRange {
    256   SourceRange Range;
    257   bool IsTokenRange = false;
    258 
    259 public:
    260   CharSourceRange() = default;
    261   CharSourceRange(SourceRange R, bool ITR) : Range(R), IsTokenRange(ITR) {}
    262 
    263   static CharSourceRange getTokenRange(SourceRange R) {
    264     return CharSourceRange(R, true);
    265   }
    266 
    267   static CharSourceRange getCharRange(SourceRange R) {
    268     return CharSourceRange(R, false);
    269   }
    270 
    271   static CharSourceRange getTokenRange(SourceLocation B, SourceLocation E) {
    272     return getTokenRange(SourceRange(B, E));
    273   }
    274 
    275   static CharSourceRange getCharRange(SourceLocation B, SourceLocation E) {
    276     return getCharRange(SourceRange(B, E));
    277   }
    278 
    279   /// Return true if the end of this range specifies the start of
    280   /// the last token.  Return false if the end of this range specifies the last
    281   /// character in the range.
    282   bool isTokenRange() const { return IsTokenRange; }
    283   bool isCharRange() const { return !IsTokenRange; }
    284 
    285   SourceLocation getBegin() const { return Range.getBegin(); }
    286   SourceLocation getEnd() const { return Range.getEnd(); }
    287   SourceRange getAsRange() const { return Range; }
    288 
    289   void setBegin(SourceLocation b) { Range.setBegin(b); }
    290   void setEnd(SourceLocation e) { Range.setEnd(e); }
    291   void setTokenRange(bool TR) { IsTokenRange = TR; }
    292 
    293   bool isValid() const { return Range.isValid(); }
    294   bool isInvalid() const { return !isValid(); }
    295 };
    296 
    297 /// Represents an unpacked "presumed" location which can be presented
    298 /// to the user.
    299 ///
    300 /// A 'presumed' location can be modified by \#line and GNU line marker
    301 /// directives and is always the expansion point of a normal location.
    302 ///
    303 /// You can get a PresumedLoc from a SourceLocation with SourceManager.
    304 class PresumedLoc {
    305   const char *Filename = nullptr;
    306   FileID ID;
    307   unsigned Line, Col;
    308   SourceLocation IncludeLoc;
    309 
    310 public:
    311   PresumedLoc() = default;
    312   PresumedLoc(const char *FN, FileID FID, unsigned Ln, unsigned Co,
    313               SourceLocation IL)
    314       : Filename(FN), ID(FID), Line(Ln), Col(Co), IncludeLoc(IL) {}
    315 
    316   /// Return true if this object is invalid or uninitialized.
    317   ///
    318   /// This occurs when created with invalid source locations or when walking
    319   /// off the top of a \#include stack.
    320   bool isInvalid() const { return Filename == nullptr; }
    321   bool isValid() const { return Filename != nullptr; }
    322 
    323   /// Return the presumed filename of this location.
    324   ///
    325   /// This can be affected by \#line etc.
    326   const char *getFilename() const {
    327     assert(isValid());
    328     return Filename;
    329   }
    330 
    331   FileID getFileID() const {
    332     assert(isValid());
    333     return ID;
    334   }
    335 
    336   /// Return the presumed line number of this location.
    337   ///
    338   /// This can be affected by \#line etc.
    339   unsigned getLine() const {
    340     assert(isValid());
    341     return Line;
    342   }
    343 
    344   /// Return the presumed column number of this location.
    345   ///
    346   /// This cannot be affected by \#line, but is packaged here for convenience.
    347   unsigned getColumn() const {
    348     assert(isValid());
    349     return Col;
    350   }
    351 
    352   /// Return the presumed include location of this location.
    353   ///
    354   /// This can be affected by GNU linemarker directives.
    355   SourceLocation getIncludeLoc() const {
    356     assert(isValid());
    357     return IncludeLoc;
    358   }
    359 };
    360 
    361 class FileEntry;
    362 
    363 /// A SourceLocation and its associated SourceManager.
    364 ///
    365 /// This is useful for argument passing to functions that expect both objects.
    366 class FullSourceLoc : public SourceLocation {
    367   const SourceManager *SrcMgr = nullptr;
    368 
    369 public:
    370   /// Creates a FullSourceLoc where isValid() returns \c false.
    371   FullSourceLoc() = default;
    372 
    373   explicit FullSourceLoc(SourceLocation Loc, const SourceManager &SM)
    374       : SourceLocation(Loc), SrcMgr(&SM) {}
    375 
    376   bool hasManager() const {
    377       bool hasSrcMgr =  SrcMgr != nullptr;
    378       assert(hasSrcMgr == isValid() && "FullSourceLoc has location but no manager");
    379       return hasSrcMgr;
    380   }
    381 
    382   /// \pre This FullSourceLoc has an associated SourceManager.
    383   const SourceManager &getManager() const {
    384     assert(SrcMgr && "SourceManager is NULL.");
    385     return *SrcMgr;
    386   }
    387 
    388   FileID getFileID() const;
    389 
    390   FullSourceLoc getExpansionLoc() const;
    391   FullSourceLoc getSpellingLoc() const;
    392   FullSourceLoc getFileLoc() const;
    393   PresumedLoc getPresumedLoc(bool UseLineDirectives = true) const;
    394   bool isMacroArgExpansion(FullSourceLoc *StartLoc = nullptr) const;
    395   FullSourceLoc getImmediateMacroCallerLoc() const;
    396   std::pair<FullSourceLoc, StringRef> getModuleImportLoc() const;
    397   unsigned getFileOffset() const;
    398 
    399   unsigned getExpansionLineNumber(bool *Invalid = nullptr) const;
    400   unsigned getExpansionColumnNumber(bool *Invalid = nullptr) const;
    401 
    402   unsigned getSpellingLineNumber(bool *Invalid = nullptr) const;
    403   unsigned getSpellingColumnNumber(bool *Invalid = nullptr) const;
    404 
    405   const char *getCharacterData(bool *Invalid = nullptr) const;
    406 
    407   unsigned getLineNumber(bool *Invalid = nullptr) const;
    408   unsigned getColumnNumber(bool *Invalid = nullptr) const;
    409 
    410   const FileEntry *getFileEntry() const;
    411 
    412   /// Return a StringRef to the source buffer data for the
    413   /// specified FileID.
    414   StringRef getBufferData(bool *Invalid = nullptr) const;
    415 
    416   /// Decompose the specified location into a raw FileID + Offset pair.
    417   ///
    418   /// The first element is the FileID, the second is the offset from the
    419   /// start of the buffer of the location.
    420   std::pair<FileID, unsigned> getDecomposedLoc() const;
    421 
    422   bool isInSystemHeader() const;
    423 
    424   /// Determines the order of 2 source locations in the translation unit.
    425   ///
    426   /// \returns true if this source location comes before 'Loc', false otherwise.
    427   bool isBeforeInTranslationUnitThan(SourceLocation Loc) const;
    428 
    429   /// Determines the order of 2 source locations in the translation unit.
    430   ///
    431   /// \returns true if this source location comes before 'Loc', false otherwise.
    432   bool isBeforeInTranslationUnitThan(FullSourceLoc Loc) const {
    433     assert(Loc.isValid());
    434     assert(SrcMgr == Loc.SrcMgr && "Loc comes from another SourceManager!");
    435     return isBeforeInTranslationUnitThan((SourceLocation)Loc);
    436   }
    437 
    438   /// Comparison function class, useful for sorting FullSourceLocs.
    439   struct BeforeThanCompare {
    440     bool operator()(const FullSourceLoc& lhs, const FullSourceLoc& rhs) const {
    441       return lhs.isBeforeInTranslationUnitThan(rhs);
    442     }
    443   };
    444 
    445   /// Prints information about this FullSourceLoc to stderr.
    446   ///
    447   /// This is useful for debugging.
    448   void dump() const;
    449 
    450   friend bool
    451   operator==(const FullSourceLoc &LHS, const FullSourceLoc &RHS) {
    452     return LHS.getRawEncoding() == RHS.getRawEncoding() &&
    453           LHS.SrcMgr == RHS.SrcMgr;
    454   }
    455 
    456   friend bool
    457   operator!=(const FullSourceLoc &LHS, const FullSourceLoc &RHS) {
    458     return !(LHS == RHS);
    459   }
    460 };
    461 
    462 } // namespace clang
    463 
    464 namespace llvm {
    465 
  /// Define DenseMapInfo so that FileIDs can be used as keys in DenseMaps and
  /// DenseSets.
    468   template <>
    469   struct DenseMapInfo<clang::FileID> {
    470     static clang::FileID getEmptyKey() {
    471       return {};
    472     }
    473 
    474     static clang::FileID getTombstoneKey() {
    475       return clang::FileID::getSentinel();
    476     }
    477 
    478     static unsigned getHashValue(clang::FileID S) {
    479       return S.getHashValue();
    480     }
    481 
    482     static bool isEqual(clang::FileID LHS, clang::FileID RHS) {
    483       return LHS == RHS;
    484     }
    485   };
    486 
  /// Define DenseMapInfo so that SourceLocations can be used as keys in
  /// DenseMap and DenseSet. This trait class is equivalent to
  /// DenseMapInfo<unsigned>, with SourceLocation::ID used as the key.
    490   template <> struct DenseMapInfo<clang::SourceLocation> {
    491     static clang::SourceLocation getEmptyKey() {
    492       return clang::SourceLocation::getFromRawEncoding(~0U);
    493     }
    494 
    495     static clang::SourceLocation getTombstoneKey() {
    496       return clang::SourceLocation::getFromRawEncoding(~0U - 1);
    497     }
    498 
    499     static unsigned getHashValue(clang::SourceLocation Loc) {
    500       return Loc.getHashValue();
    501     }
    502 
    503     static bool isEqual(clang::SourceLocation LHS, clang::SourceLocation RHS) {
    504       return LHS == RHS;
    505     }
    506   };
    507 
    508   // Allow calling FoldingSetNodeID::Add with SourceLocation object as parameter
    509   template <> struct FoldingSetTrait<clang::SourceLocation> {
    510     static void Profile(const clang::SourceLocation &X, FoldingSetNodeID &ID);
    511   };
    512 
    513   // Teach SmallPtrSet how to handle SourceLocation.
    514   template<>
    515   struct PointerLikeTypeTraits<clang::SourceLocation> {
    516     static constexpr int NumLowBitsAvailable = 0;
    517 
    518     static void *getAsVoidPointer(clang::SourceLocation L) {
    519       return L.getPtrEncoding();
    520     }
    521 
    522     static clang::SourceLocation getFromVoidPointer(void *P) {
    523       return clang::SourceLocation::getFromRawEncoding((unsigned)(uintptr_t)P);
    524     }
    525   };
    526 
    527 } // namespace llvm
    528 
    529 #endif // LLVM_CLANG_BASIC_SOURCELOCATION_H
    530