Home | History | Annotate | Line # | Download | only in Support
      1 //===-- DataExtractor.h -----------------------------------------*- C++ -*-===//
      2 //
      3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
      4 // See https://llvm.org/LICENSE.txt for license information.
      5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
      6 //
      7 //===----------------------------------------------------------------------===//
      8 
      9 #ifndef LLVM_SUPPORT_DATAEXTRACTOR_H
     10 #define LLVM_SUPPORT_DATAEXTRACTOR_H
     11 
     12 #include "llvm/ADT/StringRef.h"
     13 #include "llvm/Support/DataTypes.h"
     14 #include "llvm/Support/Error.h"
     15 
     16 namespace llvm {
     17 
     18 /// An auxiliary type to facilitate extraction of 3-byte entities.
     19 struct Uint24 {
     20   uint8_t Bytes[3];
     21   Uint24(uint8_t U) {
     22     Bytes[0] = Bytes[1] = Bytes[2] = U;
     23   }
     24   Uint24(uint8_t U0, uint8_t U1, uint8_t U2) {
     25     Bytes[0] = U0; Bytes[1] = U1; Bytes[2] = U2;
     26   }
     27   uint32_t getAsUint32(bool IsLittleEndian) const {
     28     int LoIx = IsLittleEndian ? 0 : 2;
     29     return Bytes[LoIx] + (Bytes[1] << 8) + (Bytes[2-LoIx] << 16);
     30   }
     31 };
     32 
     33 using uint24_t = Uint24;
     34 static_assert(sizeof(uint24_t) == 3, "sizeof(uint24_t) != 3");
     35 
     36 /// Needed by swapByteOrder().
     37 inline uint24_t getSwappedBytes(uint24_t C) {
     38   return uint24_t(C.Bytes[2], C.Bytes[1], C.Bytes[0]);
     39 }
     40 
     41 class DataExtractor {
     42   StringRef Data;
     43   uint8_t IsLittleEndian;
     44   uint8_t AddressSize;
     45 public:
     46   /// A class representing a position in a DataExtractor, as well as any error
     47   /// encountered during extraction. It enables one to extract a sequence of
     48   /// values without error-checking and then checking for errors in bulk at the
     49   /// end. The class holds an Error object, so failing to check the result of
     50   /// the parse will result in a runtime error. The error flag is sticky and
     51   /// will cause all subsequent extraction functions to fail without even
     52   /// attempting to parse and without updating the Cursor offset. After clearing
     53   /// the error flag, one can again use the Cursor object for parsing.
     54   class Cursor {
     55     uint64_t Offset;
     56     Error Err;
     57 
     58     friend class DataExtractor;
     59 
     60   public:
     61     /// Construct a cursor for extraction from the given offset.
     62     explicit Cursor(uint64_t Offset) : Offset(Offset), Err(Error::success()) {}
     63 
     64     /// Checks whether the cursor is valid (i.e. no errors were encountered). In
     65     /// case of errors, this does not clear the error flag -- one must call
     66     /// takeError() instead.
     67     explicit operator bool() { return !Err; }
     68 
     69     /// Return the current position of this Cursor. In the error state this is
     70     /// the position of the Cursor before the first error was encountered.
     71     uint64_t tell() const { return Offset; }
     72 
     73     /// Return error contained inside this Cursor, if any. Clears the internal
     74     /// Cursor state.
     75     Error takeError() { return std::move(Err); }
     76   };
     77 
     78   /// Construct with a buffer that is owned by the caller.
     79   ///
     80   /// This constructor allows us to use data that is owned by the
     81   /// caller. The data must stay around as long as this object is
     82   /// valid.
     83   DataExtractor(StringRef Data, bool IsLittleEndian, uint8_t AddressSize)
     84     : Data(Data), IsLittleEndian(IsLittleEndian), AddressSize(AddressSize) {}
     85   DataExtractor(ArrayRef<uint8_t> Data, bool IsLittleEndian,
     86                 uint8_t AddressSize)
     87       : Data(StringRef(reinterpret_cast<const char *>(Data.data()),
     88                        Data.size())),
     89         IsLittleEndian(IsLittleEndian), AddressSize(AddressSize) {}
     90 
     91   /// Get the data pointed to by this extractor.
     92   StringRef getData() const { return Data; }
     93   /// Get the endianness for this extractor.
     94   bool isLittleEndian() const { return IsLittleEndian; }
     95   /// Get the address size for this extractor.
     96   uint8_t getAddressSize() const { return AddressSize; }
     97   /// Set the address size for this extractor.
     98   void setAddressSize(uint8_t Size) { AddressSize = Size; }
     99 
    100   /// Extract a C string from \a *offset_ptr.
    101   ///
    102   /// Returns a pointer to a C String from the data at the offset
    103   /// pointed to by \a offset_ptr. A variable length NULL terminated C
    104   /// string will be extracted and the \a offset_ptr will be
    105   /// updated with the offset of the byte that follows the NULL
    106   /// terminator byte.
    107   ///
    108   /// @param[in,out] OffsetPtr
    109   ///     A pointer to an offset within the data that will be advanced
    110   ///     by the appropriate number of bytes if the value is extracted
    111   ///     correctly. If the offset is out of bounds or there are not
    112   ///     enough bytes to extract this value, the offset will be left
    113   ///     unmodified.
    114   ///
    115   /// @param[in,out] Err
    116   ///     A pointer to an Error object. Upon return the Error object is set to
    117   ///     indicate the result (success/failure) of the function. If the Error
    118   ///     object is already set when calling this function, no extraction is
    119   ///     performed.
    120   ///
    121   /// @return
    122   ///     A pointer to the C string value in the data. If the offset
    123   ///     pointed to by \a offset_ptr is out of bounds, or if the
    124   ///     offset plus the length of the C string is out of bounds,
    125   ///     NULL will be returned.
    126   const char *getCStr(uint64_t *OffsetPtr, Error *Err = nullptr) const {
    127     return getCStrRef(OffsetPtr, Err).data();
    128   }
    129 
    130   /// Extract a C string from the location given by the cursor. In case of an
    131   /// extraction error, or if the cursor is already in an error state, a
    132   /// nullptr is returned.
    133   const char *getCStr(Cursor &C) const { return getCStrRef(C).data(); }
    134 
    135   /// Extract a C string from \a *offset_ptr.
    136   ///
    137   /// Returns a StringRef for the C String from the data at the offset
    138   /// pointed to by \a offset_ptr. A variable length NULL terminated C
    139   /// string will be extracted and the \a offset_ptr will be
    140   /// updated with the offset of the byte that follows the NULL
    141   /// terminator byte.
    142   ///
    143   /// \param[in,out] OffsetPtr
    144   ///     A pointer to an offset within the data that will be advanced
    145   ///     by the appropriate number of bytes if the value is extracted
    146   ///     correctly. If the offset is out of bounds or there are not
    147   ///     enough bytes to extract this value, the offset will be left
    148   ///     unmodified.
    149   ///
    150   /// @param[in,out] Err
    151   ///     A pointer to an Error object. Upon return the Error object is set to
    152   ///     indicate the result (success/failure) of the function. If the Error
    153   ///     object is already set when calling this function, no extraction is
    154   ///     performed.
    155   ///
    156   /// \return
    157   ///     A StringRef for the C string value in the data. If the offset
    158   ///     pointed to by \a offset_ptr is out of bounds, or if the
    159   ///     offset plus the length of the C string is out of bounds,
    160   ///     a default-initialized StringRef will be returned.
    161   StringRef getCStrRef(uint64_t *OffsetPtr, Error *Err = nullptr) const;
    162 
    163   /// Extract a C string (as a StringRef) from the location given by the cursor.
    164   /// In case of an extraction error, or if the cursor is already in an error
    165   /// state, a default-initialized StringRef is returned.
    166   StringRef getCStrRef(Cursor &C) const {
    167     return getCStrRef(&C.Offset, &C.Err);
    168   }
    169 
    170   /// Extract a fixed length string from \a *OffsetPtr and consume \a Length
    171   /// bytes.
    172   ///
    173   /// Returns a StringRef for the string from the data at the offset
    174   /// pointed to by \a OffsetPtr. A fixed length C string will be extracted
    175   /// and the \a OffsetPtr will be advanced by \a Length bytes.
    176   ///
    177   /// \param[in,out] OffsetPtr
    178   ///     A pointer to an offset within the data that will be advanced
    179   ///     by the appropriate number of bytes if the value is extracted
    180   ///     correctly. If the offset is out of bounds or there are not
    181   ///     enough bytes to extract this value, the offset will be left
    182   ///     unmodified.
    183   ///
    184   /// \param[in] Length
    185   ///     The length of the fixed length string to extract. If there are not
    186   ///     enough bytes in the data to extract the full string, the offset will
    187   ///     be left unmodified.
    188   ///
    189   /// \param[in] TrimChars
    190   ///     A set of characters to trim from the end of the string. Fixed length
    191   ///     strings are commonly either NULL terminated by one or more zero
    192   ///     bytes. Some clients have one or more spaces at the end of the string,
    193   ///     but a good default is to trim the NULL characters.
    194   ///
    195   /// \return
    196   ///     A StringRef for the C string value in the data. If the offset
    197   ///     pointed to by \a OffsetPtr is out of bounds, or if the
    198   ///     offset plus the length of the C string is out of bounds,
    199   ///     a default-initialized StringRef will be returned.
    200   StringRef getFixedLengthString(uint64_t *OffsetPtr,
    201       uint64_t Length, StringRef TrimChars = {"\0", 1}) const;
    202 
    203   /// Extract a fixed number of bytes from the specified offset.
    204   ///
    205   /// Returns a StringRef for the bytes from the data at the offset
    206   /// pointed to by \a OffsetPtr. A fixed length C string will be extracted
    207   /// and the \a OffsetPtr will be advanced by \a Length bytes.
    208   ///
    209   /// \param[in,out] OffsetPtr
    210   ///     A pointer to an offset within the data that will be advanced
    211   ///     by the appropriate number of bytes if the value is extracted
    212   ///     correctly. If the offset is out of bounds or there are not
    213   ///     enough bytes to extract this value, the offset will be left
    214   ///     unmodified.
    215   ///
    216   /// \param[in] Length
    217   ///     The number of bytes to extract. If there are not enough bytes in the
    218   ///     data to extract all of the bytes, the offset will be left unmodified.
    219   ///
    220   /// @param[in,out] Err
    221   ///     A pointer to an Error object. Upon return the Error object is set to
    222   ///     indicate the result (success/failure) of the function. If the Error
    223   ///     object is already set when calling this function, no extraction is
    224   ///     performed.
    225   ///
    226   /// \return
    227   ///     A StringRef for the extracted bytes. If the offset pointed to by
    228   ///     \a OffsetPtr is out of bounds, or if the offset plus the length
    229   ///     is out of bounds, a default-initialized StringRef will be returned.
    230   StringRef getBytes(uint64_t *OffsetPtr, uint64_t Length,
    231                      Error *Err = nullptr) const;
    232 
    233   /// Extract a fixed number of bytes from the location given by the cursor. In
    234   /// case of an extraction error, or if the cursor is already in an error
    235   /// state, a default-initialized StringRef is returned.
    236   StringRef getBytes(Cursor &C, uint64_t Length) {
    237     return getBytes(&C.Offset, Length, &C.Err);
    238   }
    239 
    240   /// Extract an unsigned integer of size \a byte_size from \a
    241   /// *offset_ptr.
    242   ///
    243   /// Extract a single unsigned integer value and update the offset
    244   /// pointed to by \a offset_ptr. The size of the extracted integer
    245   /// is specified by the \a byte_size argument. \a byte_size should
    246   /// have a value greater than or equal to one and less than or equal
    247   /// to eight since the return value is 64 bits wide. Any
    248   /// \a byte_size values less than 1 or greater than 8 will result in
    249   /// nothing being extracted, and zero being returned.
    250   ///
    251   /// @param[in,out] offset_ptr
    252   ///     A pointer to an offset within the data that will be advanced
    253   ///     by the appropriate number of bytes if the value is extracted
    254   ///     correctly. If the offset is out of bounds or there are not
    255   ///     enough bytes to extract this value, the offset will be left
    256   ///     unmodified.
    257   ///
    258   /// @param[in] byte_size
    259   ///     The size in byte of the integer to extract.
    260   ///
    261   /// @param[in,out] Err
    262   ///     A pointer to an Error object. Upon return the Error object is set to
    263   ///     indicate the result (success/failure) of the function. If the Error
    264   ///     object is already set when calling this function, no extraction is
    265   ///     performed.
    266   ///
    267   /// @return
    268   ///     The unsigned integer value that was extracted, or zero on
    269   ///     failure.
    270   uint64_t getUnsigned(uint64_t *offset_ptr, uint32_t byte_size,
    271                        Error *Err = nullptr) const;
    272 
    273   /// Extract an unsigned integer of the given size from the location given by
    274   /// the cursor. In case of an extraction error, or if the cursor is already in
    275   /// an error state, zero is returned.
    276   uint64_t getUnsigned(Cursor &C, uint32_t Size) const {
    277     return getUnsigned(&C.Offset, Size, &C.Err);
    278   }
    279 
    280   /// Extract an signed integer of size \a byte_size from \a *offset_ptr.
    281   ///
    282   /// Extract a single signed integer value (sign extending if required)
    283   /// and update the offset pointed to by \a offset_ptr. The size of
    284   /// the extracted integer is specified by the \a byte_size argument.
    285   /// \a byte_size should have a value greater than or equal to one
    286   /// and less than or equal to eight since the return value is 64
    287   /// bits wide. Any \a byte_size values less than 1 or greater than
    288   /// 8 will result in nothing being extracted, and zero being returned.
    289   ///
    290   /// @param[in,out] offset_ptr
    291   ///     A pointer to an offset within the data that will be advanced
    292   ///     by the appropriate number of bytes if the value is extracted
    293   ///     correctly. If the offset is out of bounds or there are not
    294   ///     enough bytes to extract this value, the offset will be left
    295   ///     unmodified.
    296   ///
    297   /// @param[in] size
    298   ///     The size in bytes of the integer to extract.
    299   ///
    300   /// @return
    301   ///     The sign extended signed integer value that was extracted,
    302   ///     or zero on failure.
    303   int64_t getSigned(uint64_t *offset_ptr, uint32_t size) const;
    304 
    305   //------------------------------------------------------------------
    306   /// Extract an pointer from \a *offset_ptr.
    307   ///
    308   /// Extract a single pointer from the data and update the offset
    309   /// pointed to by \a offset_ptr. The size of the extracted pointer
    310   /// is \a getAddressSize(), so the address size has to be
    311   /// set correctly prior to extracting any pointer values.
    312   ///
    313   /// @param[in,out] offset_ptr
    314   ///     A pointer to an offset within the data that will be advanced
    315   ///     by the appropriate number of bytes if the value is extracted
    316   ///     correctly. If the offset is out of bounds or there are not
    317   ///     enough bytes to extract this value, the offset will be left
    318   ///     unmodified.
    319   ///
    320   /// @return
    321   ///     The extracted pointer value as a 64 integer.
    322   uint64_t getAddress(uint64_t *offset_ptr) const {
    323     return getUnsigned(offset_ptr, AddressSize);
    324   }
    325 
    326   /// Extract a pointer-sized unsigned integer from the location given by the
    327   /// cursor. In case of an extraction error, or if the cursor is already in
    328   /// an error state, zero is returned.
    329   uint64_t getAddress(Cursor &C) const { return getUnsigned(C, AddressSize); }
    330 
    331   /// Extract a uint8_t value from \a *offset_ptr.
    332   ///
    333   /// Extract a single uint8_t from the binary data at the offset
    334   /// pointed to by \a offset_ptr, and advance the offset on success.
    335   ///
    336   /// @param[in,out] offset_ptr
    337   ///     A pointer to an offset within the data that will be advanced
    338   ///     by the appropriate number of bytes if the value is extracted
    339   ///     correctly. If the offset is out of bounds or there are not
    340   ///     enough bytes to extract this value, the offset will be left
    341   ///     unmodified.
    342   ///
    343   /// @param[in,out] Err
    344   ///     A pointer to an Error object. Upon return the Error object is set to
    345   ///     indicate the result (success/failure) of the function. If the Error
    346   ///     object is already set when calling this function, no extraction is
    347   ///     performed.
    348   ///
    349   /// @return
    350   ///     The extracted uint8_t value.
    351   uint8_t getU8(uint64_t *offset_ptr, Error *Err = nullptr) const;
    352 
    353   /// Extract a single uint8_t value from the location given by the cursor. In
    354   /// case of an extraction error, or if the cursor is already in an error
    355   /// state, zero is returned.
    356   uint8_t getU8(Cursor &C) const { return getU8(&C.Offset, &C.Err); }
    357 
    358   /// Extract \a count uint8_t values from \a *offset_ptr.
    359   ///
    360   /// Extract \a count uint8_t values from the binary data at the
    361   /// offset pointed to by \a offset_ptr, and advance the offset on
    362   /// success. The extracted values are copied into \a dst.
    363   ///
    364   /// @param[in,out] offset_ptr
    365   ///     A pointer to an offset within the data that will be advanced
    366   ///     by the appropriate number of bytes if the value is extracted
    367   ///     correctly. If the offset is out of bounds or there are not
    368   ///     enough bytes to extract this value, the offset will be left
    369   ///     unmodified.
    370   ///
    371   /// @param[out] dst
    372   ///     A buffer to copy \a count uint8_t values into. \a dst must
    373   ///     be large enough to hold all requested data.
    374   ///
    375   /// @param[in] count
    376   ///     The number of uint8_t values to extract.
    377   ///
    378   /// @return
    379   ///     \a dst if all values were properly extracted and copied,
    380   ///     NULL otherise.
    381   uint8_t *getU8(uint64_t *offset_ptr, uint8_t *dst, uint32_t count) const;
    382 
    383   /// Extract \a Count uint8_t values from the location given by the cursor and
    384   /// store them into the destination buffer. In case of an extraction error, or
    385   /// if the cursor is already in an error state, a nullptr is returned and the
    386   /// destination buffer is left unchanged.
    387   uint8_t *getU8(Cursor &C, uint8_t *Dst, uint32_t Count) const;
    388 
    389   /// Extract \a Count uint8_t values from the location given by the cursor and
    390   /// store them into the destination vector. The vector is resized to fit the
    391   /// extracted data. In case of an extraction error, or if the cursor is
    392   /// already in an error state, the destination vector is left unchanged and
    393   /// cursor is placed into an error state.
    394   void getU8(Cursor &C, SmallVectorImpl<uint8_t> &Dst, uint32_t Count) const {
    395     if (isValidOffsetForDataOfSize(C.Offset, Count))
    396       Dst.resize(Count);
    397 
    398     // This relies on the fact that getU8 will not attempt to write to the
    399     // buffer if isValidOffsetForDataOfSize(C.Offset, Count) is false.
    400     getU8(C, Dst.data(), Count);
    401   }
    402 
    403   //------------------------------------------------------------------
    404   /// Extract a uint16_t value from \a *offset_ptr.
    405   ///
    406   /// Extract a single uint16_t from the binary data at the offset
    407   /// pointed to by \a offset_ptr, and update the offset on success.
    408   ///
    409   /// @param[in,out] offset_ptr
    410   ///     A pointer to an offset within the data that will be advanced
    411   ///     by the appropriate number of bytes if the value is extracted
    412   ///     correctly. If the offset is out of bounds or there are not
    413   ///     enough bytes to extract this value, the offset will be left
    414   ///     unmodified.
    415   ///
    416   /// @param[in,out] Err
    417   ///     A pointer to an Error object. Upon return the Error object is set to
    418   ///     indicate the result (success/failure) of the function. If the Error
    419   ///     object is already set when calling this function, no extraction is
    420   ///     performed.
    421   ///
    422   /// @return
    423   ///     The extracted uint16_t value.
    424   //------------------------------------------------------------------
    425   uint16_t getU16(uint64_t *offset_ptr, Error *Err = nullptr) const;
    426 
    427   /// Extract a single uint16_t value from the location given by the cursor. In
    428   /// case of an extraction error, or if the cursor is already in an error
    429   /// state, zero is returned.
    430   uint16_t getU16(Cursor &C) const { return getU16(&C.Offset, &C.Err); }
    431 
    432   /// Extract \a count uint16_t values from \a *offset_ptr.
    433   ///
    434   /// Extract \a count uint16_t values from the binary data at the
    435   /// offset pointed to by \a offset_ptr, and advance the offset on
    436   /// success. The extracted values are copied into \a dst.
    437   ///
    438   /// @param[in,out] offset_ptr
    439   ///     A pointer to an offset within the data that will be advanced
    440   ///     by the appropriate number of bytes if the value is extracted
    441   ///     correctly. If the offset is out of bounds or there are not
    442   ///     enough bytes to extract this value, the offset will be left
    443   ///     unmodified.
    444   ///
    445   /// @param[out] dst
    446   ///     A buffer to copy \a count uint16_t values into. \a dst must
    447   ///     be large enough to hold all requested data.
    448   ///
    449   /// @param[in] count
    450   ///     The number of uint16_t values to extract.
    451   ///
    452   /// @return
    453   ///     \a dst if all values were properly extracted and copied,
    454   ///     NULL otherise.
    455   uint16_t *getU16(uint64_t *offset_ptr, uint16_t *dst, uint32_t count) const;
    456 
    457   /// Extract a 24-bit unsigned value from \a *offset_ptr and return it
    458   /// in a uint32_t.
    459   ///
    460   /// Extract 3 bytes from the binary data at the offset pointed to by
    461   /// \a offset_ptr, construct a uint32_t from them and update the offset
    462   /// on success.
    463   ///
    464   /// @param[in,out] OffsetPtr
    465   ///     A pointer to an offset within the data that will be advanced
    466   ///     by the 3 bytes if the value is extracted correctly. If the offset
    467   ///     is out of bounds or there are not enough bytes to extract this value,
    468   ///     the offset will be left unmodified.
    469   ///
    470   /// @param[in,out] Err
    471   ///     A pointer to an Error object. Upon return the Error object is set to
    472   ///     indicate the result (success/failure) of the function. If the Error
    473   ///     object is already set when calling this function, no extraction is
    474   ///     performed.
    475   ///
    476   /// @return
    477   ///     The extracted 24-bit value represented in a uint32_t.
    478   uint32_t getU24(uint64_t *OffsetPtr, Error *Err = nullptr) const;
    479 
    480   /// Extract a single 24-bit unsigned value from the location given by the
    481   /// cursor. In case of an extraction error, or if the cursor is already in an
    482   /// error state, zero is returned.
    483   uint32_t getU24(Cursor &C) const { return getU24(&C.Offset, &C.Err); }
    484 
    485   /// Extract a uint32_t value from \a *offset_ptr.
    486   ///
    487   /// Extract a single uint32_t from the binary data at the offset
    488   /// pointed to by \a offset_ptr, and update the offset on success.
    489   ///
    490   /// @param[in,out] offset_ptr
    491   ///     A pointer to an offset within the data that will be advanced
    492   ///     by the appropriate number of bytes if the value is extracted
    493   ///     correctly. If the offset is out of bounds or there are not
    494   ///     enough bytes to extract this value, the offset will be left
    495   ///     unmodified.
    496   ///
    497   /// @param[in,out] Err
    498   ///     A pointer to an Error object. Upon return the Error object is set to
    499   ///     indicate the result (success/failure) of the function. If the Error
    500   ///     object is already set when calling this function, no extraction is
    501   ///     performed.
    502   ///
    503   /// @return
    504   ///     The extracted uint32_t value.
    505   uint32_t getU32(uint64_t *offset_ptr, Error *Err = nullptr) const;
    506 
    507   /// Extract a single uint32_t value from the location given by the cursor. In
    508   /// case of an extraction error, or if the cursor is already in an error
    509   /// state, zero is returned.
    510   uint32_t getU32(Cursor &C) const { return getU32(&C.Offset, &C.Err); }
    511 
    512   /// Extract \a count uint32_t values from \a *offset_ptr.
    513   ///
    514   /// Extract \a count uint32_t values from the binary data at the
    515   /// offset pointed to by \a offset_ptr, and advance the offset on
    516   /// success. The extracted values are copied into \a dst.
    517   ///
    518   /// @param[in,out] offset_ptr
    519   ///     A pointer to an offset within the data that will be advanced
    520   ///     by the appropriate number of bytes if the value is extracted
    521   ///     correctly. If the offset is out of bounds or there are not
    522   ///     enough bytes to extract this value, the offset will be left
    523   ///     unmodified.
    524   ///
    525   /// @param[out] dst
    526   ///     A buffer to copy \a count uint32_t values into. \a dst must
    527   ///     be large enough to hold all requested data.
    528   ///
    529   /// @param[in] count
    530   ///     The number of uint32_t values to extract.
    531   ///
    532   /// @return
    533   ///     \a dst if all values were properly extracted and copied,
    534   ///     NULL otherise.
    535   uint32_t *getU32(uint64_t *offset_ptr, uint32_t *dst, uint32_t count) const;
    536 
    537   /// Extract a uint64_t value from \a *offset_ptr.
    538   ///
    539   /// Extract a single uint64_t from the binary data at the offset
    540   /// pointed to by \a offset_ptr, and update the offset on success.
    541   ///
    542   /// @param[in,out] offset_ptr
    543   ///     A pointer to an offset within the data that will be advanced
    544   ///     by the appropriate number of bytes if the value is extracted
    545   ///     correctly. If the offset is out of bounds or there are not
    546   ///     enough bytes to extract this value, the offset will be left
    547   ///     unmodified.
    548   ///
    549   /// @param[in,out] Err
    550   ///     A pointer to an Error object. Upon return the Error object is set to
    551   ///     indicate the result (success/failure) of the function. If the Error
    552   ///     object is already set when calling this function, no extraction is
    553   ///     performed.
    554   ///
    555   /// @return
    556   ///     The extracted uint64_t value.
    557   uint64_t getU64(uint64_t *offset_ptr, Error *Err = nullptr) const;
    558 
    559   /// Extract a single uint64_t value from the location given by the cursor. In
    560   /// case of an extraction error, or if the cursor is already in an error
    561   /// state, zero is returned.
    562   uint64_t getU64(Cursor &C) const { return getU64(&C.Offset, &C.Err); }
    563 
    564   /// Extract \a count uint64_t values from \a *offset_ptr.
    565   ///
    566   /// Extract \a count uint64_t values from the binary data at the
    567   /// offset pointed to by \a offset_ptr, and advance the offset on
    568   /// success. The extracted values are copied into \a dst.
    569   ///
    570   /// @param[in,out] offset_ptr
    571   ///     A pointer to an offset within the data that will be advanced
    572   ///     by the appropriate number of bytes if the value is extracted
    573   ///     correctly. If the offset is out of bounds or there are not
    574   ///     enough bytes to extract this value, the offset will be left
    575   ///     unmodified.
    576   ///
    577   /// @param[out] dst
    578   ///     A buffer to copy \a count uint64_t values into. \a dst must
    579   ///     be large enough to hold all requested data.
    580   ///
    581   /// @param[in] count
    582   ///     The number of uint64_t values to extract.
    583   ///
    584   /// @return
    585   ///     \a dst if all values were properly extracted and copied,
    586   ///     NULL otherise.
    587   uint64_t *getU64(uint64_t *offset_ptr, uint64_t *dst, uint32_t count) const;
    588 
    589   /// Extract a signed LEB128 value from \a *offset_ptr.
    590   ///
    591   /// Extracts an signed LEB128 number from this object's data
    592   /// starting at the offset pointed to by \a offset_ptr. The offset
    593   /// pointed to by \a offset_ptr will be updated with the offset of
    594   /// the byte following the last extracted byte.
    595   ///
    596   /// @param[in,out] OffsetPtr
    597   ///     A pointer to an offset within the data that will be advanced
    598   ///     by the appropriate number of bytes if the value is extracted
    599   ///     correctly. If the offset is out of bounds or there are not
    600   ///     enough bytes to extract this value, the offset will be left
    601   ///     unmodified.
    602   ///
    603   /// @param[in,out] Err
    604   ///     A pointer to an Error object. Upon return the Error object is set to
    605   ///     indicate the result (success/failure) of the function. If the Error
    606   ///     object is already set when calling this function, no extraction is
    607   ///     performed.
    608   ///
    609   /// @return
    610   ///     The extracted signed integer value.
    611   int64_t getSLEB128(uint64_t *OffsetPtr, Error *Err = nullptr) const;
    612 
    613   /// Extract an signed LEB128 value from the location given by the cursor.
    614   /// In case of an extraction error, or if the cursor is already in an error
    615   /// state, zero is returned.
    616   int64_t getSLEB128(Cursor &C) const { return getSLEB128(&C.Offset, &C.Err); }
    617 
    618   /// Extract a unsigned LEB128 value from \a *offset_ptr.
    619   ///
    620   /// Extracts an unsigned LEB128 number from this object's data
    621   /// starting at the offset pointed to by \a offset_ptr. The offset
    622   /// pointed to by \a offset_ptr will be updated with the offset of
    623   /// the byte following the last extracted byte.
    624   ///
    625   /// @param[in,out] offset_ptr
    626   ///     A pointer to an offset within the data that will be advanced
    627   ///     by the appropriate number of bytes if the value is extracted
    628   ///     correctly. If the offset is out of bounds or there are not
    629   ///     enough bytes to extract this value, the offset will be left
    630   ///     unmodified.
    631   ///
    632   /// @param[in,out] Err
    633   ///     A pointer to an Error object. Upon return the Error object is set to
    634   ///     indicate the result (success/failure) of the function. If the Error
    635   ///     object is already set when calling this function, no extraction is
    636   ///     performed.
    637   ///
    638   /// @return
    639   ///     The extracted unsigned integer value.
    640   uint64_t getULEB128(uint64_t *offset_ptr, llvm::Error *Err = nullptr) const;
    641 
    642   /// Extract an unsigned LEB128 value from the location given by the cursor.
    643   /// In case of an extraction error, or if the cursor is already in an error
    644   /// state, zero is returned.
    645   uint64_t getULEB128(Cursor &C) const { return getULEB128(&C.Offset, &C.Err); }
    646 
    647   /// Advance the Cursor position by the given number of bytes. No-op if the
    648   /// cursor is in an error state.
    649   void skip(Cursor &C, uint64_t Length) const;
    650 
    651   /// Return true iff the cursor is at the end of the buffer, regardless of the
    652   /// error state of the cursor. The only way both eof and error states can be
    653   /// true is if one attempts a read while the cursor is at the very end of the
    654   /// data buffer.
    655   bool eof(const Cursor &C) const { return size() == C.Offset; }
    656 
    657   /// Test the validity of \a offset.
    658   ///
    659   /// @return
    660   ///     \b true if \a offset is a valid offset into the data in this
    661   ///     object, \b false otherwise.
    662   bool isValidOffset(uint64_t offset) const { return size() > offset; }
    663 
    664   /// Test the availability of \a length bytes of data from \a offset.
    665   ///
    666   /// @return
    667   ///     \b true if \a offset is a valid offset and there are \a
    668   ///     length bytes available at that offset, \b false otherwise.
    669   bool isValidOffsetForDataOfSize(uint64_t offset, uint64_t length) const {
    670     return offset + length >= offset && isValidOffset(offset + length - 1);
    671   }
    672 
    673   /// Test the availability of enough bytes of data for a pointer from
    674   /// \a offset. The size of a pointer is \a getAddressSize().
    675   ///
    676   /// @return
    677   ///     \b true if \a offset is a valid offset and there are enough
    678   ///     bytes for a pointer available at that offset, \b false
    679   ///     otherwise.
    680   bool isValidOffsetForAddress(uint64_t offset) const {
    681     return isValidOffsetForDataOfSize(offset, AddressSize);
    682   }
    683 
    684   /// Return the number of bytes in the underlying buffer.
    685   size_t size() const { return Data.size(); }
    686 
    687 protected:
    688   // Make it possible for subclasses to access these fields without making them
    689   // public.
    690   static uint64_t &getOffset(Cursor &C) { return C.Offset; }
    691   static Error &getError(Cursor &C) { return C.Err; }
    692 
    693 private:
    694   /// If it is possible to read \a Size bytes at offset \a Offset, returns \b
    695   /// true. Otherwise, returns \b false. If \a E is not nullptr, also sets the
    696   /// error object to indicate an error.
    697   bool prepareRead(uint64_t Offset, uint64_t Size, Error *E) const;
    698 
    699   template <typename T> T getU(uint64_t *OffsetPtr, Error *Err) const;
    700   template <typename T>
    701   T *getUs(uint64_t *OffsetPtr, T *Dst, uint32_t Count, Error *Err) const;
    702 };
    703 
    704 } // namespace llvm
    705 
    706 #endif
    707