Restore "Function bitcode index in Value Symbol Table and lazy reading support"

[oota-llvm.git] / include / llvm / Bitcode / BitstreamReader.h
diff --git a/include/llvm/Bitcode/BitstreamReader.h b/include/llvm/Bitcode/BitstreamReader.h

index 05623fe8e71f55d0652fc4e1720aba90d10ac80f..c0cf6cde887f12d032256a9ffb4472e8bd0dbfc0 100644 (file)
--- a/include/llvm/Bitcode/BitstreamReader.h
+++ b/include/llvm/Bitcode/BitstreamReader.h
@@ -24,8 +24,6 @@
  
  namespace llvm {
  
-class Deserializer;
-
  /// This class is used to read from an LLVM bitcode stream, maintaining
  /// information that is global to decoding the entire file. While a file is
  /// being read, multiple cursors can be independently advanced or skipped around
@@ -50,8 +48,8 @@ private:
    /// information in the BlockInfo block. Only llvm-bcanalyzer uses this.
    bool IgnoreBlockInfoNames;
  
-  BitstreamReader(const BitstreamReader&) LLVM_DELETED_FUNCTION;
-  void operator=(const BitstreamReader&) LLVM_DELETED_FUNCTION;
+  BitstreamReader(const BitstreamReader&) = delete;
+  void operator=(const BitstreamReader&) = delete;
  public:
    BitstreamReader() : IgnoreBlockInfoNames(true) {
    }
@@ -61,9 +59,8 @@ public:
      init(Start, End);
    }
  
-  BitstreamReader(MemoryObject *bytes) : IgnoreBlockInfoNames(true) {
-    BitcodeBytes.reset(bytes);
-  }
+  BitstreamReader(std::unique_ptr<MemoryObject> BitcodeBytes)
+      : BitcodeBytes(std::move(BitcodeBytes)), IgnoreBlockInfoNames(true) {}
  
    BitstreamReader(BitstreamReader &&Other) {
      *this = std::move(Other);
@@ -116,7 +113,7 @@ public:
        return *const_cast<BlockInfo*>(BI);
  
      // Otherwise, add a new record.
-    BlockInfoRecords.push_back(BlockInfo());
+    BlockInfoRecords.emplace_back();
      BlockInfoRecords.back().BlockID = BlockID;
      return BlockInfoRecords.back();
    }
@@ -165,20 +162,22 @@ struct BitstreamEntry {
  /// Unlike iterators, BitstreamCursors are heavy-weight objects that should not
  /// be passed by value.
  class BitstreamCursor {
-  friend class Deserializer;
    BitstreamReader *BitStream;
    size_t NextChar;
  
+  // The size of the bicode. 0 if we don't know it yet.
+  size_t Size;
+
    /// This is the current data we have pulled from the stream but have not
    /// returned to the client. This is specifically and intentionally defined to
    /// follow the word size of the host machine for efficiency. We use word_t in
    /// places that are aware of this to make it perfectly explicit what is going
    /// on.
-  typedef uint32_t word_t;
+  typedef size_t word_t;
    word_t CurWord;
  
    /// This is the number of bits in CurWord that are valid. This is always from
-  /// [0...31/63] inclusive (depending on word size).
+  /// [0...bits_of(size_t)-1] inclusive.
    unsigned BitsInCurWord;
  
    // This is the declared size of code values used for the current block, in
@@ -199,6 +198,8 @@ class BitstreamCursor {
  
  
  public:
+  static const size_t MaxChunkSize = sizeof(word_t) * 8;
+
    BitstreamCursor() { init(nullptr); }
  
    explicit BitstreamCursor(BitstreamReader &R) { init(&R); }
@@ -208,17 +209,13 @@ public:
  
      BitStream = R;
      NextChar = 0;
-    CurWord = 0;
+    Size = 0;
      BitsInCurWord = 0;
      CurCodeSize = 2;
    }
  
    void freeState();
  
-  bool isEndPos(size_t pos) {
-    return BitStream->getBitcodeBytes().isObjectEnd(static_cast<uint64_t>(pos));
-  }
-
    bool canSkipToPos(size_t pos) const {
      // pos can be skipped to if it is a valid address or one byte past the end.
      return pos == 0 || BitStream->getBitcodeBytes().isValidAddress(
@@ -226,7 +223,12 @@ public:
    }
  
    bool AtEndOfStream() {
-    return BitsInCurWord == 0 && isEndPos(NextChar);
+    if (BitsInCurWord != 0)
+      return false;
+    if (Size != 0)
+      return Size == NextChar;
+    fillCurWord();
+    return BitsInCurWord == 0;
    }
  
    /// Return the number of bits used to encode an abbrev #.
@@ -255,8 +257,8 @@ public:
      AF_DontAutoprocessAbbrevs = 2
    };
  
-      /// Advance the current bitstream, returning the next entry in the stream.
-      BitstreamEntry advance(unsigned Flags = 0) {
+  /// Advance the current bitstream, returning the next entry in the stream.
+  BitstreamEntry advance(unsigned Flags = 0) {
      while (1) {
        unsigned Code = ReadCode();
        if (Code == bitc::END_BLOCK) {
@@ -298,82 +300,82 @@ public:
  
    /// Reset the stream to the specified bit number.
    void JumpToBit(uint64_t BitNo) {
-    uintptr_t ByteNo = uintptr_t(BitNo/8) & ~(sizeof(word_t)-1);
+    size_t ByteNo = size_t(BitNo/8) & ~(sizeof(word_t)-1);
      unsigned WordBitNo = unsigned(BitNo & (sizeof(word_t)*8-1));
      assert(canSkipToPos(ByteNo) && "Invalid location");
  
      // Move the cursor to the right word.
      NextChar = ByteNo;
      BitsInCurWord = 0;
-    CurWord = 0;
  
      // Skip over any bits that are already consumed.
-    if (WordBitNo) {
-      if (sizeof(word_t) > 4)
-        Read64(WordBitNo);
-      else
-        Read(WordBitNo);
-    }
+    if (WordBitNo)
+      Read(WordBitNo);
    }
  
+  void fillCurWord() {
+    if (Size != 0 && NextChar >= Size)
+      report_fatal_error("Unexpected end of file");
  
-  uint32_t Read(unsigned NumBits) {
-    assert(NumBits && NumBits <= 32 &&
-           "Cannot return zero or more than 32 bits!");
+    // Read the next word from the stream.
+    uint8_t Array[sizeof(word_t)] = {0};
  
-    // If the field is fully contained by CurWord, return it quickly.
-    if (BitsInCurWord >= NumBits) {
-      uint32_t R = uint32_t(CurWord) & (~0U >> (32-NumBits));
-      CurWord >>= NumBits;
-      BitsInCurWord -= NumBits;
-      return R;
-    }
+    uint64_t BytesRead =
+        BitStream->getBitcodeBytes().readBytes(Array, sizeof(Array), NextChar);
  
      // If we run out of data, stop at the end of the stream.
-    if (isEndPos(NextChar)) {
+    if (BytesRead == 0) {
        CurWord = 0;
        BitsInCurWord = 0;
-      return 0;
+      Size = NextChar;
+      return;
      }
  
-    uint32_t R = uint32_t(CurWord);
+    CurWord =
+        support::endian::read<word_t, support::little, support::unaligned>(
+            Array);
+    NextChar += BytesRead;
+    BitsInCurWord = BytesRead * 8;
+  }
  
-    // Read the next word from the stream.
-    uint8_t Array[sizeof(word_t)] = {0};
+  word_t Read(unsigned NumBits) {
+    static const unsigned BitsInWord = MaxChunkSize;
  
-    BitStream->getBitcodeBytes().readBytes(Array, sizeof(Array), NextChar);
+    assert(NumBits && NumBits <= BitsInWord &&
+           "Cannot return zero or more than BitsInWord bits!");
  
-    // Handle big-endian byte-swapping if necessary.
-    support::detail::packed_endian_specific_integral
-      <word_t, support::little, support::unaligned> EndianValue;
-    memcpy(&EndianValue, Array, sizeof(Array));
+    static const unsigned Mask = sizeof(word_t) > 4 ? 0x3f : 0x1f;
  
-    CurWord = EndianValue;
+    // If the field is fully contained by CurWord, return it quickly.
+    if (BitsInCurWord >= NumBits) {
+      word_t R = CurWord & (~word_t(0) >> (BitsInWord - NumBits));
  
-    NextChar += sizeof(word_t);
+      // Use a mask to avoid undefined behavior.
+      CurWord >>= (NumBits & Mask);
  
-    // Extract NumBits-BitsInCurWord from what we just read.
-    unsigned BitsLeft = NumBits-BitsInCurWord;
+      BitsInCurWord -= NumBits;
+      return R;
+    }
  
-    // Be careful here, BitsLeft is in the range [1..32]/[1..64] inclusive.
-    R |= uint32_t((CurWord & (word_t(~0ULL) >> (sizeof(word_t)*8-BitsLeft)))
-                    << BitsInCurWord);
+    word_t R = BitsInCurWord ? CurWord : 0;
+    unsigned BitsLeft = NumBits - BitsInCurWord;
  
-    // BitsLeft bits have just been used up from CurWord.  BitsLeft is in the
-    // range [1..32]/[1..64] so be careful how we shift.
-    if (BitsLeft != sizeof(word_t)*8)
-      CurWord >>= BitsLeft;
-    else
-      CurWord = 0;
-    BitsInCurWord = sizeof(word_t)*8-BitsLeft;
-    return R;
-  }
+    fillCurWord();
+
+    // If we run out of data, stop at the end of the stream.
+    if (BitsLeft > BitsInCurWord)
+      return 0;
+
+    word_t R2 = CurWord & (~word_t(0) >> (BitsInWord - BitsLeft));
+
+    // Use a mask to avoid undefined behavior.
+    CurWord >>= (BitsLeft & Mask);
+
+    BitsInCurWord -= BitsLeft;
  
-  uint64_t Read64(unsigned NumBits) {
-    if (NumBits <= 32) return Read(NumBits);
+    R |= R2 << (NumBits - BitsLeft);
  
-    uint64_t V = Read(32);
-    return V | (uint64_t)Read(NumBits-32) << 32;
+    return R;
    }
  
    uint32_t ReadVBR(unsigned NumBits) {
@@ -426,7 +428,6 @@ private:
      }
  
      BitsInCurWord = 0;
-    CurWord = 0;
    }
  public:
  
@@ -490,19 +491,12 @@ private:
    // Record Processing
    //===--------------------------------------------------------------------===//
  
-private:
-  void readAbbreviatedLiteral(const BitCodeAbbrevOp &Op,
-                              SmallVectorImpl<uint64_t> &Vals);
-  void readAbbreviatedField(const BitCodeAbbrevOp &Op,
-                            SmallVectorImpl<uint64_t> &Vals);
-  void skipAbbreviatedField(const BitCodeAbbrevOp &Op);
-
  public:
-
    /// Return the abbreviation for the specified AbbrevId.
    const BitCodeAbbrev *getAbbrev(unsigned AbbrevID) {
-    unsigned AbbrevNo = AbbrevID-bitc::FIRST_APPLICATION_ABBREV;
-    assert(AbbrevNo < CurAbbrevs.size() && "Invalid abbrev #!");
+    unsigned AbbrevNo = AbbrevID - bitc::FIRST_APPLICATION_ABBREV;
+    if (AbbrevNo >= CurAbbrevs.size())
+      report_fatal_error("Invalid abbrev number");
      return CurAbbrevs[AbbrevNo].get();
    }