AsmWriter/Bitcode: MDGlobalVariable

[oota-llvm.git] / include / llvm / Bitcode / BitstreamReader.h
diff --git a/include/llvm/Bitcode/BitstreamReader.h b/include/llvm/Bitcode/BitstreamReader.h

index b42f559e13b44f57a9f0fb797028f6182b36491c..bc3e48a43416b2f5347e1d701c8140a524db9aec 100644 (file)
--- a/include/llvm/Bitcode/BitstreamReader.h
+++ b/include/llvm/Bitcode/BitstreamReader.h
@@ -17,7 +17,7 @@
  
  #include "llvm/Bitcode/BitCodes.h"
  #include "llvm/Support/Endian.h"
-#include "llvm/Support/StreamableMemoryObject.h"
+#include "llvm/Support/StreamingMemoryObject.h"
  #include <climits>
  #include <string>
  #include <vector>
@@ -42,7 +42,7 @@ public:
      std::vector<std::pair<unsigned, std::string> > RecordNames;
    };
  private:
-  std::unique_ptr<StreamableMemoryObject> BitcodeBytes;
+  std::unique_ptr<MemoryObject> BitcodeBytes;
  
    std::vector<BlockInfo> BlockInfoRecords;
  
@@ -61,9 +61,8 @@ public:
      init(Start, End);
    }
  
-  BitstreamReader(StreamableMemoryObject *bytes) : IgnoreBlockInfoNames(true) {
-    BitcodeBytes.reset(bytes);
-  }
+  BitstreamReader(std::unique_ptr<MemoryObject> BitcodeBytes)
+      : BitcodeBytes(std::move(BitcodeBytes)), IgnoreBlockInfoNames(true) {}
  
    BitstreamReader(BitstreamReader &&Other) {
      *this = std::move(Other);
@@ -82,7 +81,7 @@ public:
      BitcodeBytes.reset(getNonStreamedMemoryObject(Start, End));
    }
  
-  StreamableMemoryObject &getBitcodeBytes() { return *BitcodeBytes; }
+  MemoryObject &getBitcodeBytes() { return *BitcodeBytes; }
  
    /// This is called by clients that want block/record name information.
    void CollectBlockInfoNames() { IgnoreBlockInfoNames = false; }
@@ -169,16 +168,19 @@ class BitstreamCursor {
    BitstreamReader *BitStream;
    size_t NextChar;
  
+  // The size of the bicode. 0 if we don't know it yet.
+  size_t Size;
+
    /// This is the current data we have pulled from the stream but have not
    /// returned to the client. This is specifically and intentionally defined to
    /// follow the word size of the host machine for efficiency. We use word_t in
    /// places that are aware of this to make it perfectly explicit what is going
    /// on.
-  typedef uint32_t word_t;
+  typedef size_t word_t;
    word_t CurWord;
  
    /// This is the number of bits in CurWord that are valid. This is always from
-  /// [0...31/63] inclusive (depending on word size).
+  /// [0...bits_of(size_t)-1] inclusive.
    unsigned BitsInCurWord;
  
    // This is the declared size of code values used for the current block, in
@@ -199,45 +201,35 @@ class BitstreamCursor {
  
  
  public:
-  BitstreamCursor() : BitStream(nullptr), NextChar(0) {}
+  BitstreamCursor() { init(nullptr); }
  
-  explicit BitstreamCursor(BitstreamReader &R) : BitStream(&R) {
-    NextChar = 0;
-    CurWord = 0;
-    BitsInCurWord = 0;
-    CurCodeSize = 2;
-  }
+  explicit BitstreamCursor(BitstreamReader &R) { init(&R); }
  
-  void init(BitstreamReader &R) {
+  void init(BitstreamReader *R) {
      freeState();
  
-    BitStream = &R;
+    BitStream = R;
      NextChar = 0;
-    CurWord = 0;
+    Size = 0;
      BitsInCurWord = 0;
      CurCodeSize = 2;
    }
  
    void freeState();
  
-  bool isEndPos(size_t pos) {
-    return BitStream->getBitcodeBytes().isObjectEnd(static_cast<uint64_t>(pos));
-  }
-
    bool canSkipToPos(size_t pos) const {
      // pos can be skipped to if it is a valid address or one byte past the end.
      return pos == 0 || BitStream->getBitcodeBytes().isValidAddress(
          static_cast<uint64_t>(pos - 1));
    }
  
-  uint32_t getWord(size_t pos) {
-    uint8_t buf[4] = { 0xFF, 0xFF, 0xFF, 0xFF };
-    BitStream->getBitcodeBytes().readBytes(pos, sizeof(buf), buf);
-    return *reinterpret_cast<support::ulittle32_t *>(buf);
-  }
-
    bool AtEndOfStream() {
-    return BitsInCurWord == 0 && isEndPos(NextChar);
+    if (BitsInCurWord != 0)
+      return false;
+    if (Size != 0)
+      return Size == NextChar;
+    fillCurWord();
+    return BitsInCurWord == 0;
    }
  
    /// Return the number of bits used to encode an abbrev #.
@@ -316,77 +308,75 @@ public:
      // Move the cursor to the right word.
      NextChar = ByteNo;
      BitsInCurWord = 0;
-    CurWord = 0;
  
      // Skip over any bits that are already consumed.
-    if (WordBitNo) {
-      if (sizeof(word_t) > 4)
-        Read64(WordBitNo);
-      else
-        Read(WordBitNo);
+    if (WordBitNo)
+      Read(WordBitNo);
+  }
+
+  void fillCurWord() {
+    if (Size != 0 && NextChar >= (unsigned)Size)
+      report_fatal_error("Unexpected end of file");
+
+    // Read the next word from the stream.
+    uint8_t Array[sizeof(word_t)] = {0};
+
+    uint64_t BytesRead =
+        BitStream->getBitcodeBytes().readBytes(Array, sizeof(Array), NextChar);
+
+    // If we run out of data, stop at the end of the stream.
+    if (BytesRead == 0) {
+      Size = NextChar;
+      return;
      }
+
+    CurWord =
+        support::endian::read<word_t, support::little, support::unaligned>(
+            Array);
+    NextChar += BytesRead;
+    BitsInCurWord = BytesRead * 8;
    }
  
+  word_t Read(unsigned NumBits) {
+    static const unsigned BitsInWord = sizeof(word_t) * 8;
+
+    assert(NumBits && NumBits <= BitsInWord &&
+           "Cannot return zero or more than BitsInWord bits!");
  
-  uint32_t Read(unsigned NumBits) {
-    assert(NumBits && NumBits <= 32 &&
-           "Cannot return zero or more than 32 bits!");
+    static const unsigned Mask = sizeof(word_t) > 4 ? 0x3f : 0x1f;
  
      // If the field is fully contained by CurWord, return it quickly.
      if (BitsInCurWord >= NumBits) {
-      uint32_t R = uint32_t(CurWord) & (~0U >> (32-NumBits));
-      CurWord >>= NumBits;
+      word_t R = CurWord & (~word_t(0) >> (BitsInWord - NumBits));
+
+      // Use a mask to avoid undefined behavior.
+      CurWord >>= (NumBits & Mask);
+
        BitsInCurWord -= NumBits;
        return R;
      }
  
-    // If we run out of data, stop at the end of the stream.
-    if (isEndPos(NextChar)) {
-      CurWord = 0;
-      BitsInCurWord = 0;
-      return 0;
-    }
-
-    uint32_t R = uint32_t(CurWord);
+    word_t R = BitsInCurWord ? CurWord : 0;
+    unsigned BitsLeft = NumBits - BitsInCurWord;
  
-    // Read the next word from the stream.
-    uint8_t Array[sizeof(word_t)] = {0};
+    fillCurWord();
  
-    BitStream->getBitcodeBytes().readBytes(NextChar, sizeof(Array), Array);
-
-    // Handle big-endian byte-swapping if necessary.
-    support::detail::packed_endian_specific_integral
-      <word_t, support::little, support::unaligned> EndianValue;
-    memcpy(&EndianValue, Array, sizeof(Array));
+    // If we run out of data, stop at the end of the stream.
+    if (BitsLeft > BitsInCurWord)
+      return 0;
  
-    CurWord = EndianValue;
+    word_t R2 = CurWord & (~word_t(0) >> (BitsInWord - BitsLeft));
  
-    NextChar += sizeof(word_t);
+    // Use a mask to avoid undefined behavior.
+    CurWord >>= (BitsLeft & Mask);
  
-    // Extract NumBits-BitsInCurWord from what we just read.
-    unsigned BitsLeft = NumBits-BitsInCurWord;
+    BitsInCurWord -= BitsLeft;
  
-    // Be careful here, BitsLeft is in the range [1..32]/[1..64] inclusive.
-    R |= uint32_t((CurWord & (word_t(~0ULL) >> (sizeof(word_t)*8-BitsLeft)))
-                    << BitsInCurWord);
+    R |= R2 << (NumBits - BitsLeft);
  
-    // BitsLeft bits have just been used up from CurWord.  BitsLeft is in the
-    // range [1..32]/[1..64] so be careful how we shift.
-    if (BitsLeft != sizeof(word_t)*8)
-      CurWord >>= BitsLeft;
-    else
-      CurWord = 0;
-    BitsInCurWord = sizeof(word_t)*8-BitsLeft;
      return R;
    }
  
-  uint64_t Read64(unsigned NumBits) {
-    if (NumBits <= 32) return Read(NumBits);
-
-    uint64_t V = Read(32);
-    return V | (uint64_t)Read(NumBits-32) << 32;
-  }
-
    uint32_t ReadVBR(unsigned NumBits) {
      uint32_t Piece = Read(NumBits);
      if ((Piece & (1U << (NumBits-1))) == 0)
@@ -437,7 +427,6 @@ private:
      }
  
      BitsInCurWord = 0;
-    CurWord = 0;
    }
  public:
  
@@ -501,19 +490,12 @@ private:
    // Record Processing
    //===--------------------------------------------------------------------===//
  
-private:
-  void readAbbreviatedLiteral(const BitCodeAbbrevOp &Op,
-                              SmallVectorImpl<uint64_t> &Vals);
-  void readAbbreviatedField(const BitCodeAbbrevOp &Op,
-                            SmallVectorImpl<uint64_t> &Vals);
-  void skipAbbreviatedField(const BitCodeAbbrevOp &Op);
-
  public:
-
    /// Return the abbreviation for the specified AbbrevId.
    const BitCodeAbbrev *getAbbrev(unsigned AbbrevID) {
-    unsigned AbbrevNo = AbbrevID-bitc::FIRST_APPLICATION_ABBREV;
-    assert(AbbrevNo < CurAbbrevs.size() && "Invalid abbrev #!");
+    unsigned AbbrevNo = AbbrevID - bitc::FIRST_APPLICATION_ABBREV;
+    if (AbbrevNo >= CurAbbrevs.size())
+      report_fatal_error("Invalid abbrev number");
      return CurAbbrevs[AbbrevNo].get();
    }