include/llvm/Bitcode/BitstreamReader.h - Issue 8393017: Bitcode streaming - Code Review

Chromium Code Reviews

chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out

(784)

My Issues | Starred Open | Closed | All

Unified Diff: include/llvm/Bitcode/BitstreamReader.h

Issue 8393017: Bitcode streaming (Closed)

Patch Set: put destructors back, fix trailing whitespace Created 9 years, 1 month ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

« no previous file with comments | « no previous file | include/llvm/Bitcode/ReaderWriter.h » ('j') | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

Index: include/llvm/Bitcode/BitstreamReader.h

diff --git a/include/llvm/Bitcode/BitstreamReader.h b/include/llvm/Bitcode/BitstreamReader.h

index 0437f53134dc6cbc237c512467f2a57f0b6c4048..a1b6ed5f97048bb78588dae0474d2afed0093e54 100644

--- a/include/llvm/Bitcode/BitstreamReader.h

+++ b/include/llvm/Bitcode/BitstreamReader.h

@@ -15,14 +15,211 @@

#ifndef BITSTREAM_READER_H

#define BITSTREAM_READER_H

+#include "llvm/ADT/OwningPtr.h"

#include "llvm/Bitcode/BitCodes.h"

+#include "llvm/Support/BitcodeStream.h"

#include <climits>

#include <string>

#include <vector>

namespace llvm {

- class Deserializer;

+class Deserializer;

+

+class BitstreamBytes { // Abstract, non-copyable interface for reading a stream's bytes by position.

+public:

+ BitstreamBytes() { }

+

+ virtual ~BitstreamBytes() {}

+

+ // Returns true if Pos is the ending stream position (one byte past the last

+ // valid byte).

+ // May block until Pos bytes have been read, or EOF is reached.

+ virtual bool isEndPos(size_t Pos) = 0;

+

+ // Returns the ending stream position (one byte past the last valid byte).

+ // May block until EOF is reached.

+ virtual size_t getEndPos() = 0;

+

+ // Returns true if Pos lies within the stream or is exactly one past the end.

+ // May block until Pos bytes have been read, or EOF is reached.

+ virtual bool canSkipToPos(size_t Pos) = 0;

+

+ // Returns the in-memory address of the byte at offset Pos from the stream start.

+ // May block until Pos bytes have been read, or EOF is reached.

+ // Note that the first byte past the end may be skipped to, but may not have

+ // its address taken.

+ virtual const unsigned char *addressOf(size_t Pos) = 0;

+

+ // Returns the byte at offset Pos from the beginning of the stream.

+ // May block until Pos bytes have been read, or EOF is reached.

+ virtual unsigned char getByte(size_t Pos) = 0;

+

+ // Returns the 32-bit word that starts at Pos from the beginning of the stream.

+ // (Pos is still counted in bytes, as in the rest of the methods)

+ // May block until the bytes through Pos + 3 have been read, or EOF is reached.

+ virtual uint32_t getWord(size_t Pos) = 0;

+

+private:

+ BitstreamBytes(const BitstreamBytes&); // DO NOT IMPLEMENT

+ void operator=(const BitstreamBytes&); // DO NOT IMPLEMENT

+};

+

+// MemoryBitstreamBytes - BitstreamBytes implementation over a caller-supplied
+// in-memory range [Start, End). Only the two pointers are stored; the bytes
+// are neither copied nor freed by this class.
+class MemoryBitstreamBytes : public BitstreamBytes {
+public:
+  // Creates an empty view. Both pointers are nulled so that the size
+  // computation below is well defined (null - null == 0) instead of reading
+  // indeterminate pointer values.
+  MemoryBitstreamBytes() : FirstChar(0), LastChar(0) { }
+
+  // Creates a view over [Start, End); End points one byte past the last valid
+  // byte.
+  MemoryBitstreamBytes(const unsigned char *Start, const unsigned char *End)
+    : FirstChar(Start), LastChar(End) {
+  }
+
+  virtual ~MemoryBitstreamBytes() {}
+
+  // Returns true if Pos is exactly one byte past the last valid byte.
+  virtual bool isEndPos(size_t Pos) {
+    return Pos == getSize();
+  }
+
+  // Returns the position one byte past the last valid byte, i.e. the size of
+  // the buffer.
+  virtual size_t getEndPos() {
+    return getSize();
+  }
+
+  // Returns true if Pos is inside the buffer or exactly one past its end.
+  virtual bool canSkipToPos(size_t Pos) {
+    return Pos <= getSize();
+  }
+
+  // Returns the address of the byte at Pos. The end position itself may not
+  // have its address taken (asserted).
+  virtual const unsigned char *addressOf(size_t Pos) {
+    assert(canSkipToPos(Pos) && Pos != getSize()
+           && "taking address outside of buffer");
+    return FirstChar + Pos;
+  }
+
+  // Returns the byte at Pos, which must be strictly inside the buffer
+  // (asserted).
+  virtual unsigned char getByte(size_t Pos) {
+    assert(canSkipToPos(Pos) && Pos != getSize()
+           && "indexing outside of buffer");
+    return *(FirstChar + Pos);
+  }
+
+  // Returns the 32-bit word assembled from the four bytes at Pos..Pos+3, with
+  // the byte at Pos as the least significant byte. All four bytes must be
+  // inside the buffer (asserted).
+  virtual uint32_t getWord(size_t Pos) {
+    assert(canSkipToPos(Pos + 3) &&
+           (Pos + 3) != getSize() &&
+           "indexing outside of buffer");
+    const unsigned char *p = FirstChar + Pos;
+    // Widen each byte to uint32_t before shifting so that a top byte >= 0x80
+    // is never shifted into the sign bit of a promoted int.
+    return (static_cast<uint32_t>(p[0]) <<  0) |
+           (static_cast<uint32_t>(p[1]) <<  8) |
+           (static_cast<uint32_t>(p[2]) << 16) |
+           (static_cast<uint32_t>(p[3]) << 24);
+  }
+
+private:
+  const unsigned char *FirstChar;
+  const unsigned char *LastChar;
+
+  // Number of bytes in [FirstChar, LastChar).
+  size_t getSize() const {
+    return static_cast<size_t>(LastChar-FirstChar);
+  }
+
+  MemoryBitstreamBytes(const MemoryBitstreamBytes&); // DO NOT IMPLEMENT
+  void operator=(const MemoryBitstreamBytes&); // DO NOT IMPLEMENT
+};

+

+// LazyBitstreamBytes - BitstreamBytes implementation that pulls bytes from a
+// BitcodeStreamer on demand, kChunkSize bytes at a time, and keeps everything
+// read so far in a growing buffer. The streamer passed to the constructor is
+// held in an OwningPtr.
+//
+// Buffer layout: Bytes holds BytesSkipped dropped leading bytes followed by
+// BytesRead addressable bytes; stream position Pos lives at
+// Bytes[Pos + BytesSkipped].
+class LazyBitstreamBytes : public BitstreamBytes {
+public:
+  // Takes the streamer and eagerly reads the first chunk from it.
+  LazyBitstreamBytes(BitcodeStreamer *streamer) :
+    Bytes(kChunkSize), Streamer(streamer), BytesRead(0), BytesSkipped(0),
+    BitcodeSize(0), EOFReached(false) {
+    BytesRead = streamer->GetBytes(&Bytes[0], kChunkSize);
+  }
+
+  virtual ~LazyBitstreamBytes() {}
+
+  // Returns true if Pos is the end position. When the size is already known
+  // this answers without fetching; otherwise it fetches up to Pos first.
+  virtual bool isEndPos(size_t Pos) {
+    if (BitcodeSize) return Pos == BitcodeSize;
+    fetchToPos(Pos);
+    return Pos == BytesRead;
+  }
+
+  // Returns the end position. If the size is not yet known, reads the stream
+  // chunk by chunk until fetchToPos reports that no more bytes are available.
+  virtual size_t getEndPos() {
+    if (BitcodeSize) return BitcodeSize;
+    size_t pos = BytesRead + kChunkSize;
+    // keep fetching until we run out of bytes
+    while (fetchToPos(pos)) pos += kChunkSize;
+    return BitcodeSize;
+  }
+
+  // If the bitcode has a header, then its size is known, and we don't have to
+  // block until we actually want to read it.
+  virtual bool canSkipToPos(size_t Pos) {
+    if (BitcodeSize && Pos <= BitcodeSize) return true;
+    return fetchToPos(Pos) || Pos == BitcodeSize;
+  }
+
+  // Not supported for streamed bitcode: always asserts and returns NULL.
+  virtual const unsigned char *addressOf(size_t Pos) {
+    assert(0 && "addressOf inside streaming bitstreams not allowed");
+    return NULL;
+  }
+
+  // Returns the byte at Pos, fetching from the streamer first if needed.
+  virtual unsigned char getByte(size_t Pos) {
+    fetchToPos(Pos);
+    assert(Pos < BytesRead && "indexing outside of buffer");
+    return Bytes[Pos + BytesSkipped];
+  }
+
+  // Returns the 32-bit word assembled from the four bytes at Pos..Pos+3, with
+  // the byte at Pos as the least significant byte, fetching first if needed.
+  virtual uint32_t getWord(size_t Pos) {
+    fetchToPos(Pos + 3);
+    assert(Pos + 3 < BytesRead && "indexing outside of buffer");
+    size_t RealPos = Pos + BytesSkipped;
+    // Widen each byte to uint32_t before shifting so that a top byte >= 0x80
+    // is never shifted into the sign bit of a promoted int.
+    return (static_cast<uint32_t>(Bytes[RealPos + 0]) <<  0) |
+           (static_cast<uint32_t>(Bytes[RealPos + 1]) <<  8) |
+           (static_cast<uint32_t>(Bytes[RealPos + 2]) << 16) |
+           (static_cast<uint32_t>(Bytes[RealPos + 3]) << 24);
+  }
+
+  // Drop s bytes from the front of the stream, pushing the positions of the
+  // remaining bytes down by s. This is used to skip past the bitcode header,
+  // since we don't know a priori if it's present, and we can't put bytes
+  // back into the stream once we've read them.
+  // Returns true on failure (fewer than s bytes have been read so far) and
+  // false on success.
+  bool dropLeadingBytes(size_t s) {
+    if (BytesRead < s) return true;
+    // Accumulate rather than overwrite, so BytesSkipped + BytesRead keeps
+    // describing the bytes actually held in the buffer even if bytes are
+    // dropped more than once.
+    BytesSkipped += s;
+    BytesRead -= s;
+    return false;
+  }
+
+  // Records the total bitcode size so that end-of-stream queries do not have
+  // to read the whole stream.
+  void setKnownBitcodeSize(size_t size) {
+    BitcodeSize = size;
+  }
+
+private:
+  const static uint32_t kChunkSize = 4096 * 4;
+  std::vector<unsigned char> Bytes;
+  OwningPtr<BitcodeStreamer> Streamer;
+  size_t BytesRead;   // Bytes read from stream
+  size_t BytesSkipped;// Bytes skipped at start of stream (e.g. wrapper/header)
+  size_t BitcodeSize; // 0 if unknown, set if wrapper was seen or EOF reached
+  bool EOFReached;
+
+  // fetch enough bytes such that Pos can be read or EOF is reached
+  // (i.e. BytesRead > Pos). Return true if Pos can be read.
+  // Unlike most of the functions in BitcodeReader, returns true on success.
+  bool fetchToPos(size_t Pos) {
+    if (EOFReached) return Pos < BitcodeSize;
+    while (Pos >= BytesRead) {
+      // The next chunk is written at offset BytesRead + BytesSkipped, so the
+      // buffer must have room for the skipped prefix as well; sizing it to
+      // BytesRead + kChunkSize alone would let the read run BytesSkipped
+      // bytes past the end of the vector.
+      Bytes.resize(BytesRead + BytesSkipped + kChunkSize);
+      size_t bytes = Streamer->GetBytes(&Bytes[BytesRead + BytesSkipped],
+                                        kChunkSize);
+      BytesRead += bytes;
+      if (bytes < kChunkSize) {
+        if (BitcodeSize && BytesRead < Pos)
+          assert(0 && "Unexpected short read fetching bitcode");
+        if (BytesRead <= Pos) { // reached EOF/ran out of bytes
+          BitcodeSize = BytesRead;
+          EOFReached = true;
+          return false;
+        }
+      }
+    }
+    return true;
+  }
+
+  LazyBitstreamBytes(const LazyBitstreamBytes&); // DO NOT IMPLEMENT
+  void operator=(const LazyBitstreamBytes&); // DO NOT IMPLEMENT
+};

class BitstreamReader {

public:

@@ -36,9 +233,7 @@ public:

std::vector<std::pair<unsigned, std::string> > RecordNames;

};

private:

- /// FirstChar/LastChar - This remembers the first and last bytes of the

- /// stream.

- const unsigned char *FirstChar, *LastChar;

+ OwningPtr<BitstreamBytes> Bytes;

std::vector<BlockInfo> BlockInfoRecords;

@@ -47,10 +242,10 @@ private:

/// uses this.

bool IgnoreBlockInfoNames;

- BitstreamReader(const BitstreamReader&); // NOT IMPLEMENTED

- void operator=(const BitstreamReader&); // NOT IMPLEMENTED

+ BitstreamReader(const BitstreamReader&); // DO NOT IMPLEMENT

+ void operator=(const BitstreamReader&); // DO NOT IMPLEMENT

public:

- BitstreamReader() : FirstChar(0), LastChar(0), IgnoreBlockInfoNames(true) {

+ BitstreamReader() : IgnoreBlockInfoNames(true) {

}

BitstreamReader(const unsigned char *Start, const unsigned char *End) {

@@ -58,12 +253,17 @@ public:

init(Start, End);

}

+ BitstreamReader(BitstreamBytes *bsv) {

+ Bytes.reset(bsv);

+ }

+

void init(const unsigned char *Start, const unsigned char *End) {

- FirstChar = Start;

- LastChar = End;

assert(((End-Start) & 3) == 0 &&"Bitcode stream not a multiple of 4 bytes");

+ Bytes.reset(new MemoryBitstreamBytes(Start, End));

}

+ BitstreamBytes &getBytes() { return *Bytes; }

+

~BitstreamReader() {

// Free the BlockInfoRecords.

while (!BlockInfoRecords.empty()) {

@@ -76,9 +276,6 @@ public:

}

}

- const unsigned char *getFirstChar() const { return FirstChar; }

- const unsigned char *getLastChar() const { return LastChar; }

-

/// CollectBlockInfoNames - This is called by clients that want block/record

/// name information.

void CollectBlockInfoNames() { IgnoreBlockInfoNames = false; }

@@ -122,7 +319,7 @@ public:

class BitstreamCursor {

friend class Deserializer;

BitstreamReader *BitStream;

- const unsigned char *NextChar;

+ size_t NextChar;

/// CurWord - This is the current data we have pulled from the stream but have

/// not returned to the client.

@@ -156,8 +353,7 @@ public:

}

explicit BitstreamCursor(BitstreamReader &R) : BitStream(&R) {

- NextChar = R.getFirstChar();

- assert(NextChar && "Bitstream not initialized yet");

+ NextChar = 0;

CurWord = 0;

BitsInCurWord = 0;

CurCodeSize = 2;

@@ -167,8 +363,7 @@ public:

freeState();

BitStream = &R;

- NextChar = R.getFirstChar();

- assert(NextChar && "Bitstream not initialized yet");

+ NextChar = 0;

CurWord = 0;

BitsInCurWord = 0;

CurCodeSize = 2;

@@ -226,12 +421,12 @@ public:

unsigned GetAbbrevIDWidth() const { return CurCodeSize; }

bool AtEndOfStream() const {

- return NextChar == BitStream->getLastChar() && BitsInCurWord == 0;

+ return BitStream->getBytes().isEndPos(NextChar) && BitsInCurWord == 0;

}

/// GetCurrentBitNo - Return the bit # of the bit we are reading.

uint64_t GetCurrentBitNo() const {

- return (NextChar-BitStream->getFirstChar())*CHAR_BIT - BitsInCurWord;

+ return NextChar*CHAR_BIT - BitsInCurWord;

}

BitstreamReader *getBitStreamReader() {

@@ -246,12 +441,10 @@ public:

void JumpToBit(uint64_t BitNo) {

uintptr_t ByteNo = uintptr_t(BitNo/8) & ~3;

uintptr_t WordBitNo = uintptr_t(BitNo) & 31;

- assert(ByteNo <= (uintptr_t)(BitStream->getLastChar()-

- BitStream->getFirstChar()) &&

- "Invalid location");

+ assert(BitStream->getBytes().canSkipToPos(ByteNo) && "Invalid location");

// Move the cursor to the right word.

- NextChar = BitStream->getFirstChar()+ByteNo;

+ NextChar = ByteNo;

BitsInCurWord = 0;

CurWord = 0;

@@ -272,7 +465,7 @@ public:

}

// If we run out of data, stop at the end of the stream.

- if (NextChar == BitStream->getLastChar()) {

+ if (BitStream->getBytes().isEndPos(NextChar)) {

CurWord = 0;

BitsInCurWord = 0;

return 0;

@@ -281,8 +474,7 @@ public:

unsigned R = CurWord;

// Read the next word from the stream.

- CurWord = (NextChar[0] << 0) | (NextChar[1] << 8) |

- (NextChar[2] << 16) | (NextChar[3] << 24);

+ CurWord = BitStream->getBytes().getWord(NextChar);

NextChar += 4;

// Extract NumBits-BitsInCurWord from what we just read.

@@ -376,9 +568,8 @@ public:

// Check that the block wasn't partially defined, and that the offset isn't

// bogus.

- const unsigned char *const SkipTo = NextChar + NumWords*4;

- if (AtEndOfStream() || SkipTo > BitStream->getLastChar() ||

- SkipTo < BitStream->getFirstChar())

+ size_t SkipTo = NextChar + NumWords*4;

+ if (AtEndOfStream() || !BitStream->getBytes().canSkipToPos(SkipTo))

return true;

NextChar = SkipTo;

@@ -409,8 +600,7 @@ public:

if (NumWordsP) *NumWordsP = NumWords;

// Validate that this block is sane.

- if (CurCodeSize == 0 || AtEndOfStream() ||

- NextChar+NumWords*4 > BitStream->getLastChar())

+ if (CurCodeSize == 0 || AtEndOfStream())

return true;

return false;

@@ -512,24 +702,24 @@ public:

SkipToWord(); // 32-bit alignment

// Figure out where the end of this blob will be including tail padding.

- const unsigned char *NewEnd = NextChar+((NumElts+3)&~3);

+ size_t NewEnd = NextChar+((NumElts+3)&~3);

// If this would read off the end of the bitcode file, just set the

// record to empty and return.

- if (NewEnd > BitStream->getLastChar()) {

+ if (!BitStream->getBytes().canSkipToPos(NewEnd)) {

Vals.append(NumElts, 0);

- NextChar = BitStream->getLastChar();

+ NextChar = BitStream->getBytes().getEndPos();

break;

}

// Otherwise, read the number of bytes. If we can return a reference to

// the data, do so to avoid copying it.

if (BlobStart) {

- *BlobStart = (const char*)NextChar;

+ *BlobStart = (const char*)BitStream->getBytes().addressOf(NextChar);

*BlobLen = NumElts;

} else {

for (; NumElts; ++NextChar, --NumElts)

- Vals.push_back(*NextChar);

+ Vals.push_back(BitStream->getBytes().getByte(NextChar));

}

// Skip over tail padding.

NextChar = NewEnd;

« no previous file with comments | « no previous file | include/llvm/Bitcode/ReaderWriter.h » ('j') | no next file with comments »

Powered by Google App Engine

This is Rietveld 408576698