Index: include/llvm/Bitcode/NaCl/NaClBitstreamReader.h |
diff --git a/include/llvm/Bitcode/NaCl/NaClBitstreamReader.h b/include/llvm/Bitcode/NaCl/NaClBitstreamReader.h |
index 1a981ae117dab156c27e4b3058b089af9e6eea92..86972c63741c13481cde6ad2bcb092923824b7a7 100644 |
--- a/include/llvm/Bitcode/NaCl/NaClBitstreamReader.h |
+++ b/include/llvm/Bitcode/NaCl/NaClBitstreamReader.h |
@@ -21,7 +21,10 @@ |
#include "llvm/Bitcode/NaCl/NaClLLVMBitCodes.h" |
#include "llvm/Support/Endian.h" |
#include "llvm/Support/StreamingMemoryObject.h" |
+#include <atomic> |
#include <climits> |
+#include <unordered_map> |
John
2016/03/29 16:27:10
alphabetize?
Karl
2016/03/29 20:10:47
Done.
|
+#include <mutex> |
#include <vector> |
namespace llvm { |
@@ -130,15 +133,80 @@ public: |
AbbrevList Abbrevs; |
}; |
+ // Holds the global abbreviations in the BlockInfo block of the bitcode |
+ // file. Sharing is used to allow parallel parses. Share by using |
+ // std::shared_ptr's and shared_from_this(). |
+ // |
+ // Note: The BlockInfo block must be parsed before sharing of the |
+ // BlockInfoRecordsMap. Therefore, before changing to a parallel parse, the |
+ // BlockInfoRecordsMap must be frozen. Failure to do so can lead to |
+ // unexpected behaviour. |
+ // |
+ // In practice, this means that only function blocks can be parsed in |
+ // parallel. |
+ class BlockInfoRecordsMap : |
+ public std::enable_shared_from_this<BlockInfoRecordsMap> { |
+ friend class NaClBitstreamReader; |
+ BlockInfoRecordsMap(const BlockInfoRecordsMap&) = delete; |
+ BlockInfoRecordsMap &operator=(const BlockInfoRecordsMap&) = delete; |
+ public: |
+ using InfosMap = std::unordered_map<unsigned, BlockInfo>; |
+ |
+ static std::shared_ptr<BlockInfoRecordsMap> create() { |
+ return std::shared_ptr<BlockInfoRecordsMap>(new BlockInfoRecordsMap()); |
John
2016/03/29 16:27:10
perhaps you could use std::make_shared? you'll pro
Karl
2016/03/29 20:10:47
I followed the advice of "Effective Modern C++" by
|
+ } |
+ ~BlockInfoRecordsMap() = default; |
+ |
+ bool isFrozen() { |
John
2016/03/29 16:27:10
can this method be marked const?
Karl
2016/03/29 20:10:47
Done.
|
+ return IsFrozen.load(); |
+ } |
+ |
+ // Marks the map as frozen. Returns true if it was already frozen. |
John
2016/03/29 16:27:10
returns true if already frozen, no?
Karl
2016/03/29 20:10:47
Good catch. Forgot to update the comment when I ch
|
+ bool freeze() { |
+ return IsFrozen.exchange(true); |
+ } |
+ |
+ BlockInfo &getBlockInfo(unsigned BlockID) { |
John
2016/03/29 16:27:10
can this method be marked const?
Karl
2016/03/29 20:10:47
Unfortunately no. The way that the code updates th
|
+ InfosMap::iterator Pos = Infos.find(BlockID); |
John
2016/03/29 16:27:10
auto? I believe this is one of the few cases where
Karl
2016/03/29 20:10:47
Done.
|
+ if (Pos != Infos.end()) |
+ return Pos->second; |
+ report_fatal_error("Invalid block ID: " + std::to_string(BlockID)); |
+ } |
+ |
+ // Holds the BlockInfoRecordsMap's mutex for the instance's lifetime, allowing |
+ // updates to the BlockInfoRecordsMap. Also verifies that the BlockInfoRecordsMap |
+ // didn't get frozen during the instance's lifetime (presumably in the out-of-line constructor/destructor). |
+ class UpdateLock { |
+ UpdateLock() = delete; |
+ UpdateLock &operator=(const UpdateLock&) = delete; |
+ public: |
+ explicit UpdateLock(BlockInfoRecordsMap &BlockInfoRecords); |
+ ~UpdateLock(); |
+ private: |
+ // The BlockInfoRecordsMap to update (held by reference, not owned). |
+ BlockInfoRecordsMap &BlockInfoRecords; |
+ // The lock on BlockInfoRecordsMap's mutex; std::unique_lock releases it on destruction. |
+ std::unique_lock<std::mutex> Lock; |
+ }; |
+ |
+ private: |
+ // The set of known BlockInfo's. |
+ InfosMap Infos; |
+ // True if the known BlockInfo blocks are frozen (i.e. the bitstream reader |
+ // will ignore the BlockInfo block). |
+ std::atomic_bool IsFrozen; |
+ // Lock to use to update this data structure. |
+ std::mutex Lock; |
+ |
+ BlockInfoRecordsMap(); |
+ }; |
+ |
private: |
friend class NaClBitstreamCursor; |
std::unique_ptr<MemoryObject> BitcodeBytes; |
- std::vector<BlockInfo> BlockInfoRecords; |
- |
- // True if the BlockInfo block has been read. |
- bool HasReadBlockInfoBlock = false; |
+ std::shared_ptr<BlockInfoRecordsMap> BlockInfoRecords; |
/// \brief Holds the offset of the first byte after the header. |
size_t InitialAddress; |
@@ -159,22 +227,33 @@ public: |
/// the given bitcode header. |
NaClBitstreamReader(const unsigned char *Start, const unsigned char *End, |
NaClBitcodeHeader &Header) |
- : BitcodeBytes(getNonStreamedMemoryObject(Start, End)) { |
+ : BitcodeBytes(getNonStreamedMemoryObject(Start, End)), |
+ BlockInfoRecords(BlockInfoRecordsMap::create()) { |
initFromHeader(Header); |
} |
/// Read stream from Bytes, after parsing the given bitcode header. |
NaClBitstreamReader(MemoryObject *Bytes, NaClBitcodeHeader &Header) |
- : BitcodeBytes(Bytes) { |
+ : BitcodeBytes(Bytes), BlockInfoRecords(BlockInfoRecordsMap::create()) { |
initFromHeader(Header); |
} |
/// Read stream from bytes, starting at the given initial address. |
/// Provides simple API for unit testing. |
NaClBitstreamReader(MemoryObject *Bytes, size_t InitialAddress) |
- : BitcodeBytes(Bytes), InitialAddress(InitialAddress) { |
+ : BitcodeBytes(Bytes), BlockInfoRecords(BlockInfoRecordsMap::create()), |
+ InitialAddress(InitialAddress) { |
} |
+ /// Read stream from sequence of bytes [Start .. End), sharing the global |
+ /// abbreviations (BlockInfoRecords) of the given bitstream reader and freezing them; the initial address is 0. |
+ /// Assumes that [Start .. End) is copied from Reader's memory object. |
+ NaClBitstreamReader(const unsigned char *Start, |
+ const unsigned char *End, NaClBitstreamReader *Reader) |
+ : BitcodeBytes(getNonStreamedMemoryObject(Start, End)), |
+ BlockInfoRecords(Reader->BlockInfoRecords), InitialAddress(0) |
+ { BlockInfoRecords->freeze(); } |
+ |
// Returns the memory object that is being read. |
MemoryObject &getBitcodeBytes() { return *BitcodeBytes; } |
@@ -189,28 +268,8 @@ public: |
// Block Manipulation |
//===--------------------------------------------------------------------===// |
- /// If there is block info for the specified ID, return it, otherwise return |
- /// null. |
- const BlockInfo *getBlockInfo(unsigned BlockID) const { |
- // Common case, the most recent entry matches BlockID. |
- if (!BlockInfoRecords.empty() && |
- BlockInfoRecords.back().getBlockID() == BlockID) |
- return &BlockInfoRecords.back(); |
- |
- for (unsigned i = 0, e = static_cast<unsigned>(BlockInfoRecords.size()); |
- i != e; ++i) |
- if (BlockInfoRecords[i].getBlockID() == BlockID) |
- return &BlockInfoRecords[i]; |
- return nullptr; |
- } |
- |
- BlockInfo &getOrCreateBlockInfo(unsigned BlockID) { |
- if (const BlockInfo *BI = getBlockInfo(BlockID)) |
- return *const_cast<BlockInfo*>(BI); |
- |
- // Otherwise, add a new record. |
- BlockInfoRecords.push_back(BlockInfo(BlockID)); |
- return BlockInfoRecords.back(); |
+ BlockInfo &getBlockInfo(unsigned BlockID) { |
+ return BlockInfoRecords->getBlockInfo(BlockID); |
} |
}; |
@@ -413,7 +472,7 @@ public: |
BitsInCurWord = 0; |
if (BitStream) { |
BlockScope.push_back( |
- Block(&BitStream->getOrCreateBlockInfo(naclbitc::TOP_LEVEL_BLOCKID))); |
+ Block(&BitStream->getBlockInfo(naclbitc::TOP_LEVEL_BLOCKID))); |
} |
} |
@@ -523,10 +582,35 @@ public: |
} |
} |
+ /// Returns the starting byte of the word containing BitNo: BitNo/8 with the low bits below sizeof(word_t) masked off. |
+ uintptr_t getStartWordByteForBit(uint64_t BitNo) const { |
+ return uintptr_t(BitNo/8) & ~(sizeof(word_t)-1); |
+ } |
+ |
+ /// Returns the index of BitNo within the word it appears in (BitNo masked with the number of bits in word_t, minus one). |
+ unsigned getWordBitNo(uint64_t BitNo) const { |
+ return unsigned(BitNo & (sizeof(word_t)*8-1)); |
+ } |
+ |
+ /// Returns the byte just past the word containing BitNo; if BitNo is word-aligned (bit index 0 in its word), returns that word's starting byte instead. |
+ uintptr_t getEndWordByteForBit(uint64_t BitNo) const { |
+ return getStartWordByteForBit(BitNo) + |
+ (getWordBitNo(BitNo) |
+ ? sizeof(word_t) |
+ : 0); |
+ } |
+ |
+ /// Fills Buffer[Size] using bytes at Address (in the memory object being |
+ /// read), by forwarding to readBytes on the bitstream's memory object. Returns number of |
+ /// bytes filled (less than Size if at end of memory object). |
+ uint64_t fillBuffer(uint8_t *Buffer, size_t Size, size_t Address) const { |
+ return BitStream->getBitcodeBytes().readBytes(Buffer, Size, Address); |
+ } |
+ |
/// Reset the stream to the specified bit number. |
void JumpToBit(uint64_t BitNo) { |
- uintptr_t ByteNo = uintptr_t(BitNo/8) & ~(sizeof(word_t)-1); |
- unsigned WordBitNo = unsigned(BitNo & (sizeof(word_t)*8-1)); |
+ uintptr_t ByteNo = getStartWordByteForBit(BitNo); |
+ unsigned WordBitNo = getWordBitNo(BitNo); |
if (!canSkipToPos(ByteNo)) |
reportInvalidJumpToBit(BitNo); |
@@ -545,8 +629,7 @@ public: |
// Read the next word from the stream. |
uint8_t Array[sizeof(word_t)] = {0}; |
- uint64_t BytesRead = |
- BitStream->getBitcodeBytes().readBytes(Array, sizeof(Array), NextChar); |
+ uint64_t BytesRead = fillBuffer(Array, sizeof(Array), NextChar); |
// If we run out of data, stop at the end of the stream. |
if (BytesRead == 0) { |