Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(12)

Unified Diff: src/PNaClTranslator.cpp

Issue 361733002: Update Subzero to start parsing PNaCl bitcode files. (Closed) Base URL: https://chromium.googlesource.com/native_client/pnacl-subzero.git@master
Patch Set: Fix more nits. Created 6 years, 6 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View side-by-side diff with in-line comments
Download patch
Index: src/PNaClTranslator.cpp
diff --git a/src/PNaClTranslator.cpp b/src/PNaClTranslator.cpp
new file mode 100644
index 0000000000000000000000000000000000000000..327f35fdf5e82a946aa8612a0eac30390bad09a4
--- /dev/null
+++ b/src/PNaClTranslator.cpp
@@ -0,0 +1,872 @@
+//===- subzero/src/PNaClTranslator.cpp - Builds ICE from PNaCl bitcode ----===//
+//
+// The Subzero Code Generator
+//
+// This file is distributed under the University of Illinois Open Source
+// License. See LICENSE.TXT for details.
+//
+//===----------------------------------------------------------------------===//
+//
+// This file implements the PNaCl bitcode file to Ice translator.
+//
+//===----------------------------------------------------------------------===//
+
+#include "PNaClTranslator.h"
+#include "llvm/Bitcode/NaCl/NaClBitcodeDecoders.h"
+#include "llvm/Bitcode/NaCl/NaClBitcodeHeader.h"
+#include "llvm/Bitcode/NaCl/NaClBitcodeParser.h"
+#include "llvm/Bitcode/NaCl/NaClReaderWriter.h"
+#include "llvm/IR/Constants.h"
+#include "llvm/IR/LLVMContext.h"
+#include "llvm/IR/Module.h"
+#include "llvm/Support/Format.h"
+#include "llvm/Support/MemoryBuffer.h"
+#include "llvm/Support/raw_ostream.h"
+#include "llvm/Support/ValueHandle.h"
+
+#include <vector>
+#include <cassert>
+
+using namespace llvm;
+
+namespace {
+
+// Top-level class to read PNaCl bitcode files, and translate to ICE.
+class TopLevelParser : public NaClBitcodeParser {
+ TopLevelParser(const TopLevelParser&) LLVM_DELETED_FUNCTION;
+ void operator=(const TopLevelParser&) LLVM_DELETED_FUNCTION;
jvoung (off chromium) 2014/07/01 17:32:52 I think for Subzero, Jim has been using: T &opera
Karl 2014/07/01 21:31:07 Done.
+
+public:
+ TopLevelParser(Module *Mod,
jvoung (off chromium) 2014/07/01 17:32:52 It would be good to clarify what state the incomin
Karl 2014/07/01 21:31:07 I hadn't really worried about this because these c
+ NaClBitcodeHeader &Header,
+ NaClBitstreamCursor &Cursor)
+ : NaClBitcodeParser(Cursor),
+ Mod(Mod),
+ Header(Header),
+ NumErrors(),
jvoung (off chromium) 2014/07/01 17:32:53 initialize to 0?
Karl 2014/07/01 21:31:06 Definitely!
jvoung (off chromium) 2014/07/02 17:00:15 Okay, using () does initialize to zero, but it see
Karl 2014/07/02 18:09:54 Adding zero to be more clear.
+ NumFunctionIds(0),
+ GlobalVarPlaceHolderType(0) {}
+
+  /// Virtual destructor. The body is empty: no explicit cleanup is
+  /// performed here.
+  virtual ~TopLevelParser() LLVM_OVERRIDE {}
+
+ virtual bool Error(const std::string &Message) LLVM_OVERRIDE {
+ ++NumErrors;
+ return NaClBitcodeParser::Error(Message);
+ }
+
+ /// Returns the number of errors found while parsing the bitcode
+ /// file.
+ unsigned getNumErrors() const {
+ return NumErrors;
+ }
+
+ /// Returns the LLVM module associated with the translation.
+ Module *getModule() {
+ return Mod;
+ }
+
+ /// Returns the number of bytes in the bitcode header.
+ size_t getHeaderSize() {
jvoung (off chromium) 2014/07/01 17:32:53 Some of these other methods are const too?
Karl 2014/07/01 21:31:06 Done.
+ return Header.getHeaderSize();
+ }
+
+ /// Returns the llvm context to use.
+ LLVMContext &getLLVMContext() {
+ return Mod->getContext();
+ }
+
+ /// Changes the size of the type list to the given size.
+ void resizeTypeIDValues(unsigned NewSize) {
+ TypeIDValues.resize(NewSize);
+ }
+
+ /// Returns the type associated with the given index.
+ Type *getTypeByID(unsigned ID) {
+ Type *Ty = ID < TypeIDValues.size() ? TypeIDValues[ID] : 0;
jvoung (off chromium) 2014/07/01 17:32:53 Clarify that the array could really end up storing
Karl 2014/07/01 21:31:08 Done.
+ if (Ty) return Ty;
+ return reportTypeIDAsUndefined(ID);
+ }
+
+  /// Records Ty as the type for ID. ID must index into the type list
+  /// and its slot must still be empty; otherwise the problem is reported
+  /// through reportBadSetTypeID and the type list is left unchanged.
+  void setTypeID(unsigned ID, Type *Ty) {
+    const bool InRange = ID < TypeIDValues.size();
+    // Short-circuit keeps the index access guarded by the range test.
+    if (!InRange || TypeIDValues[ID] != 0) {
+      reportBadSetTypeID(ID, Ty);
+      return;
+    }
+    TypeIDValues[ID] = Ty;
+  }
+
+ /// Sets the next function ID to the given LLVM function.
+ void setNextFunctionID(Function *Fcn) {
+ ++NumFunctionIds;
+ ValueIDValues.push_back(Fcn);
+ }
+
+ /// Defines the next function ID as one that has an implementation
+ /// (i.e. a corresponding function block in the bitcode).
+ void setNextValueIDAsImplementedFunction() {
+ DefiningFunctionsList.push_back(ValueIDValues.size());
+ }
+
+ /// Returns the LLVM IR value associated with the global value ID.
+ Value *getGlobalValueByID(unsigned ID) {
+ if (ID >= ValueIDValues.size()) return 0;
+ return ValueIDValues[ID];
+ }
+
+ /// Returns the number of function addresses (i.e. ID's) defined in
+ /// the bitcode file.
+ unsigned getNumFunctionIDs() {
jvoung (off chromium) 2014/07/01 17:32:52 const
Karl 2014/07/01 21:31:08 Done.
+ return NumFunctionIds;
+ }
+
+ /// Returns the number of global values defined in the bitcode
+ /// file.
+ unsigned getNumGlobalValueIDs() {
+ return ValueIDValues.size();
+ }
+
+ /// Resizes the list of value IDs to include Count global
+ /// variable IDs.
+ void resizeValueIDsForGlobalVarCount(unsigned Count) {
+ ValueIDValues.resize(ValueIDValues.size() + Count);
+ }
+
+ /// Returns the global variable address associated with the given
+ /// value ID. If the ID refers to a global variable address not yet
+ /// defined, a placeholder is created so that we can fix it up
+ /// later.
+ Constant *getOrCreateGlobalVarRef(unsigned ID) {
+ if (ID >= ValueIDValues.size()) return 0;
+ if (Value *C = ValueIDValues[ID])
+ return dyn_cast<Constant>(C);
+
+ if (GlobalVarPlaceHolderType == 0)
jvoung (off chromium) 2014/07/01 17:32:53 Why not just eagerly initialize it in the class's
Karl 2014/07/01 21:31:06 Done.
+ GlobalVarPlaceHolderType = Type::getInt8Ty(getLLVMContext());
+ Constant *C =
+ new GlobalVariable(*Mod, GlobalVarPlaceHolderType, false,
+ GlobalValue::ExternalLinkage, 0);
+ ValueIDValues[ID] = C;
+ return C;
+ }
+
+ /// Assigns the given global variable (address) to the given value
+ /// ID. Returns true if ID is a valid global variable ID. Otherwise
+ /// returns false.
+ bool assignGlobalVariable(GlobalVariable *GV, unsigned ID) {
+ if (ID < NumFunctionIds || ID >= ValueIDValues.size()) return false;
+ WeakVH &OldV = ValueIDValues[ID];
+ if (OldV == 0) {
+ ValueIDValues[ID] = GV;
+ return true;
+ }
+
+ // If reached, there was a forward reference to this value. Replace it.
+ Value *PrevVal = OldV;
+ GlobalVariable *Placeholder = cast<GlobalVariable>(PrevVal);
+ Placeholder->replaceAllUsesWith(
+ ConstantExpr::getBitCast(GV, Placeholder->getType()));
+ Placeholder->eraseFromParent();
+ ValueIDValues[ID] = GV;
+ return true;
+ }
+
+private:
+ // The parsed module.
+ Module *Mod;
+ // The bitcode header.
+ NaClBitcodeHeader &Header;
+ // The number of errors reported.
+ unsigned NumErrors;
+ // The types associated with each type ID.
+ std::vector<Type*> TypeIDValues;
+ // The (global) value IDs.
+ std::vector<WeakVH> ValueIDValues;
+ // The number of function IDs.
+ unsigned NumFunctionIds;
+ // The list of value IDs (in the order found) of defining function
+ // addresses.
+ std::vector<unsigned> DefiningFunctionsList;
+ // Cached global variable placeholder type. Used for all forward
+ // references to global variable addresses.
+ Type *GlobalVarPlaceHolderType;
+
+ virtual bool ParseBlock(unsigned BlockID) LLVM_OVERRIDE;
+
+ /// Reports that type ID is undefined, and then returns
+ /// the void type.
+ Type *reportTypeIDAsUndefined(unsigned ID);
+
+ /// Reports error about bad call to setTypeID.
+ void reportBadSetTypeID(unsigned ID, Type *Ty);
+};
+
+Type *TopLevelParser::reportTypeIDAsUndefined(unsigned ID) {
+ std::string Buffer;
+ raw_string_ostream StrBuf(Buffer);
jvoung (off chromium) 2014/07/01 17:32:52 This probably doesn't count as "Subzero core" sinc
Karl 2014/07/01 21:31:06 First off, Jim's comment about not using it is inc
+ StrBuf << "Can't find type for type id: " << ID;
+ Error(StrBuf.str());
+ Type *Ty = Type::getVoidTy(getLLVMContext());
+ // To reduce error messages, update type list if possible.
+ if (ID < TypeIDValues.size()) TypeIDValues[ID] = Ty;
+ return Ty;
+}
+
+// Emits the diagnostic for a rejected setTypeID(ID, Ty) request: either
+// ID lies outside the type list, or the slot for ID already holds a
+// type (in which case both the existing and the new type are shown).
+void TopLevelParser::reportBadSetTypeID(unsigned ID, Type *Ty) {
+  std::string Message;
+  raw_string_ostream Out(Message);
+  Out << "Type index " << ID;
+  const bool SlotExists = ID < TypeIDValues.size();
+  if (SlotExists) {
+    // In range, so it must be the case that the index is already defined.
+    Out << " defined as " << *TypeIDValues[ID] << " and " << *Ty << ".";
+  } else {
+    Out << " out of range: can't install.";
+  }
+  Error(Out.str());
+}
+
+// class for parsing blocks within the TopLevelParser.
+class BlockParser : public NaClBitcodeParser {
+protected:
+
+ // Constructor for nested block parsers.
+ BlockParser(unsigned BlockID, BlockParser *EnclosingParser)
+ : NaClBitcodeParser(BlockID, EnclosingParser),
+ Context(EnclosingParser->Context) {}
+
+  // Returns a string describing the bit address of the current record
+  // being processed by the block parser, formatted as "<byte>:<bit>".
+  // The record's start bit is offset by the size of the bitcode header
+  // (converted from bytes to bits) before being split into the two parts.
+  std::string getRecordAddress() const {
jvoung (off chromium) 2014/07/01 17:32:52 could inline this into Error(), then you don't nee
Karl 2014/07/01 21:31:06 Ok. the other uses I had for it has since been rem
+    uint64_t Bit = Record.GetStartBit() + Context->getHeaderSize() * 8;
+    std::string Buffer;
+    raw_string_ostream StrBuf(Buffer);
+    // The spaces around PRIu64 are required: C++11 otherwise lexes
+    // "%"PRIu64 as a string literal followed by a user-defined-literal
+    // suffix instead of expanding the macro.
+    StrBuf << format("%" PRIu64 ":%u",
+                     (Bit / 8),
+                     static_cast<unsigned>(Bit % 8));
+    return StrBuf.str();
+  }
+
+ virtual bool Error(const std::string &Message) LLVM_OVERRIDE {
+ std::string Buffer;
+ raw_string_ostream StrBuf(Buffer);
+ StrBuf << "(" << getRecordAddress() << ") " << Message;
+ return Context->Error(StrBuf.str());
+ }
+
+public:
+ // Constructor for the top-level module block parser.
+ BlockParser(unsigned BlockID, TopLevelParser *Context)
jvoung (off chromium) 2014/07/01 17:32:52 Why not make this first, before the nested block c
Karl 2014/07/01 21:31:07 Done.
+ : NaClBitcodeParser(BlockID, Context),
+ Context(Context) {}
+
+ virtual ~BlockParser() LLVM_OVERRIDE {}
+
+protected:
+ // Default implementation. Reports that block is unknown and skips
+ // its contents.
+ virtual bool ParseBlock(unsigned BlockID) LLVM_OVERRIDE;
+
+ // Default implementation. Reports that the record is not
+ // understood.
+ virtual void ProcessRecord() LLVM_OVERRIDE;
+
+ // The context parser that contains the decoded state.
jvoung (off chromium) 2014/07/01 17:32:53 Can we collect the fields in one place, and the me
Karl 2014/07/01 21:31:06 Done.
+ TopLevelParser *Context;
+
+ /// Checks if the size of the record is Size. If not, an error is
+ /// produced using the given RecordName. Return true if error was
+ /// reported. Otherwise false.
jvoung (off chromium) 2014/07/01 17:32:53 I feel like some of these comments about the error
Karl 2014/07/01 21:31:08 Done.
+ bool checkRecordSize(unsigned Size, const char *RecordName) {
+ const NaClBitcodeRecord::RecordVector &Values = Record.GetValues();
+ if (Values.size() != Size) {
+ return RecordSizeError(Size, RecordName, 0);
+ }
+ return false;
+ }
+
+ /// Checks if the size of the record is at least as large as the
+ /// LowerLimit. If not, an error is produced using the given
+ /// RecordName. Return true if error was reported. Otherwise false.
+ bool checkRecordSizeAtLeast(unsigned LowerLimit, const char *RecordName) {
+ const NaClBitcodeRecord::RecordVector &Values = Record.GetValues();
+ if (Values.size() < LowerLimit) {
+ return RecordSizeError(LowerLimit, RecordName, "at least");
+ }
+ return false;
+ }
+
+ /// Checks if the size of the record is no larger than the
+ /// UpperLimit. If not, an error is produced using the given
+ /// RecordName. Return true if error was reported. Otherwise false.
+ bool checkRecordSizeNoMoreThan(unsigned UpperLimit, const char *RecordName) {
+ const NaClBitcodeRecord::RecordVector &Values = Record.GetValues();
+ if (Values.size() > UpperLimit) {
+ return RecordSizeError(UpperLimit, RecordName, "no more than");
+ }
+ return false;
+ }
+
+ /// Checks if the size of the record is at least as large as the
+ /// LowerLimit, and no larger than the UpperLimit. If not, an error
+ /// is produced using the given RecordName. Return true if error was
+ /// reported. Otherwise false.
+ bool checkRecordSizeInRange(unsigned LowerLimit, unsigned UpperLimit,
+ const char *RecordName) {
+ return checkRecordSizeAtLeast(LowerLimit, RecordName)
+ || checkRecordSizeNoMoreThan(UpperLimit, RecordName);
+ }
+
+private:
+ /// Generates a record size error. ExpectedSize is the number
+ /// of elements expected. RecordName is the name of the kind of
+ /// record that has incorrect size. ContextMessage (if not 0)
+ /// is appended to "record expects" to describe how ExpectedSize
+ /// should be interpreted.
+ bool RecordSizeError(unsigned ExpectedSize,
+ const char *RecordName,
+ const char *ContextMessage) {
+ std::string Buffer;
+ raw_string_ostream StrBuf(Buffer);
+ StrBuf << RecordName << " record expects";
+ if (ContextMessage) StrBuf << " " << ContextMessage;
+ StrBuf << " " << ExpectedSize << " argument";
+ if(ExpectedSize > 1) StrBuf << "s";
+ StrBuf << ". Found: " << Record.GetValues().size();
+ return Error(StrBuf.str());
+ }
+};
+
+bool BlockParser::ParseBlock(unsigned BlockID) {
jvoung (off chromium) 2014/07/01 17:32:53 I wonder if this class should be called something
Karl 2014/07/01 21:31:07 Done.
+ // If called, derived class doesn't know how to handle block.
+ // Report error and skip.
+ std::string Buffer;
+ raw_string_ostream StrBuf(Buffer);
+ StrBuf << "Don't know how to parse block id: " << BlockID;
+ Error(StrBuf.str());
+ SkipBlock();
+ return false;
+}
+
+// Fallback record handler. Reaching it means no derived parser handled
+// the current record, so the record itself is reported as an error.
+void BlockParser::ProcessRecord() {
+  std::string Text;
+  raw_string_ostream Out(Text);
+  Out << "Don't know how to process record: " << Record;
+  Error(Out.str());
+}
+
+// Class to parse a types block.
+class TypesParser : public BlockParser {
+public:
+ TypesParser(unsigned BlockID, BlockParser *EnclosingParser)
+ : BlockParser(BlockID, EnclosingParser), NextTypeId(0) {}
+
+ ~TypesParser() LLVM_OVERRIDE {}
+
+protected:
+ virtual void ProcessRecord() LLVM_OVERRIDE;
+ // The type ID that will be associated with the next type defining
+ // record in the types block.
+ unsigned NextTypeId;
+};
+
+void TypesParser::ProcessRecord() {
+ Type *Ty = 0;
+ const NaClBitcodeRecord::RecordVector &Values = Record.GetValues();
+ switch (Record.GetCode()) {
+ case naclbitc::TYPE_CODE_NUMENTRY:
+ // NUMENTRY: [numentries]
+ if (checkRecordSize(1, "Type count")) return;
+ Context->resizeTypeIDValues(Values[0]);
+ return;
+ case naclbitc::TYPE_CODE_VOID:
+ // VOID
+ if (checkRecordSize(0, "Type void")) break;
+ Ty = Type::getVoidTy(Context->getLLVMContext());
+ break;
+ case naclbitc::TYPE_CODE_FLOAT:
+ // FLOAT
+ if (checkRecordSize(0, "Type float")) break;
+ Ty = Type::getFloatTy(Context->getLLVMContext());
+ break;
+ case naclbitc::TYPE_CODE_DOUBLE:
+ // DOUBLE
+ if (checkRecordSize(0, "Type double")) break;
+ Ty = Type::getDoubleTy(Context->getLLVMContext());
+ break;
+ case naclbitc::TYPE_CODE_INTEGER:
+ // INTEGER: [width]
+ if (checkRecordSize(1, "Type integer")) break;
+ Ty = IntegerType::get(Context->getLLVMContext(), Values[0]);
+ // TODO(kschimpf) Check if size is legal.
+ break;
+ case naclbitc::TYPE_CODE_VECTOR:
+ // VECTOR: [numelts, eltty]
+ if (checkRecordSize(2, "Type vector")) break;
+ Ty = VectorType::get(Context->getTypeByID(Values[1]), Values[0]);
+ break;
+ case naclbitc::TYPE_CODE_FUNCTION: {
+ // FUNCTION: [vararg, retty, paramty x N]
+ if (checkRecordSizeAtLeast(2, "Type signature")) break;
+ SmallVector<Type *, 8> ArgTys;
+ for (unsigned i = 2, e = Values.size(); i != e; ++i) {
+ ArgTys.push_back(Context->getTypeByID(Values[i]));
+ }
+ Ty = FunctionType::get(Context->getTypeByID(Values[1]),
+ ArgTys, Values[0]);
+ break;
+ }
+ default:
+ BlockParser::ProcessRecord();
+ break;
+ }
+ // If Ty not defined, assume error. Use void as filler.
+ if (Ty == 0)
+ Ty = Type::getVoidTy(Context->getLLVMContext());
+ Context->setTypeID(NextTypeId++, Ty);
+}
+
+/// Parses the globals block (i.e. global variables).
+class GlobalsParser : public BlockParser {
+public:
+ GlobalsParser(unsigned BlockID, BlockParser *EnclosingParser)
+ : BlockParser(BlockID, EnclosingParser),
+ InitializersNeeded(0),
+ Alignment(1),
+ IsConstant(false) {
+ NextGlobalID = Context->getNumFunctionIDs();
+ }
+
+ virtual ~GlobalsParser() LLVM_OVERRIDE {}
+
+protected:
+  // Block-exit hook (presumably invoked by the base parser when the
+  // globals block ends -- confirm against NaClBitcodeParser). Checks the
+  // pending initializer count, reports an error when fewer globals were
+  // defined than value IDs exist for them, then defers to the base class.
+  virtual void ExitBlock() LLVM_OVERRIDE {
+    verifyNoMissingInitializers();
+    const unsigned TotalIDs = Context->getNumGlobalValueIDs();
+    if (NextGlobalID < TotalIDs) {
+      const unsigned FunctionIDs = Context->getNumFunctionIDs();
+      const unsigned Expected = TotalIDs - FunctionIDs;
+      const unsigned Found = NextGlobalID - FunctionIDs;
+      std::string Message;
+      raw_string_ostream Out(Message);
+      Out << "Globals block expects " << Expected
+          << " global definitions. Found: " << Found;
+      Error(Out.str());
+    }
+    BlockParser::ExitBlock();
+  }
+
+ virtual void ProcessRecord() LLVM_OVERRIDE;
+
+ // Holds the sequence of initializers for the global.
+ SmallVector<Constant *, 10> Initializers;
jvoung (off chromium) 2014/07/01 17:32:53 Similar, can we put all the fields in one block, a
Karl 2014/07/01 21:31:07 Done.
+
+ // Keeps track of how many initializers are expected for
+ // the global variable being built.
+ unsigned InitializersNeeded;
+
+ // The alignment assumed for the global variable being built.
+ unsigned Alignment;
+
+ // True if the global variable being built is a constant.
+ bool IsConstant;
+
+ // The index of the next global variable.
+ unsigned NextGlobalID;
+
+  // Checks if the number of initializers needed is the same as the
+  // number found in the bitcode file. If different, an error message
+  // is generated, and the internal state of the parser is fixed so
+  // this condition is no longer violated: the expected count is set to
+  // the number actually collected and the variable is installed with
+  // whatever initializers it has.
+  void verifyNoMissingInitializers() {
+    if (InitializersNeeded != Initializers.size()) {
+      std::string Buffer;
+      raw_string_ostream StrBuf(Buffer);
+      StrBuf << "Global variable @g"
+             << (NextGlobalID - Context->getNumFunctionIDs())
+             << " expected " << InitializersNeeded << " initializer";
+      // Pluralize for every count except exactly one; an expected count
+      // of zero is reachable when an initializer record arrives without
+      // a preceding variable record.
+      if (InitializersNeeded != 1) StrBuf << "s";
+      StrBuf << ". Found: " << Initializers.size();
+      Error(StrBuf.str());
+      // Fix up state so that we can continue.
+      InitializersNeeded = Initializers.size();
+      installGlobalVar();
+    }
+  }
+
+ // Reserves a slot in the list of initializers being built. If there
+ // isn't room for the slot, an error message is generated.
+ void reserveInitializer(const char *RecordName) {
+ if (InitializersNeeded == Initializers.size()) {
jvoung (off chromium) 2014/07/01 17:32:52 Would it be safer to check if >= ? Otherwise, it l
Karl 2014/07/01 21:31:07 I did this so that we wouldn't get cascading error
+ std::string Buffer;
+ raw_string_ostream StrBuf(Buffer);
+ StrBuf << RecordName << " record: Too many initializers, ignoring.";
jvoung (off chromium) 2014/07/01 17:32:52 Probably could have just std::string() + ... for t
Karl 2014/07/01 21:31:07 Done.
+ Error(StrBuf.str());
+ }
+ }
+
+ // Takes the initializers (and other parser state values) and
+ // installs a global variable (with the initializers) into the list
+ // of ValueIDs.
+ void installGlobalVar() {
+ Constant *Init = 0;
+ switch (Initializers.size()) {
+ case 0:
+ Error("No initializer for global variable in global vars block");
+ return;
+ case 1:
+ Init = Initializers[0];
+ break;
+ default:
+ Init = ConstantStruct::getAnon(Context->getLLVMContext(),
+ Initializers, true);
+ break;
+ }
+ GlobalVariable *GV = new GlobalVariable(
+ *Context->getModule(), Init->getType(), IsConstant,
+ GlobalValue::InternalLinkage, Init, "");
+ GV->setAlignment(Alignment);
+ if (!Context->assignGlobalVariable(GV, NextGlobalID)) {
+ std::string Buffer;
+ raw_string_ostream StrBuf(Buffer);
+ StrBuf << "Defining global V[" << NextGlobalID
+ << "] not allowed. Out of range.";
+ Error(StrBuf.str());
+ }
+ ++NextGlobalID;
+ Initializers.clear();
+ InitializersNeeded = 0;
+ Alignment = 1;
+ IsConstant = false;
+ }
+};
+
+// Handles a single record of the globals block:
+//   COUNT    - reserves value IDs for the global variables to follow.
+//   VAR      - begins a new global variable (alignment, constness).
+//   COMPOUND - states how many initializers the variable takes.
+//   ZEROFILL, DATA, RELOC - each contribute one initializer.
+// Once the expected number of initializers has been collected, the
+// variable is installed via installGlobalVar(). Unrecognized records are
+// passed to BlockParser::ProcessRecord().
+void GlobalsParser::ProcessRecord() {
+  const NaClBitcodeRecord::RecordVector &Values = Record.GetValues();
+  switch (Record.GetCode()) {
+  case naclbitc::GLOBALVAR_COUNT:
+    // COUNT: [n]
+    if (checkRecordSize(1, "Globals count")) return;
+    if (NextGlobalID > Context->getNumFunctionIDs()) {
jvoung (off chromium) 2014/07/01 17:32:52 I can't put my finger on it, but this checks seems
Karl 2014/07/01 21:31:07 The test is to verify it appears before any global
+      Error("Globals count record not first in block.");
+      return;
+    }
+    verifyNoMissingInitializers();
+    Context->resizeValueIDsForGlobalVarCount(Values[0]);
+    return;
+  case naclbitc::GLOBALVAR_VAR: {
+    // VAR: [align, isconst]
+    if (checkRecordSize(2, "Globals variable")) return;
+    verifyNoMissingInitializers();
+    InitializersNeeded = 1;
+    Initializers.clear();
+    // The alignment field decodes as (1 << field) >> 1, i.e. 0 yields an
+    // alignment of 0 and k yields 2^(k-1). The field comes straight from
+    // the bitcode file, so reject exponents that would shift past 32
+    // bits (undefined behavior) instead of evaluating them.
+    if (Values[0] >= 32) {
+      std::string Buffer;
+      raw_string_ostream StrBuf(Buffer);
+      StrBuf << "Globals variable alignment exponent too large. Found: "
+             << Values[0];
+      Error(StrBuf.str());
+      // Fall back to the parser's default alignment and keep going.
+      Alignment = 1;
+    } else {
+      Alignment = static_cast<unsigned>(
+          (static_cast<uint64_t>(1) << Values[0]) >> 1);
+    }
+    // Constness is the second field of the record; the first field is
+    // the alignment.
+    IsConstant = Values[1] != 0;
jvoung (off chromium) 2014/07/01 17:32:52 Values[1] != 0 Otherwise, the alignment could mak
Karl 2014/07/01 21:31:08 Done.
+    return;
+  }
+  case naclbitc::GLOBALVAR_COMPOUND:
+    // COMPOUND: [size]
+    if (checkRecordSize(1, "globals compound")) return;
+    if (Initializers.size() > 0 || InitializersNeeded != 1) {
+      Error("Globals compound record not first initializer");
+      return;
+    }
+    if (Values[0] < 2) {
+      std::string Buffer;
+      raw_string_ostream StrBuf(Buffer);
+      StrBuf << "Globals compound record size invalid. Found: "
+             << Values[0];
+      Error(StrBuf.str());
+      return;
+    }
+    InitializersNeeded = Values[0];
+    return;
+  case naclbitc::GLOBALVAR_ZEROFILL: {
+    // ZEROFILL: [size]
+    if (checkRecordSize(1, "Globals zerofill")) return;
+    reserveInitializer("Globals zerofill");
+    Type *Ty = ArrayType::get(Type::getInt8Ty(Context->getLLVMContext()),
+                              Values[0]);
+    Constant *Zero = ConstantAggregateZero::get(Ty);
+    Initializers.push_back(Zero);
+    break;
+  }
+  case naclbitc::GLOBALVAR_DATA: {
+    // DATA: [b0, b1, ...]
+    if (checkRecordSizeAtLeast(1, "Globals data")) return;
+    reserveInitializer("Globals data");
+    unsigned Size = Values.size();
+    // Each record value is narrowed to one byte. The buffer is a
+    // SmallVector so it is released on every exit path.
+    SmallVector<uint8_t, 64> Buf;
+    Buf.reserve(Size);
+    for (unsigned i = 0; i < Size; ++i)
jvoung (off chromium) 2014/07/01 17:32:53 could memcpy this?
Karl 2014/07/01 21:31:07 Not really. We are doing a cast from uint64_t to u
+      Buf.push_back(static_cast<uint8_t>(Values[i]));
+    Constant *Init = ConstantDataArray::get(
+        Context->getLLVMContext(),
+        ArrayRef<uint8_t>(Buf.data(), Buf.size()));
+    Initializers.push_back(Init);
+    break;
+  }
+  case naclbitc::GLOBALVAR_RELOC: {
+    // RELOC: [val, [addend]]
+    if (checkRecordSizeInRange(1, 2, "Globals reloc")) return;
+    // Same "too many initializers" check the other initializer records
+    // perform before appending.
+    reserveInitializer("Globals reloc");
+    Constant *BaseVal =
+        Context->getOrCreateGlobalVarRef(Values[0]);
+    if (BaseVal == 0) {
+      std::string Buffer;
+      raw_string_ostream StrBuf(Buffer);
+      StrBuf << "Can't find global relocation value: " << Values[0];
+      Error(StrBuf.str());
+      return;
+    }
+    // The address is converted to a 32-bit integer and the optional
+    // addend is folded in as a constant add.
+    Type *IntPtrType = IntegerType::get(Context->getLLVMContext(), 32);
+    Constant *Val = ConstantExpr::getPtrToInt(BaseVal, IntPtrType);
+    if (Values.size() == 2) {
+      Val = ConstantExpr::getAdd(Val,
+                                 ConstantInt::get(IntPtrType, Values[1]));
+    }
+    Initializers.push_back(Val);
+    break;
+  }
+  default:
+    BlockParser::ProcessRecord();
+    return;
+  }
+  // If reached, just processed another initializer. See if time
+  // to install global.
+  if (InitializersNeeded == Initializers.size()) installGlobalVar();
+}
+
+// Parses a valuesymtab block in the bitcode file.
+class ValuesymtabParser : public BlockParser {
+ typedef SmallString<128> StringType;
+public:
+ ValuesymtabParser(unsigned BlockID,
+ BlockParser *EnclosingParser,
jvoung (off chromium) 2014/07/01 17:32:53 indent to line up to after the ( ? There is "make
Karl 2014/07/01 21:31:06 Done.
Jim Stichnoth 2014/07/07 20:50:23 This (modifying unrelated files) is usually becaus
+ bool AllowBbEntries)
+ : BlockParser(BlockID, EnclosingParser),
+ AllowBbEntries(AllowBbEntries) {}
+
+ virtual ~ValuesymtabParser() LLVM_OVERRIDE {}
+
+protected:
+ // True if entries to name basic blocks allowed.
+ bool AllowBbEntries;
+ // The last name converted to a string using ConvertToString.
+ StringType ConvertedName;
+
+ virtual void ProcessRecord() LLVM_OVERRIDE;
+
+  // Rebuilds ConvertedName from the current record: every value after
+  // the first is narrowed to a char and appended. The first value is
+  // skipped (callers treat it as an ID rather than part of the name).
+  void ConvertToString() {
+    ConvertedName.clear();
+    const NaClBitcodeRecord::RecordVector &Values = Record.GetValues();
+    // Use '<' rather than '!=' so that an empty record (size 0, which
+    // the starting index of 1 would never equal) cannot run the loop
+    // past the end of Values.
+    for (size_t i = 1, e = Values.size(); i < e; ++i) {
+      ConvertedName += static_cast<char>(Values[i]);
+    }
+  }
+};
+
+void ValuesymtabParser::ProcessRecord() {
+ const NaClBitcodeRecord::RecordVector &Values = Record.GetValues();
+ switch (Record.GetCode()) {
+ case naclbitc::VST_CODE_ENTRY: {
+ // VST_ENTRY: [valid, namechar x N]
jvoung (off chromium) 2014/07/01 17:32:53 valueID, or something instead of valid
Karl 2014/07/01 21:31:07 Done.
+ if (checkRecordSizeAtLeast(2, "Valuesymtab value entry")) return;
+ ConvertToString();
jvoung (off chromium) 2014/07/01 17:32:52 Feels a bit roundabout that ConvertedName is a fie
Karl 2014/07/01 21:31:07 I mainly did this to avoid allocations between cal
+ Value *V = Context->getGlobalValueByID(Values[0]);
+ if (V == 0) {
+ std::string Buffer;
+ raw_string_ostream StrBuf(Buffer);
+ StrBuf << "Invalid global address ID in valuesymtab: " << Values[0];
+ Error(StrBuf.str());
+ return;
+ }
+ V->setName(StringRef(ConvertedName.data(), ConvertedName.size()));
+ return;
+ }
+ case naclbitc::VST_CODE_BBENTRY: {
+ // VST_BBENTRY: [bbid, namechar x N]
+ // For now, since we aren't processing function blocks, don't handle.
+ if (AllowBbEntries) {
+ Error("Valuesymtab bb entry not implemented");
+ return;
+ }
+ break;
+ }
+ default:
+ break;
+ }
+ // If reached, don't know how to handle record.
+ BlockParser::ProcessRecord();
+ return;
+}
+
+/// Parses the module block in the bitcode file.
+class ModuleParser : public BlockParser {
+public:
+ ModuleParser(unsigned BlockID, TopLevelParser *Context)
+ : BlockParser(BlockID, Context) {}
+
+ virtual ~ModuleParser() LLVM_OVERRIDE {}
+
+protected:
+ virtual bool ParseBlock(unsigned BlockID) LLVM_OVERRIDE;
+
+ virtual void ProcessRecord() LLVM_OVERRIDE;
+};
+
+// Dispatches a block nested inside the module block to the parser for
+// its kind: types, globals and the value symbol table each get their
+// own parser, and blockinfo is handled by NaClBitcodeParser. Function
+// blocks are not implemented yet, so they are reported and skipped.
+// Anything else goes to the default BlockParser handling. The return
+// value is whatever the selected parser returns.
+//
+// Note: the override specifier belongs only on the in-class
+// declaration, so it is not repeated on this out-of-class definition.
+bool ModuleParser::ParseBlock(unsigned BlockID) {
+  switch (BlockID) {
+  case naclbitc::BLOCKINFO_BLOCK_ID:
+    return NaClBitcodeParser::ParseBlock(BlockID);
+  case naclbitc::TYPE_BLOCK_ID_NEW: {
+    TypesParser Parser(BlockID, this);
+    return Parser.ParseThisBlock();
+  }
+  case naclbitc::GLOBALVAR_BLOCK_ID: {
+    GlobalsParser Parser(BlockID, this);
+    return Parser.ParseThisBlock();
+  }
+  case naclbitc::VALUE_SYMTAB_BLOCK_ID: {
+    // Module-level symbol table: basic-block entries are not allowed.
+    ValuesymtabParser Parser(BlockID, this, false);
+    return Parser.ParseThisBlock();
+  }
+  case naclbitc::FUNCTION_BLOCK_ID: {
+    Error("Function block parser not yet implemented, skipping");
+    SkipBlock();
+    return false;
+  }
+  default:
+    return BlockParser::ParseBlock(BlockID);
+  }
+}
+
+// Handles the records that appear directly in the module block.
+//   VERSION  - reports an error unless the version is 1.
+//   FUNCTION - validates the function type, calling convention and
+//              linkage, creates the LLVM function in the module, and
+//              registers it as the next function ID.
+// Any other record is passed to BlockParser::ProcessRecord().
+void ModuleParser::ProcessRecord() {
+  const NaClBitcodeRecord::RecordVector &Values = Record.GetValues();
+  switch (Record.GetCode()) {
+  case naclbitc::MODULE_CODE_VERSION: {
+    // VERSION: [version#]
+    if (checkRecordSize(1, "Module version")) return;
+    unsigned Version = Values[0];
+    if (Version != 1) {
+      std::string Buffer;
+      raw_string_ostream StrBuf(Buffer);
+      StrBuf << "Unknown bitstream version: " << Version;
+      Error(StrBuf.str());
+    }
+    return;
+  }
+  case naclbitc::MODULE_CODE_FUNCTION: {
+    // FUNCTION: [type, callingconv, isproto, linkage]
+    if (checkRecordSize(4, "Function heading")) return;
+    Type *Ty = Context->getTypeByID(Values[0]);
+    FunctionType *FTy = dyn_cast<FunctionType>(Ty);
+    if (FTy == 0) {
+      std::string Buffer;
+      raw_string_ostream StrBuf(Buffer);
+      // Stream the type itself; streaming the pointer would print only
+      // its address. getTypeByID never returns null (it falls back to
+      // the void type), so the dereference is safe.
+      StrBuf << "Function heading expects function type. Found: "
+             << *Ty;
+      Error(StrBuf.str());
+      return;
+    }
+    CallingConv::ID CallingConv;
+    if (!naclbitc::DecodeCallingConv(Values[1], CallingConv)) {
+      std::string Buffer;
+      raw_string_ostream StrBuf(Buffer);
+      StrBuf << "Function heading has unknown calling convention: "
+             << Values[1];
+      Error(StrBuf.str());
+      return;
+    }
+    GlobalValue::LinkageTypes Linkage;
+    if (!naclbitc::DecodeLinkage(Values[3], Linkage)) {
+      std::string Buffer;
+      raw_string_ostream StrBuf(Buffer);
+      StrBuf << "Function heading has unknown linkage. Found "
+             << Values[3];
+      Error(StrBuf.str());
+      return;
+    }
+    Function *Func = Function::Create(FTy, Linkage, "", Context->getModule());
+    Func->setCallingConv(CallingConv);
+    // A zero isproto field marks a function with a body. This must be
+    // recorded before setNextFunctionID, because the implemented-function
+    // list captures the value ID the function is about to receive.
+    if (Values[2] == 0) Context->setNextValueIDAsImplementedFunction();
+    Context->setNextFunctionID(Func);
+    // TODO(kschimpf) verify if Func matches PNaCl ABI.
+    return;
+  }
+  default:
+    BlockParser::ProcessRecord();
+    return;
+  }
+}
+
+// Parses a top-level block. A module block is handed to ModuleParser,
+// after which the table of global addresses is dumped to errs() as a
+// temporary debugging aid. Any other block is handed to a plain
+// BlockParser, whose default handlers produce the error message.
+bool TopLevelParser::ParseBlock(unsigned BlockID) {
+  if (BlockID == naclbitc::MODULE_BLOCK_ID) {
+    ModuleParser Parser(BlockID, this);
+    bool Results = Parser.ParseThisBlock();
jvoung (off chromium) 2014/07/01 17:32:53 Singular Result? Otherwise it sounds like a collec
Karl 2014/07/01 21:31:06 Done.
+    // TODO(kschimpf): Remove once translating function blocks.
+    errs() << "Global addresses:\n";
+    for (size_t i = 0; i < ValueIDValues.size(); ++i) {
+      errs() << "[" << i << "]: ";
+      // A slot stays null when a global variable ID was reserved but
+      // never defined (malformed input); print a marker instead of
+      // dereferencing the null handle.
+      if (Value *V = ValueIDValues[i])
+        errs() << *V;
+      else
+        errs() << "<undefined>";
+      errs() << "\n";
jvoung (off chromium) 2014/07/01 17:32:53 How will this eventually transition? This starts t
Karl 2014/07/01 21:31:08 I need to implement a FunctionParser. It will have
+    }
+    return Results;
+  }
+  // Generate error message by using default block implementation.
+  BlockParser Parser(BlockID, this);
+  return Parser.ParseThisBlock();
+}
+
+}
+
+namespace Ice {
+
+// Reads the PNaCl bitcode named by IRFilename (loaded through
+// MemoryBuffer::getFileOrSTDIN), checks its size and header, and parses
+// it with TopLevelParser. Returns 0 when the input holds exactly one
+// module and no errors were reported, and 1 otherwise; the returned
+// value is also stored in ExitStatus on every path.
+int PNaClTranslator::translate(std::string IRFilename) {
+  OwningPtr<MemoryBuffer> MemBuf;
+  if (error_code ec =
+          MemoryBuffer::getFileOrSTDIN(IRFilename.c_str(), MemBuf)) {
+    errs() << "Error reading '" << IRFilename << "': "
+           << ec.message() << "\n";
+    return ExitStatus = 1;
+  }
+
+  if (MemBuf->getBufferSize() % 4 != 0) {
+    errs() << IRFilename
+           << ": Bitcode stream should be a multiple of 4 bytes in length.\n";
+    return ExitStatus = 1;
+  }
+
+  const unsigned char *BufPtr =
+      reinterpret_cast<const unsigned char *>(MemBuf->getBufferStart());
+  const unsigned char *EndBufPtr = BufPtr + MemBuf->getBufferSize();
+
+  // Read header and verify it is good.
+  NaClBitcodeHeader Header;
+  if (Header.Read(BufPtr, EndBufPtr) || !Header.IsSupported()) {
+    errs() << "Invalid PNaCl bitcode header.\n";
+    return ExitStatus = 1;
+  }
+
+  // Create a bitstream reader to read the bitcode file.
+  NaClBitstreamReader InputStreamFile(BufPtr, EndBufPtr);
+  NaClBitstreamCursor InputStream(InputStreamFile);
+
+  OwningPtr<Module> Mod(
+      new Module(MemBuf->getBufferIdentifier(), getGlobalContext()));
+
+  Mod->setDataLayout(PNaClDataLayout);
+
+  TopLevelParser Parser(&*Mod, Header, InputStream);
jvoung (off chromium) 2014/07/01 17:32:52 Mod.get(), if you just want the raw pointer. Or m
Karl 2014/07/01 21:31:07 Moved into Parser constructor.
+  int TopLevelBlocks = 0;
+  while (!InputStream.AtEndOfStream()) {
+    // Record the failure in ExitStatus as every other exit path does.
+    if (Parser.Parse()) return ExitStatus = 1;
+    ++TopLevelBlocks;
+  }
+
+  // Exactly one module is required. The empty case gets its own message
+  // so it is not reported as "more than one".
+  if (TopLevelBlocks == 0) {
+    errs() << IRFilename << ": Contains no module.\n";
+    return ExitStatus = 1;
+  }
+  if (TopLevelBlocks != 1) {
+    errs() << IRFilename << ": Contains more than one module. Found: "
+           << TopLevelBlocks << "\n";
+    return ExitStatus = 1;
+  }
+
+  return ExitStatus = (Parser.getNumErrors() > 0);
+}
+
+}
« src/PNaClTranslator.h ('K') | « src/PNaClTranslator.h ('k') | src/llvm2ice.cpp » ('j') | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698