src/PNaClTranslator.cpp - Issue 361733002: Update Subzero to start parsing PNaCl bitcode files.

Unified Diff: src/PNaClTranslator.cpp

Issue 361733002: Update Subzero to start parsing PNaCl bitcode files. (Closed) Base URL: https://chromium.googlesource.com/native_client/pnacl-subzero.git@master

Patch Set: Fix more nits. Created 6 years, 6 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: src/PNaClTranslator.cpp

diff --git a/src/PNaClTranslator.cpp b/src/PNaClTranslator.cpp

new file mode 100644

index 0000000000000000000000000000000000000000..327f35fdf5e82a946aa8612a0eac30390bad09a4

--- /dev/null

+++ b/src/PNaClTranslator.cpp

@@ -0,0 +1,872 @@

+//===- subzero/src/PNaClTranslator.cpp - Builds ICE from PNaCl bitcode ----===//

+//

+// The Subzero Code Generator

+//

+// This file is distributed under the University of Illinois Open Source

+// License. See LICENSE.TXT for details.

+//

+//===----------------------------------------------------------------------===//

+//

+// This file implements the PNaCl bitcode file to Ice translator.

+//

+//===----------------------------------------------------------------------===//

+#include "PNaClTranslator.h"

+#include "llvm/Bitcode/NaCl/NaClBitcodeDecoders.h"

+#include "llvm/Bitcode/NaCl/NaClBitcodeHeader.h"

+#include "llvm/Bitcode/NaCl/NaClBitcodeParser.h"

+#include "llvm/Bitcode/NaCl/NaClReaderWriter.h"

+#include "llvm/IR/Constants.h"

+#include "llvm/IR/LLVMContext.h"

+#include "llvm/IR/Module.h"

+#include "llvm/Support/Format.h"

+#include "llvm/Support/MemoryBuffer.h"

+#include "llvm/Support/raw_ostream.h"

+#include "llvm/Support/ValueHandle.h"

+#include <vector>

+#include <cassert>

+using namespace llvm;

+namespace {

+// Top-level class to read PNaCl bitcode files, and translate to ICE.

+class TopLevelParser : public NaClBitcodeParser {

+ TopLevelParser(const TopLevelParser&) LLVM_DELETED_FUNCTION;

+ void operator=(const TopLevelParser&) LLVM_DELETED_FUNCTION;

jvoung (off chromium) 2014/07/01 17:32:52 I think for Subzero, Jim has been using: T &opera

Karl 2014/07/01 21:31:07 Done.

+public:

+ TopLevelParser(Module *Mod,

jvoung (off chromium) 2014/07/01 17:32:52 It would be good to clarify what state the incomin

Karl 2014/07/01 21:31:07 I hadn't really worried about this because these c

+ NaClBitcodeHeader &Header,

+ NaClBitstreamCursor &Cursor)

+ : NaClBitcodeParser(Cursor),

+ Mod(Mod),

+ Header(Header),

+ NumErrors(),

jvoung (off chromium) 2014/07/01 17:32:53 initialize to 0?

Karl 2014/07/01 21:31:06 Definitely!

jvoung (off chromium) 2014/07/02 17:00:15 Okay, using () does initialize to zero, but it see

Karl 2014/07/02 18:09:54 Adding zero to be more clear.

+ NumFunctionIds(0),

+ GlobalVarPlaceHolderType(0) {}

+ // Destructor. LLVM_OVERRIDE must precede the body (as on the other parser

+ // destructors in this file); placing it after `{}` is ill-formed.

+ virtual ~TopLevelParser() LLVM_OVERRIDE {}

+ virtual bool Error(const std::string &Message) LLVM_OVERRIDE {

+ ++NumErrors;

+ return NaClBitcodeParser::Error(Message);

+ }

+ /// Returns the number of errors found while parsing the bitcode

+ /// file.

+ unsigned getNumErrors() const {

+ return NumErrors;

+ }

+ /// Returns the LLVM module associated with the translation.

+ Module *getModule() {

+ return Mod;

+ }

+ /// Returns the number of bytes in the bitcode header.

+ size_t getHeaderSize() {

jvoung (off chromium) 2014/07/01 17:32:53 Some of these other methods are const too?

Karl 2014/07/01 21:31:06 Done.

+ return Header.getHeaderSize();

+ }

+ /// Returns the llvm context to use.

+ LLVMContext &getLLVMContext() {

+ return Mod->getContext();

+ }

+ /// Changes the size of the type list to the given size.

+ void resizeTypeIDValues(unsigned NewSize) {

+ TypeIDValues.resize(NewSize);

+ }

+ /// Returns the type associated with the given index.

+ Type *getTypeByID(unsigned ID) {

+ Type *Ty = ID < TypeIDValues.size() ? TypeIDValues[ID] : 0;

jvoung (off chromium) 2014/07/01 17:32:53 Clarify that the array could really end up storing

Karl 2014/07/01 21:31:08 Done.

+ if (Ty) return Ty;

+ return reportTypeIDAsUndefined(ID);

+ }

+ /// Defines type for ID.

+ void setTypeID(unsigned ID, Type *Ty) {

+ if (ID < TypeIDValues.size() && TypeIDValues[ID] == 0) {

+ TypeIDValues[ID] = Ty;

+ return;

+ }

+ reportBadSetTypeID(ID, Ty);

+ }

+ /// Sets the next function ID to the given LLVM function.

+ void setNextFunctionID(Function *Fcn) {

+ ++NumFunctionIds;

+ ValueIDValues.push_back(Fcn);

+ }

+ /// Defines the next function ID as one that has an implementation

+ /// (i.e. a corresponding function block in the bitcode).

+ void setNextValueIDAsImplementedFunction() {

+ DefiningFunctionsList.push_back(ValueIDValues.size());

+ }

+ /// Returns the LLVM IR value associated with the global value ID.

+ Value *getGlobalValueByID(unsigned ID) {

+ if (ID >= ValueIDValues.size()) return 0;

+ return ValueIDValues[ID];

+ }

+ /// Returns the number of function addresses (i.e. ID's) defined in

+ /// the bitcode file.

+ unsigned getNumFunctionIDs() {

jvoung (off chromium) 2014/07/01 17:32:52 const

Karl 2014/07/01 21:31:08 Done.

+ return NumFunctionIds;

+ }

+ /// Returns the number of global values defined in the bitcode

+ /// file.

+ unsigned getNumGlobalValueIDs() {

+ return ValueIDValues.size();

+ }

+ /// Resizes the list of value IDs to include Count global

+ /// variable IDs.

+ void resizeValueIDsForGlobalVarCount(unsigned Count) {

+ ValueIDValues.resize(ValueIDValues.size() + Count);

+ }

+ /// Returns the global variable address associated with the given

+ /// value ID. If the ID refers to a global variable address not yet

+ /// defined, a placeholder is created so that we can fix it up

+ /// later.

+ Constant *getOrCreateGlobalVarRef(unsigned ID) {

+ if (ID >= ValueIDValues.size()) return 0;

+ if (Value *C = ValueIDValues[ID])

+ return dyn_cast<Constant>(C);

+ if (GlobalVarPlaceHolderType == 0)

jvoung (off chromium) 2014/07/01 17:32:53 Why not just eagerly initialize it in the class's

Karl 2014/07/01 21:31:06 Done.

+ GlobalVarPlaceHolderType = Type::getInt8Ty(getLLVMContext());

+ Constant *C =

+ new GlobalVariable(*Mod, GlobalVarPlaceHolderType, false,

+ GlobalValue::ExternalLinkage, 0);

+ ValueIDValues[ID] = C;

+ return C;

+ }

+ /// Assigns the given global variable (address) to the given value

+ /// ID. Returns true if ID is a valid global variable ID. Otherwise

+ /// returns false.

+ bool assignGlobalVariable(GlobalVariable *GV, unsigned ID) {

+ if (ID < NumFunctionIds || ID >= ValueIDValues.size()) return false;

+ WeakVH &OldV = ValueIDValues[ID];

+ if (OldV == 0) {

+ ValueIDValues[ID] = GV;

+ return true;

+ }

+ // If reached, there was a forward reference to this value. Replace it.

+ Value *PrevVal = OldV;

+ GlobalVariable *Placeholder = cast<GlobalVariable>(PrevVal);

+ Placeholder->replaceAllUsesWith(

+ ConstantExpr::getBitCast(GV, Placeholder->getType()));

+ Placeholder->eraseFromParent();

+ ValueIDValues[ID] = GV;

+ return true;

+ }

+private:

+ // The parsed module.

+ Module *Mod;

+ // The bitcode header.

+ NaClBitcodeHeader &Header;

+ // The number of errors reported.

+ unsigned NumErrors;

+ // The types associated with each type ID.

+ std::vector<Type*> TypeIDValues;

+ // The (global) value IDs.

+ std::vector<WeakVH> ValueIDValues;

+ // The number of function IDs.

+ unsigned NumFunctionIds;

+ // The list of value IDs (in the order found) of defining function

+ // addresses.

+ std::vector<unsigned> DefiningFunctionsList;

+ // Cached global variable placeholder type. Used for all forward

+ // references to global variable addresses.

+ Type *GlobalVarPlaceHolderType;

+ virtual bool ParseBlock(unsigned BlockID) LLVM_OVERRIDE;

+ /// Reports that type ID is undefined, and then returns

+ /// the void type.

+ Type *reportTypeIDAsUndefined(unsigned ID);

+ /// Reports error about bad call to setTypeID.

+ void reportBadSetTypeID(unsigned ID, Type *Ty);

+};

+Type *TopLevelParser::reportTypeIDAsUndefined(unsigned ID) {

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

jvoung (off chromium) 2014/07/01 17:32:52 This probably doesn't count as "Subzero core" sinc

Karl 2014/07/01 21:31:06 First off, Jim's comment about not using it is inc

+ StrBuf << "Can't find type for type id: " << ID;

+ Error(StrBuf.str());

+ Type *Ty = Type::getVoidTy(getLLVMContext());

+ // To reduce error messages, update type list if possible.

+ if (ID < TypeIDValues.size()) TypeIDValues[ID] = Ty;

+ return Ty;

+void TopLevelParser::reportBadSetTypeID(unsigned ID, Type *Ty) {

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

+ if (ID >= TypeIDValues.size()) {

+ StrBuf << "Type index " << ID << " out of range: can't install.";

+ } else {

+ // Must be case that index already defined.

+ StrBuf << "Type index " << ID << " defined as " << *TypeIDValues[ID]

+ << " and " << *Ty << ".";

+ }

+ Error(StrBuf.str());

+// class for parsing blocks within the TopLevelParser.

+class BlockParser : public NaClBitcodeParser {

+protected:

+ // Constructor for nested block parsers.

+ BlockParser(unsigned BlockID, BlockParser *EnclosingParser)

+ : NaClBitcodeParser(BlockID, EnclosingParser),

+ Context(EnclosingParser->Context) {}

+ // Returns a string describing the bit address of the current record

+ // being processed by the block parser.

+ std::string getRecordAddress() const {

jvoung (off chromium) 2014/07/01 17:32:52 could inline this into Error(), then you don't nee

Karl 2014/07/01 21:31:06 Ok. the other uses I had for it has since been rem

+ // The record's start bit is offset by the header size (bytes, hence * 8)

+ // to form the bit position that is reported.

+ uint64_t Bit = Record.GetStartBit() + Context->getHeaderSize() * 8;

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

+ // Rendered as "<byte offset>:<bit within byte>". The spaces around PRIu64

+ // are required: C++11 lexes `"%"PRIu64` as a user-defined literal suffix.

+ StrBuf << format("%" PRIu64 ":%u",

+ (Bit / 8),

+ static_cast<unsigned>(Bit % 8));

+ return StrBuf.str();

+ }

+ virtual bool Error(const std::string &Message) LLVM_OVERRIDE {

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

+ StrBuf << "(" << getRecordAddress() << ") " << Message;

+ return Context->Error(StrBuf.str());

+ }

+public:

+ // Constructor for the top-level module block parser.

+ BlockParser(unsigned BlockID, TopLevelParser *Context)

jvoung (off chromium) 2014/07/01 17:32:52 Why not make this first, before the nested block c

Karl 2014/07/01 21:31:07 Done.

+ : NaClBitcodeParser(BlockID, Context),

+ Context(Context) {}

+ virtual ~BlockParser() LLVM_OVERRIDE {}

+protected:

+ // Default implementation. Reports that block is unknown and skips

+ // its contents.

+ virtual bool ParseBlock(unsigned BlockID) LLVM_OVERRIDE;

+ // Default implementation. Reports that the record is not

+ // understood.

+ virtual void ProcessRecord() LLVM_OVERRIDE;

+ // The context parser that contains the decoded state.

jvoung (off chromium) 2014/07/01 17:32:53 Can we collect the fields in one place, and the me

Karl 2014/07/01 21:31:06 Done.

+ TopLevelParser *Context;

+ /// Checks if the size of the record is Size. If not, an error is

+ /// produced using the given RecordName. Return true if error was

+ /// reported. Otherwise false.

jvoung (off chromium) 2014/07/01 17:32:53 I feel like some of these comments about the error

Karl 2014/07/01 21:31:08 Done.

+ bool checkRecordSize(unsigned Size, const char *RecordName) {

+ const NaClBitcodeRecord::RecordVector &Values = Record.GetValues();

+ if (Values.size() != Size) {

+ return RecordSizeError(Size, RecordName, 0);

+ }

+ return false;

+ }

+ /// Checks if the size of the record is at least as large as the

+ /// LowerLimit. If not, an error is produced using the given

+ /// RecordName. Return true if error was reported. Otherwise false.

+ bool checkRecordSizeAtLeast(unsigned LowerLimit, const char *RecordName) {

+ const NaClBitcodeRecord::RecordVector &Values = Record.GetValues();

+ if (Values.size() < LowerLimit) {

+ return RecordSizeError(LowerLimit, RecordName, "at least");

+ }

+ return false;

+ }

+ /// Checks if the size of the record is no larger than the

+ /// UpperLimit. If not, an error is produced using the given

+ /// RecordName. Return true if error was reported. Otherwise false.

+ bool checkRecordSizeNoMoreThan(unsigned UpperLimit, const char *RecordName) {

+ const NaClBitcodeRecord::RecordVector &Values = Record.GetValues();

+ if (Values.size() > UpperLimit) {

+ return RecordSizeError(UpperLimit, RecordName, "no more than");

+ }

+ return false;

+ }

+ /// Checks if the size of the record is at least as large as the

+ /// LowerLimit, and no larger than the UpperLimit. If not, an error

+ /// is produced using the given RecordName. Return true if error was

+ /// reported. Otherwise false.

+ bool checkRecordSizeInRange(unsigned LowerLimit, unsigned UpperLimit,

+ const char *RecordName) {

+ return checkRecordSizeAtLeast(LowerLimit, RecordName)

+ || checkRecordSizeNoMoreThan(UpperLimit, RecordName);

+ }

+private:

+ /// Generates a record size error. ExpectedSize is the number

+ /// of elements expected. RecordName is the name of the kind of

+ /// record that has incorrect size. ContextMessage (if not 0)

+ /// is appended to "record expects" to describe how ExpectedSize

+ /// should be interpreted.

+ bool RecordSizeError(unsigned ExpectedSize,

+ const char *RecordName,

+ const char *ContextMessage) {

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

+ StrBuf << RecordName << " record expects";

+ if (ContextMessage) StrBuf << " " << ContextMessage;

+ StrBuf << " " << ExpectedSize << " argument";

+ if(ExpectedSize > 1) StrBuf << "s";

+ StrBuf << ". Found: " << Record.GetValues().size();

+ return Error(StrBuf.str());

+ }

+};

+bool BlockParser::ParseBlock(unsigned BlockID) {

jvoung (off chromium) 2014/07/01 17:32:53 I wonder if this class should be called something

Karl 2014/07/01 21:31:07 Done.

+ // If called, derived class doesn't know how to handle block.

+ // Report error and skip.

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

+ StrBuf << "Don't know how to parse block id: " << BlockID;

+ Error(StrBuf.str());

+ SkipBlock();

+ return false;

+void BlockParser::ProcessRecord() {

+ // If called, derived class doesn't know how to handle.

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

+ StrBuf << "Don't know how to process record: " << Record;

+ Error(StrBuf.str());

+// Class to parse a types block.

+class TypesParser : public BlockParser {

+public:

+ TypesParser(unsigned BlockID, BlockParser *EnclosingParser)

+ : BlockParser(BlockID, EnclosingParser), NextTypeId(0) {}

+ ~TypesParser() LLVM_OVERRIDE {}

+protected:

+ virtual void ProcessRecord() LLVM_OVERRIDE;

+ // The type ID that will be associated with the next type defining

+ // record in the types block.

+ unsigned NextTypeId;

+};

+void TypesParser::ProcessRecord() {

+ Type *Ty = 0;

+ const NaClBitcodeRecord::RecordVector &Values = Record.GetValues();

+ switch (Record.GetCode()) {

+ case naclbitc::TYPE_CODE_NUMENTRY:

+ // NUMENTRY: [numentries]

+ if (checkRecordSize(1, "Type count")) return;

+ Context->resizeTypeIDValues(Values[0]);

+ return;

+ case naclbitc::TYPE_CODE_VOID:

+ // VOID

+ if (checkRecordSize(0, "Type void")) break;

+ Ty = Type::getVoidTy(Context->getLLVMContext());

+ break;

+ case naclbitc::TYPE_CODE_FLOAT:

+ // FLOAT

+ if (checkRecordSize(0, "Type float")) break;

+ Ty = Type::getFloatTy(Context->getLLVMContext());

+ break;

+ case naclbitc::TYPE_CODE_DOUBLE:

+ // DOUBLE

+ if (checkRecordSize(0, "Type double")) break;

+ Ty = Type::getDoubleTy(Context->getLLVMContext());

+ break;

+ case naclbitc::TYPE_CODE_INTEGER:

+ // INTEGER: [width]

+ if (checkRecordSize(1, "Type integer")) break;

+ Ty = IntegerType::get(Context->getLLVMContext(), Values[0]);

+ // TODO(kschimpf) Check if size is legal.

+ break;

+ case naclbitc::TYPE_CODE_VECTOR:

+ // VECTOR: [numelts, eltty]

+ if (checkRecordSize(2, "Type vector")) break;

+ Ty = VectorType::get(Context->getTypeByID(Values[1]), Values[0]);

+ break;

+ case naclbitc::TYPE_CODE_FUNCTION: {

+ // FUNCTION: [vararg, retty, paramty x N]

+ if (checkRecordSizeAtLeast(2, "Type signature")) break;

+ SmallVector<Type *, 8> ArgTys;

+ for (unsigned i = 2, e = Values.size(); i != e; ++i) {

+ ArgTys.push_back(Context->getTypeByID(Values[i]));

+ }

+ Ty = FunctionType::get(Context->getTypeByID(Values[1]),

+ ArgTys, Values[0]);

+ break;

+ }

+ default:

+ BlockParser::ProcessRecord();

+ break;

+ }

+ // If Ty not defined, assume error. Use void as filler.

+ if (Ty == 0)

+ Ty = Type::getVoidTy(Context->getLLVMContext());

+ Context->setTypeID(NextTypeId++, Ty);

+/// Parses the globals block (i.e. global variables).

+class GlobalsParser : public BlockParser {

+public:

+ GlobalsParser(unsigned BlockID, BlockParser *EnclosingParser)

+ : BlockParser(BlockID, EnclosingParser),

+ InitializersNeeded(0),

+ Alignment(1),

+ IsConstant(false) {

+ NextGlobalID = Context->getNumFunctionIDs();

+ }

+ virtual ~GlobalsParser() LLVM_OVERRIDE {}

+protected:

+ virtual void ExitBlock() LLVM_OVERRIDE {

+ verifyNoMissingInitializers();

+ unsigned NumIDs = Context->getNumGlobalValueIDs();

+ if (NextGlobalID < NumIDs) {

+ unsigned NumFcnIDs = Context->getNumFunctionIDs();

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

+ StrBuf << "Globals block expects "

+ << (NumIDs - NumFcnIDs)

+ << " global definitions. Found: "

+ << (NextGlobalID - NumFcnIDs);

+ Error(StrBuf.str());

+ }

+ BlockParser::ExitBlock();

+ }

+ virtual void ProcessRecord() LLVM_OVERRIDE;

+ // Holds the sequence of initializers for the global.

+ SmallVector<Constant *, 10> Initializers;

jvoung (off chromium) 2014/07/01 17:32:53 Similar, can we put all the fields in one block, a

Karl 2014/07/01 21:31:07 Done.

+ // Keeps track of how many initializers are expected for

+ // the global variable being built.

+ unsigned InitializersNeeded;

+ // The alignment assumed for the global variable being built.

+ unsigned Alignment;

+ // True if the global variable being built is a constant.

+ bool IsConstant;

+ // The index of the next global variable.

+ unsigned NextGlobalID;

+ // Checks if the number of initializers needed is the same as the

+ // number found in the bitcode file. If different, an error message

+ // is generated, and the internal state of the parser is fixed so

+ // this condition is no longer violated.

+ void verifyNoMissingInitializers() {

+ if (InitializersNeeded != Initializers.size()) {

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

+ StrBuf << "Global variable @g"

+ << (NextGlobalID - Context->getNumFunctionIDs())

+ << " expected " << InitializersNeeded << " initializer";

+ if (InitializersNeeded > 1) StrBuf << "s";

+ StrBuf << ". Found: " << Initializers.size();

+ Error(StrBuf.str());

+ // Fix up state so that we can continue.

+ InitializersNeeded = Initializers.size();

+ installGlobalVar();

+ }

+ // Reserves a slot in the list of initializers being built. If there

+ // isn't room for the slot, an error message is generated.

+ void reserveInitializer(const char *RecordName) {

+ if (InitializersNeeded == Initializers.size()) {

jvoung (off chromium) 2014/07/01 17:32:52 Would it be safer to check if >= ? Otherwise, it l

Karl 2014/07/01 21:31:07 I did this so that we wouldn't get cascading error

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

+ StrBuf << RecordName << " record: Too many initializers, ignoring.";

jvoung (off chromium) 2014/07/01 17:32:52 Probably could have just std::string() + ... for t

Karl 2014/07/01 21:31:07 Done.

+ Error(StrBuf.str());

+ }

+ // Takes the initializers (and other parser state values) and

+ // installs a global variable (with the initializers) into the list

+ // of ValueIDs.

+ void installGlobalVar() {

+ Constant *Init = 0;

+ switch (Initializers.size()) {

+ case 0:

+ Error("No initializer for global variable in global vars block");

+ return;

+ case 1:

+ Init = Initializers[0];

+ break;

+ default:

+ Init = ConstantStruct::getAnon(Context->getLLVMContext(),

+ Initializers, true);

+ break;

+ }

+ GlobalVariable *GV = new GlobalVariable(

+ *Context->getModule(), Init->getType(), IsConstant,

+ GlobalValue::InternalLinkage, Init, "");

+ GV->setAlignment(Alignment);

+ if (!Context->assignGlobalVariable(GV, NextGlobalID)) {

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

+ StrBuf << "Defining global V[" << NextGlobalID

+ << "] not allowed. Out of range.";

+ Error(StrBuf.str());

+ }

+ ++NextGlobalID;

+ Initializers.clear();

+ InitializersNeeded = 0;

+ Alignment = 1;

+ IsConstant = false;

+ }

+};

+// Processes one record of the globals block. COUNT sizes the global value ID

+// list, VAR starts a new global variable (alignment and constness), COMPOUND

+// sets how many initializers the variable takes, and ZEROFILL/DATA/RELOC each

+// append one initializer. Once the expected number of initializers has been

+// collected, the global variable is installed.

+void GlobalsParser::ProcessRecord() {

+ const NaClBitcodeRecord::RecordVector &Values = Record.GetValues();

+ switch (Record.GetCode()) {

+ case naclbitc::GLOBALVAR_COUNT:

+ // COUNT: [n]

+ if (checkRecordSize(1, "Globals count")) return;

+ if (NextGlobalID > Context->getNumFunctionIDs()) {

jvoung (off chromium) 2014/07/01 17:32:52 I can't put my finger on it, but this checks seems

Karl 2014/07/01 21:31:07 The test is to verify it appears before any global

+ Error("Globals count record not first in block.");

+ return;

+ }

+ verifyNoMissingInitializers();

+ Context->resizeValueIDsForGlobalVarCount(Values[0]);

+ return;

+ case naclbitc::GLOBALVAR_VAR: {

+ // VAR: [align, isconst]

+ if (checkRecordSize(2, "Globals variable")) return;

+ verifyNoMissingInitializers();

+ InitializersNeeded = 1;

+ Initializers.clear();

+ // Values[0] encodes the alignment as log2(alignment) + 1 (0 yields 0).

+ // NOTE(review): Values[0] is not range checked here; a large value would

+ // overflow the int shift.

+ Alignment = (1 << Values[0]) >> 1;

+ // The constant flag is the second field; the first is the alignment.

+ IsConstant = Values[1] != 0;

jvoung (off chromium) 2014/07/01 17:32:52 Values[1] != 0 Otherwise, the alignment could mak

Karl 2014/07/01 21:31:08 Done.

+ return;

+ }

+ case naclbitc::GLOBALVAR_COMPOUND:

+ // COMPOUND: [size]

+ if (checkRecordSize(1, "globals compound")) return;

+ if (Initializers.size() > 0 || InitializersNeeded != 1) {

+ Error("Globals compound record not first initializer");

+ return;

+ }

+ if (Values[0] < 2) {

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

+ StrBuf << "Globals compound record size invalid. Found: "

+ << Values[0];

+ Error(StrBuf.str());

+ return;

+ }

+ InitializersNeeded = Values[0];

+ return;

+ case naclbitc::GLOBALVAR_ZEROFILL: {

+ // ZEROFILL: [size]

+ if (checkRecordSize(1, "Globals zerofill")) return;

+ reserveInitializer("Globals zerofill");

+ Type *Ty = ArrayType::get(Type::getInt8Ty(Context->getLLVMContext()),

+ Values[0]);

+ Constant *Zero = ConstantAggregateZero::get(Ty);

+ Initializers.push_back(Zero);

+ break;

+ }

+ case naclbitc::GLOBALVAR_DATA: {

+ // DATA: [b0, b1, ...]

+ if (checkRecordSizeAtLeast(1, "Globals data")) return;

+ reserveInitializer("Globals data");

+ unsigned Size = Values.size();

+ uint8_t *Buf = new uint8_t[Size];

+ assert(Buf);

+ // Element-wise copy: each record value is narrowed to a byte.

+ for (unsigned i = 0; i < Size; ++i)

jvoung (off chromium) 2014/07/01 17:32:53 could memcpy this?

Karl 2014/07/01 21:31:07 Not really. We are doing a cast from uint64_t to u

+ Buf[i] = Values[i];

+ Constant *Init = ConstantDataArray::get(

+ Context->getLLVMContext(),

+ ArrayRef<uint8_t>(Buf, Buf + Size));

+ Initializers.push_back(Init);

+ delete[] Buf;

+ break;

+ }

+ case naclbitc::GLOBALVAR_RELOC: {

+ // RELOC: [val, [addend]]

+ // NOTE(review): unlike ZEROFILL and DATA, this case does not call

+ // reserveInitializer() before appending; confirm that is intended.

+ if (checkRecordSizeInRange(1, 2, "Globals reloc")) return;

+ Constant *BaseVal =

+ Context->getOrCreateGlobalVarRef(Values[0]);

+ if (BaseVal == 0) {

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

+ StrBuf << "Can't find global relocation value: " << Values[0];

+ Error(StrBuf.str());

+ return;

+ }

+ Type *IntPtrType = IntegerType::get(Context->getLLVMContext(), 32);

+ Constant *Val = ConstantExpr::getPtrToInt(BaseVal, IntPtrType);

+ if (Values.size() == 2) {

+ Val = ConstantExpr::getAdd(Val, ConstantInt::get(IntPtrType, Values[1]));

+ }

+ Initializers.push_back(Val);

+ break;

+ }

+ default:

+ BlockParser::ProcessRecord();

+ return;

+ }

+ // If reached, just processed another initializer. See if time

+ // to install global.

+ if (InitializersNeeded == Initializers.size()) installGlobalVar();

+}

+// Parses a valuesymtab block in the bitcode file.

+class ValuesymtabParser : public BlockParser {

+ typedef SmallString<128> StringType;

+public:

+ ValuesymtabParser(unsigned BlockID,

+ BlockParser *EnclosingParser,

jvoung (off chromium) 2014/07/01 17:32:53 indent to line up to after the ( ? There is "make

Karl 2014/07/01 21:31:06 Done.

Jim Stichnoth 2014/07/07 20:50:23 This (modifying unrelated files) is usually becaus

+ bool AllowBbEntries)

+ : BlockParser(BlockID, EnclosingParser),

+ AllowBbEntries(AllowBbEntries) {}

+ virtual ~ValuesymtabParser() LLVM_OVERRIDE {}

+protected:

+ // True if entries to name basic blocks allowed.

+ bool AllowBbEntries;

+ // The last name converted to a string using convertToString.

+ StringType ConvertedName;

+ virtual void ProcessRecord() LLVM_OVERRIDE;

+ void ConvertToString() {

+ ConvertedName.clear();

+ const NaClBitcodeRecord::RecordVector &Values = Record.GetValues();

+ for (size_t i = 1, e = Values.size(); i != e; ++i) {

+ ConvertedName += static_cast<char>(Values[i]);

+ }

+};

+void ValuesymtabParser::ProcessRecord() {

+ const NaClBitcodeRecord::RecordVector &Values = Record.GetValues();

+ switch (Record.GetCode()) {

+ case naclbitc::VST_CODE_ENTRY: {

+ // VST_ENTRY: [valid, namechar x N]

jvoung (off chromium) 2014/07/01 17:32:53 valueID, or something instead of valid

Karl 2014/07/01 21:31:07 Done.

+ if (checkRecordSizeAtLeast(2, "Valuesymtab value entry")) return;

+ ConvertToString();

jvoung (off chromium) 2014/07/01 17:32:52 Feels a bit roundabout that ConvertedName is a fie

Karl 2014/07/01 21:31:07 I mainly did this to avoid allocations between cal

+ Value *V = Context->getGlobalValueByID(Values[0]);

+ if (V == 0) {

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

+ StrBuf << "Invalid global address ID in valuesymtab: " << Values[0];

+ Error(StrBuf.str());

+ return;

+ }

+ V->setName(StringRef(ConvertedName.data(), ConvertedName.size()));

+ return;

+ }

+ case naclbitc::VST_CODE_BBENTRY: {

+ // VST_BBENTRY: [bbid, namechar x N]

+ // For now, since we aren't processing function blocks, don't handle.

+ if (AllowBbEntries) {

+ Error("Valuesymtab bb entry not implemented");

+ return;

+ }

+ break;

+ }

+ default:

+ break;

+ }

+ // If reached, don't know how to handle record.

+ BlockParser::ProcessRecord();

+ return;

+/// Parses the module block in the bitcode file.

+class ModuleParser : public BlockParser {

+public:

+ ModuleParser(unsigned BlockID, TopLevelParser *Context)

+ : BlockParser(BlockID, Context) {}

+ virtual ~ModuleParser() LLVM_OVERRIDE {}

+protected:

+ virtual bool ParseBlock(unsigned BlockID) LLVM_OVERRIDE;

+ virtual void ProcessRecord() LLVM_OVERRIDE;

+};

+// Dispatches a block nested in the module block to the parser for its kind

+// (types, globals, valuesymtab). Function blocks are reported as not yet

+// implemented and skipped; unknown blocks go to the BlockParser default.

+// Note: no LLVM_OVERRIDE here; the override specifier is only valid on the

+// in-class declaration, not on an out-of-class definition.

+bool ModuleParser::ParseBlock(unsigned BlockID) {

+ switch (BlockID) {

+ case naclbitc::BLOCKINFO_BLOCK_ID:

+ return NaClBitcodeParser::ParseBlock(BlockID);

+ case naclbitc::TYPE_BLOCK_ID_NEW: {

+ TypesParser Parser(BlockID, this);

+ return Parser.ParseThisBlock();

+ }

+ case naclbitc::GLOBALVAR_BLOCK_ID: {

+ GlobalsParser Parser(BlockID, this);

+ return Parser.ParseThisBlock();

+ }

+ case naclbitc::VALUE_SYMTAB_BLOCK_ID: {

+ // Basic-block entries are not allowed in the module-level symbol table.

+ ValuesymtabParser Parser(BlockID, this, false);

+ return Parser.ParseThisBlock();

+ }

+ case naclbitc::FUNCTION_BLOCK_ID: {

+ Error("Function block parser not yet implemented, skipping");

+ SkipBlock();

+ return false;

+ }

+ default:

+ return BlockParser::ParseBlock(BlockID);

+ }

+}

+// Processes a record that appears directly in the module block: the

+// bitstream version record and function heading records. Any other record

+// is reported through the BlockParser default.

+void ModuleParser::ProcessRecord() {

+ const NaClBitcodeRecord::RecordVector &Values = Record.GetValues();

+ switch (Record.GetCode()) {

+ case naclbitc::MODULE_CODE_VERSION: {

+ // VERSION: [version#]

+ if (checkRecordSize(1, "Module version")) return;

+ unsigned Version = Values[0];

+ if (Version != 1) {

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

+ StrBuf << "Unknown bitstream version: " << Version;

+ Error(StrBuf.str());

+ }

+ return;

+ }

+ case naclbitc::MODULE_CODE_FUNCTION: {

+ // FUNCTION: [type, callingconv, isproto, linkage]

+ if (checkRecordSize(4, "Function heading")) return;

+ Type *Ty = Context->getTypeByID(Values[0]);

+ FunctionType *FTy = dyn_cast<FunctionType>(Ty);

+ if (FTy == 0) {

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

+ // Print the type itself (*Ty); streaming the pointer would only show

+ // its address.

+ StrBuf << "Function heading expects function type. Found: "

+ << *Ty;

+ Error(StrBuf.str());

+ return;

+ }

+ CallingConv::ID CallingConv;

+ if (!naclbitc::DecodeCallingConv(Values[1], CallingConv)) {

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

+ StrBuf << "Function heading has unknown calling convention: "

+ << Values[1];

+ Error(StrBuf.str());

+ return;

+ }

+ GlobalValue::LinkageTypes Linkage;

+ if (!naclbitc::DecodeLinkage(Values[3], Linkage)) {

+ std::string Buffer;

+ raw_string_ostream StrBuf(Buffer);

+ StrBuf << "Function heading has unknown linkage. Found "

+ << Values[3];

+ Error(StrBuf.str());

+ return;

+ }

+ Function *Func = Function::Create(FTy, Linkage, "", Context->getModule());

+ Func->setCallingConv(CallingConv);

+ // isproto == 0 means the function has a body (a function block) in the

+ // bitcode. This must be recorded before the ID is assigned, because

+ // setNextValueIDAsImplementedFunction() uses the current ID count.

+ if (Values[2] == 0) Context->setNextValueIDAsImplementedFunction();

+ Context->setNextFunctionID(Func);

+ // TODO(kschimpf) verify if Func matches PNaCl ABI.

+ return;

+ }

+ default:

+ BlockParser::ProcessRecord();

+ return;

+ }

+}

+// Parses a top-level block. A module block is handed to ModuleParser and the

+// resulting global addresses are dumped to errs(); any other block is handed

+// to the default BlockParser, which reports it as unknown.

+bool TopLevelParser::ParseBlock(unsigned BlockID) {

+ if (BlockID == naclbitc::MODULE_BLOCK_ID) {

+ ModuleParser Parser(BlockID, this);

+ bool Results = Parser.ParseThisBlock();

jvoung (off chromium) 2014/07/01 17:32:53 Singular Result? Otherwise it sounds like a collec

Karl 2014/07/01 21:31:06 Done.

+ // TODO(kschimpf): Remove once translating function blocks.

+ errs() << "Global addresses:\n";

+ for (size_t i = 0; i < ValueIDValues.size(); ++i) {

+ // A slot is still null when the globals count reserved it but no

+ // global variable was ever assigned to it; do not dereference it.

+ errs() << "[" << i << "]: ";

+ if (Value *V = ValueIDValues[i])

+ errs() << *V;

+ else

+ errs() << "<undefined>";

+ errs() << "\n";

jvoung (off chromium) 2014/07/01 17:32:53 How will this eventually transition? This starts t

Karl 2014/07/01 21:31:08 I need to implement a FunctionParser. It will have

+ }

+ return Results;

+ }

+ // Generate error message by using default block implementation.

+ BlockParser Parser(BlockID, this);

+ return Parser.ParseThisBlock();

+}

+namespace Ice {

+// Reads the PNaCl bitcode file IRFilename (or stdin), checks its header, and

+// parses it with TopLevelParser. Every exit path stores the result in

+// ExitStatus and returns it: 0 when parsing reported no errors, 1 otherwise.

+int PNaClTranslator::translate(std::string IRFilename) {

+ OwningPtr<MemoryBuffer> MemBuf;

+ if (error_code ec =

+ MemoryBuffer::getFileOrSTDIN(IRFilename.c_str(), MemBuf)) {

+ errs() << "Error reading '" << IRFilename << "': "

+ << ec.message() << "\n";

+ return ExitStatus = 1;

+ }

+ if (MemBuf->getBufferSize() % 4 != 0) {

+ errs() << IRFilename

+ << ": Bitcode stream should be a multiple of 4 bytes in length.\n";

+ return ExitStatus = 1;

+ }

+ const unsigned char *BufPtr = (const unsigned char *)MemBuf->getBufferStart();

+ const unsigned char *EndBufPtr = BufPtr+MemBuf->getBufferSize();

+ // Read header and verify it is good.

+ NaClBitcodeHeader Header;

+ if (Header.Read(BufPtr, EndBufPtr) || !Header.IsSupported()) {

+ errs() << "Invalid PNaCl bitcode header.\n";

+ return ExitStatus = 1;

+ }

+ // Create a bitstream reader to read the bitcode file.

+ NaClBitstreamReader InputStreamFile(BufPtr, EndBufPtr);

+ NaClBitstreamCursor InputStream(InputStreamFile);

+ OwningPtr<Module> Mod(

+ new Module(MemBuf->getBufferIdentifier(), getGlobalContext()));

+ Mod->setDataLayout(PNaClDataLayout);

+ TopLevelParser Parser(&*Mod, Header, InputStream);

jvoung (off chromium) 2014/07/01 17:32:52 Mod.get(), if you just want the raw pointer. Or m

Karl 2014/07/01 21:31:07 Moved into Parser constructor.

+ int TopLevelBlocks = 0;

+ while (!InputStream.AtEndOfStream()) {

+ // Record the failure in ExitStatus as well, like the other error paths.

+ if (Parser.Parse()) return ExitStatus = 1;

+ ++TopLevelBlocks;

+ }

+ if (TopLevelBlocks != 1) {

+ errs() << IRFilename << ": Contains more than one module. Found: "

+ << TopLevelBlocks << "\n";

+ return ExitStatus = 1;

+ }

+ return ExitStatus = (Parser.getNumErrors() > 0);

+}

« src/PNaClTranslator.h ('K') | « src/PNaClTranslator.h ('k') | src/llvm2ice.cpp » ('j') | no next file with comments »