| Index: src/jsregexp.h
|
| ===================================================================
|
| --- src/jsregexp.h (revision 868)
|
| +++ src/jsregexp.h (working copy)
|
| @@ -30,6 +30,10 @@
|
|
|
| namespace v8 { namespace internal {
|
|
|
| +
|
| +class RegExpMacroAssembler;
|
| +
|
| +
|
| class RegExpImpl {
|
| public:
|
| // Creates a regular expression literal in the old space.
|
| @@ -61,10 +65,28 @@
|
| static Handle<Object> ExecGlobal(Handle<JSRegExp> regexp,
|
| Handle<String> subject);
|
|
|
| + // Stores an uncompiled RegExp pattern in the JSRegExp object.
|
| + // It will be compiled by JSCRE when first executed.
|
| + static Handle<Object> JscrePrepare(Handle<JSRegExp> re,
|
| + Handle<String> pattern,
|
| + JSRegExp::Flags flags);
|
| +
|
| + // Stores a compiled RegExp pattern in the JSRegExp object.
|
| + // The pattern is compiled by Irregexp.
|
| + static Handle<Object> IrregexpPrepare(Handle<JSRegExp> re,
|
| + Handle<String> pattern,
|
| + JSRegExp::Flags flags,
|
| + Handle<FixedArray> irregexp_data);
|
| +
|
| +
|
| + // Compile the pattern using JSCRE and store the result in the
|
| + // JSRegExp object.
|
| + static Handle<Object> JscreCompile(Handle<JSRegExp> re);
|
| +
|
| static Handle<Object> AtomCompile(Handle<JSRegExp> re,
|
| Handle<String> pattern,
|
| - JSRegExp::Flags flags);
|
| -
|
| + JSRegExp::Flags flags,
|
| + Handle<String> match_pattern);
|
| static Handle<Object> AtomExec(Handle<JSRegExp> regexp,
|
| Handle<String> subject,
|
| Handle<Object> index);
|
| @@ -72,47 +94,78 @@
|
| static Handle<Object> AtomExecGlobal(Handle<JSRegExp> regexp,
|
| Handle<String> subject);
|
|
|
| - static Handle<Object> JsreCompile(Handle<JSRegExp> re,
|
| - Handle<String> pattern,
|
| - JSRegExp::Flags flags);
|
| + static Handle<Object> JscreCompile(Handle<JSRegExp> re,
|
| + Handle<String> pattern,
|
| + JSRegExp::Flags flags);
|
|
|
| - static Handle<Object> JsreExec(Handle<JSRegExp> regexp,
|
| - Handle<String> subject,
|
| - Handle<Object> index);
|
| + // Execute a compiled JSCRE pattern.
|
| + static Handle<Object> JscreExec(Handle<JSRegExp> regexp,
|
| + Handle<String> subject,
|
| + Handle<Object> index);
|
|
|
| - static Handle<Object> JsreExecGlobal(Handle<JSRegExp> regexp,
|
| - Handle<String> subject);
|
| + // Execute an Irregexp bytecode pattern.
|
| + static Handle<Object> IrregexpExec(Handle<JSRegExp> regexp,
|
| + Handle<String> subject,
|
| + Handle<Object> index);
|
|
|
| + static Handle<Object> JscreExecGlobal(Handle<JSRegExp> regexp,
|
| + Handle<String> subject);
|
| +
|
| + static Handle<Object> IrregexpExecGlobal(Handle<JSRegExp> regexp,
|
| + Handle<String> subject);
|
| +
|
| static void NewSpaceCollectionPrologue();
|
| static void OldSpaceCollectionPrologue();
|
|
|
| - private:
|
| // Converts a source string to a 16 bit flat string. The string
|
| // will be either sequential or it will be a SlicedString backed
|
| // by a flat string.
|
| static Handle<String> StringToTwoByte(Handle<String> pattern);
|
| static Handle<String> CachedStringToTwoByte(Handle<String> pattern);
|
|
|
| + static const int kIrregexpImplementationIndex = 0;
|
| + static const int kIrregexpNumberOfCapturesIndex = 1;
|
| + static const int kIrregexpNumberOfRegistersIndex = 2;
|
| + static const int kIrregexpCodeIndex = 3;
|
| + static const int kIrregexpDataLength = 4;
|
| +
|
| + static const int kJscreNumberOfCapturesIndex = 0;
|
| + static const int kJscreInternalIndex = 1;
|
| + static const int kJscreDataLength = 2;
|
| +
|
| + private:
|
| static String* last_ascii_string_;
|
| static String* two_byte_cached_string_;
|
|
|
| - // Returns the caputure from the re.
|
| - static int JsreCapture(Handle<JSRegExp> re);
|
| - static ByteArray* JsreInternal(Handle<JSRegExp> re);
|
| + static int JscreNumberOfCaptures(Handle<JSRegExp> re);
|
| + static ByteArray* JscreInternal(Handle<JSRegExp> re);
|
|
|
| + static int IrregexpNumberOfCaptures(Handle<JSRegExp> re);
|
| + static int IrregexpNumberOfRegisters(Handle<JSRegExp> re);
|
| + static Handle<ByteArray> IrregexpCode(Handle<JSRegExp> re);
|
| +
|
| // Call jsRegExpExecute once
|
| - static Handle<Object> JsreExecOnce(Handle<JSRegExp> regexp,
|
| - int num_captures,
|
| - Handle<String> subject,
|
| - int previous_index,
|
| - const uc16* utf8_subject,
|
| - int* ovector,
|
| - int ovector_length);
|
| + static Handle<Object> JscreExecOnce(Handle<JSRegExp> regexp,
|
| + int num_captures,
|
| + Handle<String> subject,
|
| + int previous_index,
|
| + const uc16* utf8_subject,
|
| + int* ovector,
|
| + int ovector_length);
|
|
|
| + static Handle<Object> IrregexpExecOnce(Handle<JSRegExp> regexp,
|
| + int num_captures,
|
| + Handle<String> subject16,
|
| + int previous_index,
|
| + int* ovector,
|
| + int ovector_length);
|
| +
|
| // Set the subject cache. The previous string buffer is not deleted, so the
|
| // caller should ensure that it doesn't leak.
|
| - static void SetSubjectCache(String* subject, char* utf8_subject,
|
| - int uft8_length, int character_position,
|
| + static void SetSubjectCache(String* subject,
|
| + char* utf8_subject,
|
| + int uft8_length,
|
| + int character_position,
|
| int utf8_position);
|
|
|
| // A one element cache of the last utf8_subject string and its length. The
|
| @@ -125,6 +178,640 @@
|
| };
|
|
|
|
|
| +class CharacterRange {
|
| + public:
|
| + CharacterRange() : from_(0), to_(0) { }
|
| + // For compatibility with the CHECK_OK macro
|
| + CharacterRange(void* null) { ASSERT_EQ(NULL, null); } //NOLINT
|
| + CharacterRange(uc16 from, uc16 to) : from_(from), to_(to) { }
|
| + static void AddClassEscape(uc16 type, ZoneList<CharacterRange>* ranges);
|
| + static inline CharacterRange Singleton(uc16 value) {
|
| + return CharacterRange(value, value);
|
| + }
|
| + static inline CharacterRange Range(uc16 from, uc16 to) {
|
| + ASSERT(from <= to);
|
| + return CharacterRange(from, to);
|
| + }
|
| + static inline CharacterRange Everything() {
|
| + return CharacterRange(0, 0xFFFF);
|
| + }
|
| + bool Contains(uc16 i) { return from_ <= i && i <= to_; }
|
| + uc16 from() const { return from_; }
|
| + void set_from(uc16 value) { from_ = value; }
|
| + uc16 to() const { return to_; }
|
| + void set_to(uc16 value) { to_ = value; }
|
| + bool is_valid() { return from_ <= to_; }
|
| + bool IsSingleton() { return (from_ == to_); }
|
| + void AddCaseEquivalents(ZoneList<CharacterRange>* ranges);
|
| + static const int kRangeCanonicalizeMax = 0x346;
|
| + static const int kStartMarker = (1 << 24);
|
| + static const int kPayloadMask = (1 << 24) - 1;
|
| + private:
|
| + uc16 from_;
|
| + uc16 to_;
|
| +};
|
| +
|
| +
|
| +template <typename Node, class Callback>
|
| +static void DoForEach(Node* node, Callback* callback);
|
| +
|
| +
|
| +// A zone splay tree. The config type parameter encapsulates the
|
| +// different configurations of a concrete splay tree:
|
| +//
|
| +// typedef Key: the key type
|
| +// typedef Value: the value type
|
| +// static const kNoKey: the dummy key used when no key is set
|
| +// static const kNoValue: the dummy value used to initialize nodes
|
| +// int (Compare)(Key& a, Key& b) -> {-1, 0, 1}: comparison function
|
| +//
|
| +template <typename Config>
|
| +class ZoneSplayTree : public ZoneObject {
|
| + public:
|
| + typedef typename Config::Key Key;
|
| + typedef typename Config::Value Value;
|
| +
|
| + class Locator;
|
| +
|
| + ZoneSplayTree() : root_(NULL) { }
|
| +
|
| + // Inserts the given key in this tree with the given value. Returns
|
| + // true if a node was inserted, otherwise false. If found the locator
|
| + // is enabled and provides access to the mapping for the key.
|
| + bool Insert(const Key& key, Locator* locator);
|
| +
|
| + // Looks up the key in this tree and returns true if it was found,
|
| + // otherwise false. If the node is found the locator is enabled and
|
| + // provides access to the mapping for the key.
|
| + bool Find(const Key& key, Locator* locator);
|
| +
|
| + // Finds the mapping with the greatest key less than or equal to the
|
| + // given key.
|
| + bool FindGreatestLessThan(const Key& key, Locator* locator);
|
| +
|
| + // Find the mapping with the greatest key in this tree.
|
| + bool FindGreatest(Locator* locator);
|
| +
|
| + // Finds the mapping with the least key greater than or equal to the
|
| + // given key.
|
| + bool FindLeastGreaterThan(const Key& key, Locator* locator);
|
| +
|
| + // Find the mapping with the least key in this tree.
|
| + bool FindLeast(Locator* locator);
|
| +
|
| + // Remove the node with the given key from the tree.
|
| + bool Remove(const Key& key);
|
| +
|
| + bool is_empty() { return root_ == NULL; }
|
| +
|
| + // Perform the splay operation for the given key. Moves the node with
|
| + // the given key to the top of the tree. If no node has the given
|
| + // key, the last node on the search path is moved to the top of the
|
| + // tree.
|
| + void Splay(const Key& key);
|
| +
|
| + class Node : public ZoneObject {
|
| + public:
|
| + Node(const Key& key, const Value& value)
|
| + : key_(key),
|
| + value_(value),
|
| + left_(NULL),
|
| + right_(NULL) { }
|
| + Key key() { return key_; }
|
| + Value value() { return value_; }
|
| + Node* left() { return left_; }
|
| + Node* right() { return right_; }
|
| + private:
|
| + friend class ZoneSplayTree;
|
| + friend class Locator;
|
| + Key key_;
|
| + Value value_;
|
| + Node* left_;
|
| + Node* right_;
|
| + };
|
| +
|
| + // A locator provides access to a node in the tree without actually
|
| + // exposing the node.
|
| + class Locator {
|
| + public:
|
| + explicit Locator(Node* node) : node_(node) { }
|
| + Locator() : node_(NULL) { }
|
| + const Key& key() { return node_->key_; }
|
| + Value& value() { return node_->value_; }
|
| + void set_value(const Value& value) { node_->value_ = value; }
|
| + inline void bind(Node* node) { node_ = node; }
|
| + private:
|
| + Node* node_;
|
| + };
|
| +
|
| + template <class Callback>
|
| + void ForEach(Callback* c) {
|
| + DoForEach<typename ZoneSplayTree<Config>::Node, Callback>(root_, c);
|
| + }
|
| +
|
| + private:
|
| + Node* root_;
|
| +};
|
| +
|
| +
|
| +// A set of unsigned integers that behaves especially well on small
|
| +// integers (< 32). May do zone-allocation.
|
| +class OutSet: public ZoneObject {
|
| + public:
|
| + OutSet() : first_(0), remaining_(NULL), successors_(NULL) { }
|
| + OutSet* Extend(unsigned value);
|
| + bool Get(unsigned value);
|
| + static const unsigned kFirstLimit = 32;
|
| +
|
| + private:
|
| + // Destructively set a value in this set. In most cases you want
|
| + // to use Extend instead to ensure that only one instance exists
|
| + // that contains the same values.
|
| + void Set(unsigned value);
|
| +
|
| + // The successors are a list of sets that contain the same values
|
| + // as this set and the one more value that is not present in this
|
| + // set.
|
| + ZoneList<OutSet*>* successors() { return successors_; }
|
| +
|
| + OutSet(uint32_t first, ZoneList<unsigned>* remaining)
|
| + : first_(first), remaining_(remaining), successors_(NULL) { }
|
| + uint32_t first_;
|
| + ZoneList<unsigned>* remaining_;
|
| + ZoneList<OutSet*>* successors_;
|
| +};
|
| +
|
| +
|
| +// A mapping from integers, specified as ranges, to a set of integers.
|
| +// Used for mapping character ranges to choices.
|
| +class DispatchTable {
|
| + public:
|
| + class Entry {
|
| + public:
|
| + Entry() : from_(0), to_(0), out_set_(NULL) { }
|
| + Entry(uc16 from, uc16 to, OutSet* out_set)
|
| + : from_(from), to_(to), out_set_(out_set) { }
|
| + uc16 from() { return from_; }
|
| + uc16 to() { return to_; }
|
| + void set_to(uc16 value) { to_ = value; }
|
| + void AddValue(int value) { out_set_ = out_set_->Extend(value); }
|
| + OutSet* out_set() { return out_set_; }
|
| + private:
|
| + uc16 from_;
|
| + uc16 to_;
|
| + OutSet* out_set_;
|
| + };
|
| +
|
| + class Config {
|
| + public:
|
| + typedef uc16 Key;
|
| + typedef Entry Value;
|
| + static const uc16 kNoKey;
|
| + static const Entry kNoValue;
|
| + static inline int Compare(uc16 a, uc16 b) {
|
| + if (a == b)
|
| + return 0;
|
| + else if (a < b)
|
| + return -1;
|
| + else
|
| + return 1;
|
| + }
|
| + };
|
| +
|
| + void AddRange(CharacterRange range, int value);
|
| + OutSet* Get(uc16 value);
|
| + void Dump();
|
| +
|
| + template <typename Callback>
|
| + void ForEach(Callback* callback) { return tree()->ForEach(callback); }
|
| + private:
|
| + // There can't be a static empty set since it allocates its
|
| + // successors in a zone and caches them.
|
| + OutSet* empty() { return &empty_; }
|
| + OutSet empty_;
|
| + ZoneSplayTree<Config>* tree() { return &tree_; }
|
| + ZoneSplayTree<Config> tree_;
|
| +};
|
| +
|
| +
|
| +#define FOR_EACH_NODE_TYPE(VISIT) \
|
| + VISIT(End) \
|
| + VISIT(Action) \
|
| + VISIT(Choice) \
|
| + VISIT(BackReference) \
|
| + VISIT(Text)
|
| +
|
| +
|
| +#define FOR_EACH_REG_EXP_TREE_TYPE(VISIT) \
|
| + VISIT(Disjunction) \
|
| + VISIT(Alternative) \
|
| + VISIT(Assertion) \
|
| + VISIT(CharacterClass) \
|
| + VISIT(Atom) \
|
| + VISIT(Quantifier) \
|
| + VISIT(Capture) \
|
| + VISIT(Lookahead) \
|
| + VISIT(BackReference) \
|
| + VISIT(Empty) \
|
| + VISIT(Text)
|
| +
|
| +
|
| +#define FORWARD_DECLARE(Name) class RegExp##Name;
|
| +FOR_EACH_REG_EXP_TREE_TYPE(FORWARD_DECLARE)
|
| +#undef FORWARD_DECLARE
|
| +
|
| +
|
| +class TextElement {
|
| + public:
|
| + enum Type {UNINITIALIZED, ATOM, CHAR_CLASS};
|
| + TextElement() : type(UNINITIALIZED) { }
|
| + explicit TextElement(Type t) : type(t) { }
|
| + static TextElement Atom(RegExpAtom* atom);
|
| + static TextElement CharClass(RegExpCharacterClass* char_class);
|
| + Type type;
|
| + union {
|
| + RegExpAtom* u_atom;
|
| + RegExpCharacterClass* u_char_class;
|
| + } data;
|
| +};
|
| +
|
| +
|
| +struct NodeInfo {
|
| + enum PrecedingInfo {
|
| + UNKNOWN = -1, FALSE = 0, TRUE = 1
|
| + };
|
| +
|
| + NodeInfo()
|
| + : being_analyzed(false),
|
| + been_analyzed(false),
|
| + determine_word(false),
|
| + determine_newline(false),
|
| + determine_start(false),
|
| + follows_word_interest(false),
|
| + follows_newline_interest(false),
|
| + follows_start_interest(false),
|
| + at_end(false),
|
| + follows_word(UNKNOWN),
|
| + follows_newline(UNKNOWN),
|
| + follows_start(UNKNOWN) { }
|
| +
|
| + bool HasSameForwardInterests(NodeInfo* that) {
|
| + return (at_end == that->at_end)
|
| + && (follows_word_interest == that->follows_word_interest)
|
| + && (follows_newline_interest == that->follows_newline_interest)
|
| + && (follows_start_interest == that->follows_start_interest);
|
| + }
|
| +
|
| + // Updates the interests of this node given the interests of the
|
| + // node preceding it.
|
| + void AddFromPreceding(NodeInfo* that) {
|
| + at_end |= that->at_end;
|
| + follows_word_interest |= that->follows_word_interest;
|
| + follows_newline_interest |= that->follows_newline_interest;
|
| + follows_start_interest |= that->follows_start_interest;
|
| + }
|
| +
|
| + // Sets the interests of this node to include the interests of the
|
| + // following node.
|
| + void AddFromFollowing(NodeInfo* that) {
|
| + follows_word_interest |= that->follows_word_interest;
|
| + follows_newline_interest |= that->follows_newline_interest;
|
| + follows_start_interest |= that->follows_start_interest;
|
| + }
|
| +
|
| + bool being_analyzed: 1;
|
| + bool been_analyzed: 1;
|
| +
|
| + // These bits are set if this node must propagate forward information
|
| + // about the last character it consumed (or, in the case of 'start',
|
| + // if it is at the start of the input).
|
| + bool determine_word: 1;
|
| + bool determine_newline: 1;
|
| + bool determine_start: 1;
|
| +
|
| + // These bits are set of this node has to know what the preceding
|
| + // character was.
|
| + bool follows_word_interest: 1;
|
| + bool follows_newline_interest: 1;
|
| + bool follows_start_interest: 1;
|
| +
|
| + bool at_end: 1;
|
| +
|
| + // These bits are set if the node can make assumptions about what
|
| + // the previous character was.
|
| + PrecedingInfo follows_word: 2;
|
| + PrecedingInfo follows_newline: 2;
|
| + PrecedingInfo follows_start: 2;
|
| +};
|
| +
|
| +
|
| +class SiblingList {
|
| + public:
|
| + SiblingList() : list_(NULL) { }
|
| + int length() {
|
| + return list_ == NULL ? 0 : list_->length();
|
| + }
|
| + void Ensure(RegExpNode* parent) {
|
| + if (list_ == NULL) {
|
| + list_ = new ZoneList<RegExpNode*>(2);
|
| + list_->Add(parent);
|
| + }
|
| + }
|
| + void Add(RegExpNode* node) { list_->Add(node); }
|
| + RegExpNode* Get(int index) { return list_->at(index); }
|
| + private:
|
| + ZoneList<RegExpNode*>* list_;
|
| +};
|
| +
|
| +
|
| +class RegExpNode: public ZoneObject {
|
| + public:
|
| + virtual ~RegExpNode() { }
|
| + virtual void Accept(NodeVisitor* visitor) = 0;
|
| + // Generates a goto to this node or actually generates the code at this point.
|
| + // Until the implementation is complete we will return true for success and
|
| + // false for failure.
|
| + virtual bool GoTo(RegExpCompiler* compiler);
|
| + Label* label();
|
| +
|
| + // Until the implementation is complete we will return true for success and
|
| + // false for failure.
|
| + virtual bool Emit(RegExpCompiler* compiler) = 0;
|
| +
|
| + // Propagates the given interest information forward. When seeing
|
| + // \bfoo for instance, the \b is implemented by propagating forward
|
| + // to the 'foo' string that it should only succeed if its first
|
| + // character is a letter xor the previous character was a letter.
|
| + virtual RegExpNode* PropagateForward(NodeInfo* info) = 0;
|
| +
|
| + NodeInfo* info() { return &info_; }
|
| + virtual bool IsBacktrack() { return false; }
|
| + RegExpNode* GetSibling(NodeInfo* info);
|
| + void EnsureSiblings() { siblings_.Ensure(this); }
|
| + void AddSibling(RegExpNode* node) { siblings_.Add(node); }
|
| + protected:
|
| + inline void Bind(RegExpMacroAssembler* macro);
|
| + private:
|
| + Label label_;
|
| + NodeInfo info_;
|
| + SiblingList siblings_;
|
| +};
|
| +
|
| +
|
| +class SeqRegExpNode: public RegExpNode {
|
| + public:
|
| + explicit SeqRegExpNode(RegExpNode* on_success)
|
| + : on_success_(on_success) { }
|
| + RegExpNode* on_success() { return on_success_; }
|
| + void set_on_success(RegExpNode* node) { on_success_ = node; }
|
| + virtual bool Emit(RegExpCompiler* compiler) { return false; }
|
| + private:
|
| + RegExpNode* on_success_;
|
| +};
|
| +
|
| +
|
| +class ActionNode: public SeqRegExpNode {
|
| + public:
|
| + enum Type {
|
| + STORE_REGISTER,
|
| + INCREMENT_REGISTER,
|
| + STORE_POSITION,
|
| + RESTORE_POSITION,
|
| + BEGIN_SUBMATCH,
|
| + ESCAPE_SUBMATCH
|
| + };
|
| + static ActionNode* StoreRegister(int reg, int val, RegExpNode* on_success);
|
| + static ActionNode* IncrementRegister(int reg, RegExpNode* on_success);
|
| + static ActionNode* StorePosition(int reg, RegExpNode* on_success);
|
| + static ActionNode* RestorePosition(int reg, RegExpNode* on_success);
|
| + static ActionNode* BeginSubmatch(int stack_pointer_reg,
|
| + int position_reg,
|
| + RegExpNode* on_success);
|
| + static ActionNode* EscapeSubmatch(int stack_pointer_reg,
|
| + bool and_restore_position,
|
| + int restore_reg,
|
| + RegExpNode* on_success);
|
| + virtual void Accept(NodeVisitor* visitor);
|
| + virtual bool Emit(RegExpCompiler* compiler);
|
| + virtual RegExpNode* PropagateForward(NodeInfo* info);
|
| + private:
|
| + union {
|
| + struct {
|
| + int reg;
|
| + int value;
|
| + } u_store_register;
|
| + struct {
|
| + int reg;
|
| + } u_increment_register;
|
| + struct {
|
| + int reg;
|
| + } u_position_register;
|
| + struct {
|
| + int stack_pointer_register;
|
| + int current_position_register;
|
| + } u_submatch;
|
| + } data_;
|
| + ActionNode(Type type, RegExpNode* on_success)
|
| + : SeqRegExpNode(on_success),
|
| + type_(type) { }
|
| + Type type_;
|
| + friend class DotPrinter;
|
| +};
|
| +
|
| +
|
| +class TextNode: public SeqRegExpNode {
|
| + public:
|
| + TextNode(ZoneList<TextElement>* elms,
|
| + RegExpNode* on_success,
|
| + RegExpNode* on_failure)
|
| + : SeqRegExpNode(on_success),
|
| + on_failure_(on_failure),
|
| + elms_(elms) { }
|
| + virtual void Accept(NodeVisitor* visitor);
|
| + virtual RegExpNode* PropagateForward(NodeInfo* info);
|
| + RegExpNode* on_failure() { return on_failure_; }
|
| + virtual bool Emit(RegExpCompiler* compiler);
|
| + ZoneList<TextElement>* elements() { return elms_; }
|
| + void MakeCaseIndependent();
|
| + private:
|
| + RegExpNode* on_failure_;
|
| + ZoneList<TextElement>* elms_;
|
| +};
|
| +
|
| +
|
| +class BackReferenceNode: public SeqRegExpNode {
|
| + public:
|
| + BackReferenceNode(int start_reg,
|
| + int end_reg,
|
| + RegExpNode* on_success,
|
| + RegExpNode* on_failure)
|
| + : SeqRegExpNode(on_success),
|
| + on_failure_(on_failure),
|
| + start_reg_(start_reg),
|
| + end_reg_(end_reg) { }
|
| + virtual void Accept(NodeVisitor* visitor);
|
| + RegExpNode* on_failure() { return on_failure_; }
|
| + int start_register() { return start_reg_; }
|
| + int end_register() { return end_reg_; }
|
| + virtual bool Emit(RegExpCompiler* compiler);
|
| + virtual RegExpNode* PropagateForward(NodeInfo* info);
|
| + private:
|
| + RegExpNode* on_failure_;
|
| + int start_reg_;
|
| + int end_reg_;
|
| +};
|
| +
|
| +
|
| +class EndNode: public RegExpNode {
|
| + public:
|
| + enum Action { ACCEPT, BACKTRACK };
|
| + explicit EndNode(Action action) : action_(action) { }
|
| + virtual void Accept(NodeVisitor* visitor);
|
| + virtual bool Emit(RegExpCompiler* compiler);
|
| + virtual RegExpNode* PropagateForward(NodeInfo* info);
|
| + virtual bool IsBacktrack() { return action_ == BACKTRACK; }
|
| + virtual bool GoTo(RegExpCompiler* compiler);
|
| + private:
|
| + Action action_;
|
| +};
|
| +
|
| +
|
| +class Guard: public ZoneObject {
|
| + public:
|
| + enum Relation { LT, GEQ };
|
| + Guard(int reg, Relation op, int value)
|
| + : reg_(reg),
|
| + op_(op),
|
| + value_(value) { }
|
| + int reg() { return reg_; }
|
| + Relation op() { return op_; }
|
| + int value() { return value_; }
|
| + private:
|
| + int reg_;
|
| + Relation op_;
|
| + int value_;
|
| +};
|
| +
|
| +
|
| +class GuardedAlternative {
|
| + public:
|
| + explicit GuardedAlternative(RegExpNode* node) : node_(node), guards_(NULL) { }
|
| + void AddGuard(Guard* guard);
|
| + RegExpNode* node() { return node_; }
|
| + void set_node(RegExpNode* node) { node_ = node; }
|
| + ZoneList<Guard*>* guards() { return guards_; }
|
| + private:
|
| + RegExpNode* node_;
|
| + ZoneList<Guard*>* guards_;
|
| +};
|
| +
|
| +
|
| +class ChoiceNode: public RegExpNode {
|
| + public:
|
| + explicit ChoiceNode(int expected_size, RegExpNode* on_failure)
|
| + : on_failure_(on_failure),
|
| + alternatives_(new ZoneList<GuardedAlternative>(expected_size)),
|
| + table_calculated_(false),
|
| + being_calculated_(false) { }
|
| + virtual void Accept(NodeVisitor* visitor);
|
| + void AddAlternative(GuardedAlternative node) { alternatives()->Add(node); }
|
| + ZoneList<GuardedAlternative>* alternatives() { return alternatives_; }
|
| + DispatchTable* table() { return &table_; }
|
| + RegExpNode* on_failure() { return on_failure_; }
|
| + virtual bool Emit(RegExpCompiler* compiler);
|
| + virtual RegExpNode* PropagateForward(NodeInfo* info);
|
| + bool table_calculated() { return table_calculated_; }
|
| + void set_table_calculated(bool b) { table_calculated_ = b; }
|
| + bool being_calculated() { return being_calculated_; }
|
| + void set_being_calculated(bool b) { being_calculated_ = b; }
|
| + private:
|
| + void GenerateGuard(RegExpMacroAssembler* macro_assembler,
|
| + Guard *guard,
|
| + Label* on_failure);
|
| + RegExpNode* on_failure_;
|
| + ZoneList<GuardedAlternative>* alternatives_;
|
| + DispatchTable table_;
|
| + bool table_calculated_;
|
| + bool being_calculated_;
|
| +};
|
| +
|
| +
|
| +class NodeVisitor {
|
| + public:
|
| + virtual ~NodeVisitor() { }
|
| +#define DECLARE_VISIT(Type) \
|
| + virtual void Visit##Type(Type##Node* that) = 0;
|
| +FOR_EACH_NODE_TYPE(DECLARE_VISIT)
|
| +#undef DECLARE_VISIT
|
| +};
|
| +
|
| +
|
| +// Node visitor used to add the start set of the alternatives to the
|
| +// dispatch table of a choice node.
|
| +class DispatchTableConstructor: public NodeVisitor {
|
| + public:
|
| + explicit DispatchTableConstructor(DispatchTable* table)
|
| + : table_(table),
|
| + choice_index_(-1) { }
|
| +
|
| + void BuildTable(ChoiceNode* node);
|
| +
|
| + void AddRange(CharacterRange range) {
|
| + table()->AddRange(range, choice_index_);
|
| + }
|
| +
|
| + void AddInverse(ZoneList<CharacterRange>* ranges);
|
| +
|
| +#define DECLARE_VISIT(Type) \
|
| + virtual void Visit##Type(Type##Node* that);
|
| +FOR_EACH_NODE_TYPE(DECLARE_VISIT)
|
| +#undef DECLARE_VISIT
|
| +
|
| + DispatchTable* table() { return table_; }
|
| + void set_choice_index(int value) { choice_index_ = value; }
|
| +
|
| + protected:
|
| + DispatchTable *table_;
|
| + int choice_index_;
|
| +};
|
| +
|
| +
|
| +class Analysis: public NodeVisitor {
|
| + public:
|
| + explicit Analysis(bool ignore_case)
|
| + : ignore_case_(ignore_case) { }
|
| + void EnsureAnalyzed(RegExpNode* node);
|
| +
|
| +#define DECLARE_VISIT(Type) \
|
| + virtual void Visit##Type(Type##Node* that);
|
| +FOR_EACH_NODE_TYPE(DECLARE_VISIT)
|
| +#undef DECLARE_VISIT
|
| +
|
| + private:
|
| + bool ignore_case_;
|
| +
|
| + DISALLOW_IMPLICIT_CONSTRUCTORS(Analysis);
|
| +};
|
| +
|
| +
|
| +struct RegExpParseResult {
|
| + RegExpTree* tree;
|
| + bool has_character_escapes;
|
| + Handle<String> error;
|
| + int capture_count;
|
| +};
|
| +
|
| +
|
| +class RegExpEngine: public AllStatic {
|
| + public:
|
| + static Handle<FixedArray> Compile(RegExpParseResult* input,
|
| + RegExpNode** node_return,
|
| + bool ignore_case,
|
| + bool multiline);
|
| + static void DotPrint(const char* label, RegExpNode* node);
|
| +};
|
| +
|
| +
|
| } } // namespace v8::internal
|
|
|
| #endif // V8_JSREGEXP_H_
|
|
|