Chromium Code Reviews| Index: src/jsregexp.h |
| =================================================================== |
| --- src/jsregexp.h (revision 830) |
| +++ src/jsregexp.h (working copy) |
| @@ -30,6 +30,10 @@ |
| namespace v8 { namespace internal { |
| + |
| +class RegExpMacroAssembler; |
| + |
| + |
| class RegExpImpl { |
| public: |
| // Creates a regular expression literal in the old space. |
| @@ -61,10 +65,28 @@ |
| static Handle<Object> ExecGlobal(Handle<JSRegExp> regexp, |
| Handle<String> subject); |
| + // Stores an uncompiled RegExp pattern in the JSRegExp object. |
| + // It will be compiled by JSCRE when first executed. |
| + static Handle<Object> JscrePrepare(Handle<JSRegExp> re, |
| + Handle<String> pattern, |
| + JSRegExp::Flags flags); |
| + |
| + // Stores a compiled RegExp pattern in the JSRegExp object. |
| + // The pattern is compiled by Irregexp. |
| + static Handle<Object> IrregexpPrepare(Handle<JSRegExp> re, |
| + Handle<String> pattern, |
| + JSRegExp::Flags flags, |
| + Handle<FixedArray> irregexp_data); |
| + |
| + |
| + // Compile the pattern using JSCRE and store the result in the |
| + // JSRegExp object. |
| + static Handle<Object> JscreCompile(Handle<JSRegExp> re); |
| + |
| static Handle<Object> AtomCompile(Handle<JSRegExp> re, |
| Handle<String> pattern, |
| - JSRegExp::Flags flags); |
| - |
| + JSRegExp::Flags flags, |
| + Handle<String> match_pattern); |
| static Handle<Object> AtomExec(Handle<JSRegExp> regexp, |
| Handle<String> subject, |
| Handle<Object> index); |
| @@ -72,47 +94,78 @@ |
| static Handle<Object> AtomExecGlobal(Handle<JSRegExp> regexp, |
| Handle<String> subject); |
| - static Handle<Object> JsreCompile(Handle<JSRegExp> re, |
| - Handle<String> pattern, |
| - JSRegExp::Flags flags); |
| + static Handle<Object> JscreCompile(Handle<JSRegExp> re, |
| + Handle<String> pattern, |
| + JSRegExp::Flags flags); |
| - static Handle<Object> JsreExec(Handle<JSRegExp> regexp, |
| - Handle<String> subject, |
| - Handle<Object> index); |
| + // Execute a compiled JSCRE pattern. |
| + static Handle<Object> JscreExec(Handle<JSRegExp> regexp, |
| + Handle<String> subject, |
| + Handle<Object> index); |
| - static Handle<Object> JsreExecGlobal(Handle<JSRegExp> regexp, |
| - Handle<String> subject); |
| + // Execute an Irregexp bytecode pattern. |
| + static Handle<Object> IrregexpExec(Handle<JSRegExp> regexp, |
| + Handle<String> subject, |
| + Handle<Object> index); |
| + static Handle<Object> JscreExecGlobal(Handle<JSRegExp> regexp, |
| + Handle<String> subject); |
| + |
| + static Handle<Object> IrregexpExecGlobal(Handle<JSRegExp> regexp, |
| + Handle<String> subject); |
| + |
| static void NewSpaceCollectionPrologue(); |
| static void OldSpaceCollectionPrologue(); |
| - private: |
| // Converts a source string to a 16 bit flat string. The string |
| // will be either sequential or it will be a SlicedString backed |
| // by a flat string. |
| static Handle<String> StringToTwoByte(Handle<String> pattern); |
| static Handle<String> CachedStringToTwoByte(Handle<String> pattern); |
| + static const int kIrregexpImplementationIndex = 0; |
| + static const int kIrregexpNumberOfCapturesIndex = 1; |
| + static const int kIrregexpNumberOfRegistersIndex = 2; |
| + static const int kIrregexpCodeIndex = 3; |
| + static const int kIrregexpDataLength = 4; |
| + |
| + static const int kJscreNumberOfCapturesIndex = 0; |
| + static const int kJscreInternalIndex = 1; |
| + static const int kJscreDataLength = 2; |
| + |
| + private: |
| static String* last_ascii_string_; |
| static String* two_byte_cached_string_; |
| - // Returns the caputure from the re. |
| - static int JsreCapture(Handle<JSRegExp> re); |
| - static ByteArray* JsreInternal(Handle<JSRegExp> re); |
| + static int JscreNumberOfCaptures(Handle<JSRegExp> re); |
| + static ByteArray* JscreInternal(Handle<JSRegExp> re); |
| + static int IrregexpNumberOfCaptures(Handle<JSRegExp> re); |
| + static int IrregexpNumberOfRegisters(Handle<JSRegExp> re); |
| + static Handle<ByteArray> IrregexpCode(Handle<JSRegExp> re); |
| + |
| // Call jsRegExpExecute once |
| - static Handle<Object> JsreExecOnce(Handle<JSRegExp> regexp, |
| - int num_captures, |
| - Handle<String> subject, |
| - int previous_index, |
| - const uc16* utf8_subject, |
| - int* ovector, |
| - int ovector_length); |
| + static Handle<Object> JscreExecOnce(Handle<JSRegExp> regexp, |
| + int num_captures, |
| + Handle<String> subject, |
| + int previous_index, |
| + const uc16* utf8_subject, |
| + int* ovector, |
| + int ovector_length); |
| + static Handle<Object> IrregexpExecOnce(Handle<JSRegExp> regexp, |
| + int num_captures, |
| + Handle<String> subject16, |
| + int previous_index, |
| + int* ovector, |
| + int ovector_length); |
| + |
| // Set the subject cache. The previous string buffer is not deleted, so the |
| // caller should ensure that it doesn't leak. |
| - static void SetSubjectCache(String* subject, char* utf8_subject, |
| - int uft8_length, int character_position, |
| + static void SetSubjectCache(String* subject, |
| + char* utf8_subject, |
| + int uft8_length, |
| + int character_position, |
| int utf8_position); |
| // A one element cache of the last utf8_subject string and its length. The |
| @@ -125,6 +178,599 @@ |
| }; |
| +class CharacterRange { |
|
iposva
2008/11/26 06:56:22
Please add comments about this class.
|
| + public: |
| + CharacterRange() : from_(0), to_(0) { } |
| + // For compatibility with the CHECK_OK macro |
| + CharacterRange(void* null) { ASSERT_EQ(NULL, null); } //NOLINT |
| + CharacterRange(uc16 from, uc16 to) |
| + : from_(from), |
|
Mads Ager (chromium)
2008/11/25 21:09:41
Four space indent. This migth all fit on one line
Christian Plesner Hansen
2008/11/26 06:49:56
Fixed.
|
| + to_(to) { |
| + } |
| + static void AddClassEscape(uc16 type, ZoneList<CharacterRange>* ranges); |
| + static inline CharacterRange Singleton(uc16 value) { |
| + return CharacterRange(value, value); |
| + } |
| + static inline CharacterRange Range(uc16 from, uc16 to) { |
| + ASSERT(from <= to); |
| + return CharacterRange(from, to); |
| + } |
| + static inline CharacterRange Everything() { |
| + return CharacterRange(0, 0xFFFF); |
| + } |
| + bool Contains(uc16 i) { return from_ <= i && i <= to_; } |
| + uc16 from() const { return from_; } |
| + void set_from(uc16 value) { from_ = value; } |
| + uc16 to() const { return to_; } |
| + void set_to(uc16 value) { to_ = value; } |
| + bool is_valid() { return from_ <= to_; } |
| + bool IsSingleton() { return (from_ == to_); } |
| + void AddCaseEquivalents(ZoneList<CharacterRange>* ranges); |
| + static const int kRangeCanonicalizeMax = 0x200; |
|
iposva
2008/11/26 06:56:22
Declaration order: constants before constructors.
Christian Plesner Hansen
2008/11/26 07:49:51
We've never followed that rule. In fact, as far a
|
| + static const int kStartMarker = (1 << 24); |
| + static const int kPayloadMask = (1 << 24) - 1; |
| + private: |
|
iposva
2008/11/26 06:56:22
Please leave a blank line before "private:" in acc
Christian Plesner Hansen
2008/11/26 07:49:51
Again, that's not a rule we've been consistent abo
|
| + uc16 from_; |
| + uc16 to_; |
| +}; |
| + |
| + |
| +template <typename Node, class Callback> |
| +static void DoForEach(Node* node, Callback* callback); |
| + |
| + |
| +// A zone splay tree. The config type parameter encapsulates the |
| +// different configurations of a concrete splay tree: |
| +// |
| +// typedef Key: the key type |
| +// typedef Value: the value type |
| +// static const kNoKey: the dummy key used when no key is set |
| +// static const kNoValue: the dummy value used to initialize nodes |
| +// int (Compare)(Key& a, Key& b) -> {-1, 0, 1}: comparison function |
| +// |
| +template <typename Config> |
| +class ZoneSplayTree : public ZoneObject { |
| + public: |
| + typedef typename Config::Key Key; |
| + typedef typename Config::Value Value; |
| + |
| + class Locator; |
| + |
| + ZoneSplayTree() : root_(NULL) { } |
| + |
| + // Inserts the given key in this tree with the given value. Returns |
| + // true if a node was inserted, otherwise false. If found the locator |
| + // is enabled and provides access to the mapping for the key. |
| + bool Insert(const Key& key, Locator* locator); |
| + |
| + // Looks up the key in this tree and returns true if it was found, |
| + // otherwise false. If the node is found the locator is enabled and |
| + // provides access to the mapping for the key. |
| + bool Find(const Key& key, Locator* locator); |
| + |
| + // Finds the mapping with the greatest key less than or equal to the |
| + // given key. |
| + bool FindGreatestLessThan(const Key& key, Locator* locator); |
| + |
| + // Find the mapping with the greatest key in this tree. |
| + bool FindGreatest(Locator* locator); |
| + |
| + // Finds the mapping with the least key greater than or equal to the |
| + // given key. |
| + bool FindLeastGreaterThan(const Key& key, Locator* locator); |
| + |
| + // Find the mapping with the least key in this tree. |
| + bool FindLeast(Locator* locator); |
| + |
| + // Remove the node with the given key from the tree. |
| + bool Remove(const Key& key); |
| + |
| + bool is_empty() { return root_ == NULL; } |
| + |
| + // Perform the splay operation for the given key. Moves the node with |
| + // the given key to the top of the tree. If no node has the given |
| + // key, the last node on the search path is moved to the top of the |
| + // tree. |
| + void Splay(const Key& key); |
| + |
| + class Node : public ZoneObject { |
| + public: |
| + Node(const Key& key, const Value& value) |
| + : key_(key), |
|
Mads Ager (chromium)
2008/11/25 21:09:41
Four space indent. Many more occurrences below.
Christian Plesner Hansen
2008/11/26 06:49:56
Fixed.
|
| + value_(value), |
| + left_(NULL), |
| + right_(NULL) { } |
| + Key key() { return key_; } |
|
Mads Ager (chromium)
2008/11/25 21:09:41
Indentation is off for all the accessors.
Christian Plesner Hansen
2008/11/26 06:49:56
Fixed. I wonder why lint didn't catch this?
|
| + Value value() { return value_; } |
| + Node* left() { return left_; } |
| + Node* right() { return right_; } |
| + private: |
| + friend class ZoneSplayTree; |
| + friend class Locator; |
| + Key key_; |
| + Value value_; |
| + Node* left_; |
| + Node* right_; |
| + }; |
| + |
| + // A locator provides access to a node in the tree without actually |
| + // exposing the node. |
| + class Locator { |
| + public: |
| + explicit Locator(Node* node) : node_(node) { } |
| + Locator() : node_(NULL) { } |
| + const Key& key() { return node_->key_; } |
| + Value& value() { return node_->value_; } |
| + void set_value(const Value& value) { node_->value_ = value; } |
| + inline void bind(Node* node) { node_ = node; } |
| + private: |
| + Node* node_; |
| + }; |
| + |
| + template <class Callback> |
| + void ForEach(Callback* c) { |
| + DoForEach<typename ZoneSplayTree<Config>::Node, Callback>(root_, c); |
| + } |
| + |
| + private: |
| + Node* root_; |
| +}; |
| + |
| + |
| +// A set of unsigned integers that behaves especially well on small |
| +// integers (< 32). May do zone-allocation. |
| +class OutSet: public ZoneObject { |
| + public: |
| + OutSet() : first_(0), remaining_(NULL), successors_(NULL) { } |
| + OutSet* Extend(unsigned value); |
| + bool Get(unsigned value); |
| + static const unsigned kFirstLimit = 32; |
| + private: |
|
Mads Ager (chromium)
2008/11/25 21:09:41
Have the empty line before private instead of afte
Christian Plesner Hansen
2008/11/26 06:49:56
Fixed.
|
| + |
| + // Destructively set a value in this set. In most cases you want |
| + // to use Extend instead to ensure that only one instance exists |
| + // that contains the same values. |
| + void Set(unsigned value); |
| + |
| + // The successors are a list of sets that contain the same values |
| + // as this set and the one more value that is not present in this |
| + // set. |
| + ZoneList<OutSet*>* successors() { return successors_; } |
| + |
| + OutSet(uint32_t first, ZoneList<unsigned>* remaining) |
| + : first_(first), remaining_(remaining), successors_(NULL) { } |
| + uint32_t first_; |
| + ZoneList<unsigned>* remaining_; |
| + ZoneList<OutSet*>* successors_; |
| +}; |
| + |
| + |
| +// A mapping from integers, specified as ranges, to a set of integers. |
| +// Used for mapping character ranges to choices. |
| +class DispatchTable { |
| + public: |
| + class Entry { |
| + public: |
| + Entry() |
| + : from_(0), to_(0), out_set_(NULL) { } |
|
Mads Ager (chromium)
2008/11/25 21:09:41
Put this on one line.
Christian Plesner Hansen
2008/11/26 06:49:56
Fixed.
|
| + Entry(uc16 from, uc16 to, OutSet* out_set) |
| + : from_(from), to_(to), out_set_(out_set) { } |
| + uc16 from() { return from_; } |
| + uc16 to() { return to_; } |
| + void set_to(uc16 value) { to_ = value; } |
| + void AddValue(int value) { out_set_ = out_set_->Extend(value); } |
| + OutSet* out_set() { return out_set_; } |
| + private: |
| + uc16 from_; |
| + uc16 to_; |
| + OutSet* out_set_; |
| + }; |
| + |
| + class Config { |
| + public: |
| + typedef uc16 Key; |
| + typedef Entry Value; |
| + static const uc16 kNoKey; |
| + static const Entry kNoValue; |
| + static inline int Compare(uc16 a, uc16 b) { |
| + if (a == b) |
|
Mads Ager (chromium)
2008/11/25 21:09:41
How about:
if (a == b) return 0;
if (a < b) retur
Christian Plesner Hansen
2008/11/26 06:49:56
That's a religious question: should there be an 'e
|
| + return 0; |
| + else if (a < b) |
| + return -1; |
| + else |
| + return 1; |
| + } |
| + }; |
| + |
| + void AddRange(CharacterRange range, int value); |
| + OutSet* Get(uc16 value); |
| + void Dump(); |
| + |
| + template <typename Callback> |
| + void ForEach(Callback* callback) { return tree()->ForEach(callback); } |
| + private: |
| + // There can't be a static empty set since it allocates its |
| + // successors in a zone and caches them. |
| + OutSet* empty() { return &empty_; } |
| + OutSet empty_; |
| + ZoneSplayTree<Config>* tree() { return &tree_; } |
| + ZoneSplayTree<Config> tree_; |
| +}; |
| + |
| + |
| +#define FOR_EACH_NODE_TYPE(VISIT) \ |
| + VISIT(End) \ |
| + VISIT(Action) \ |
| + VISIT(Choice) \ |
| + VISIT(BackReference) \ |
| + VISIT(Text) |
| + |
| + |
| +#define FOR_EACH_REG_EXP_TREE_TYPE(VISIT) \ |
| + VISIT(Disjunction) \ |
| + VISIT(Alternative) \ |
| + VISIT(Assertion) \ |
| + VISIT(CharacterClass) \ |
| + VISIT(Atom) \ |
| + VISIT(Quantifier) \ |
| + VISIT(Capture) \ |
| + VISIT(Lookahead) \ |
| + VISIT(BackReference) \ |
| + VISIT(Empty) \ |
| + VISIT(Text) |
| + |
| + |
| +#define FORWARD_DECLARE(Name) class RegExp##Name; |
| +FOR_EACH_REG_EXP_TREE_TYPE(FORWARD_DECLARE) |
| +#undef FORWARD_DECLARE |
| + |
| + |
| +class TextElement { |
| + public: |
| + enum Type {UNINITIALIZED, ATOM, CHAR_CLASS}; |
| + TextElement() : type(UNINITIALIZED) { } |
| + explicit TextElement(Type t) : type(t) { } |
| + static TextElement Atom(RegExpAtom* atom); |
| + static TextElement CharClass(RegExpCharacterClass* char_class); |
| + Type type; |
| + union { |
| + RegExpAtom* u_atom; |
| + RegExpCharacterClass* u_char_class; |
| + } data; |
| +}; |
| + |
| + |
| +struct NodeInfo { |
| + NodeInfo() |
| + : being_analyzed(false), |
| + been_analyzed(false), |
| + determine_word(false), |
| + determine_newline(false), |
| + determine_start(false), |
| + follows_word_interest(false), |
| + follows_newline_interest(false), |
| + follows_start_interest(false) { } |
| + bool SameInterests(NodeInfo* that) { |
| + return (follows_word_interest == that->follows_word_interest) |
| + && (follows_newline_interest == that->follows_newline_interest) |
| + && (follows_start_interest == that->follows_start_interest); |
| + } |
| + void AdoptInterests(NodeInfo* that) { |
| + follows_word_interest = that->follows_word_interest; |
| + follows_newline_interest = that->follows_newline_interest; |
| + follows_start_interest = that->follows_start_interest; |
| + } |
| + bool prev_determine_word() { |
| + return determine_word || follows_word_interest; |
| + } |
| + bool prev_determine_newline() { |
| + return determine_newline || follows_newline_interest; |
| + } |
| + bool prev_determine_start() { |
| + return determine_start || follows_start_interest; |
| + } |
| + bool being_analyzed: 1; |
| + bool been_analyzed: 1; |
| + bool determine_word: 1; |
| + bool determine_newline: 1; |
| + bool determine_start: 1; |
| + bool follows_word_interest: 1; |
| + bool follows_newline_interest: 1; |
| + bool follows_start_interest: 1; |
| +}; |
| + |
| + |
| +STATIC_CHECK(sizeof(NodeInfo) <= sizeof(int)); // NOLINT |
| + |
| + |
| +class SiblingList { |
| + public: |
| + SiblingList() : list_(NULL) { } |
| + int length() { |
| + return list_ == NULL ? 0 : list_->length(); |
| + } |
| + void Ensure(RegExpNode* parent) { |
| + if (list_ == NULL) { |
| + list_ = new ZoneList<RegExpNode*>(2); |
| + list_->Add(parent); |
| + } |
| + } |
| + void Add(RegExpNode* node) { list_->Add(node); } |
| + RegExpNode* Get(int index) { return list_->at(index); } |
| + private: |
| + ZoneList<RegExpNode*>* list_; |
| +}; |
| + |
| + |
| +class RegExpNode: public ZoneObject { |
| + public: |
| + virtual ~RegExpNode() { } |
| + virtual void Accept(NodeVisitor* visitor) = 0; |
| + // Generates a goto to this node or actually generates the code at this point. |
| + // Until the implementation is complete we will return true for success and |
| + // false for failure. |
| + virtual bool GoTo(RegExpCompiler* compiler); |
| + Label* label(); |
| + |
| + // Until the implementation is complete we will return true for success and |
| + // false for failure. |
| + virtual bool Emit(RegExpCompiler* compiler) = 0; |
| + virtual RegExpNode* PropagateInterest(NodeInfo* info) = 0; |
| + NodeInfo* info() { return &info_; } |
| + virtual bool IsBacktrack() { return false; } |
| + RegExpNode* GetSibling(NodeInfo* info); |
| + void EnsureSiblings() { siblings_.Ensure(this); } |
| + void AddSibling(RegExpNode* node) { siblings_.Add(node); } |
| + protected: |
| + inline void Bind(RegExpMacroAssembler* macro); |
| + private: |
| + Label label_; |
| + NodeInfo info_; |
| + SiblingList siblings_; |
| +}; |
| + |
| + |
| +class SeqRegExpNode: public RegExpNode { |
| + public: |
| + explicit SeqRegExpNode(RegExpNode* on_success) |
| + : on_success_(on_success) { } |
| + RegExpNode* on_success() { return on_success_; } |
| + void set_on_success(RegExpNode* node) { on_success_ = node; } |
| + virtual bool Emit(RegExpCompiler* compiler) { return false; } |
| + private: |
| + RegExpNode* on_success_; |
| +}; |
| + |
| + |
| +class ActionNode: public SeqRegExpNode { |
| + public: |
| + enum Type { |
| + STORE_REGISTER, |
| + INCREMENT_REGISTER, |
| + STORE_POSITION, |
| + SAVE_POSITION, |
| + RESTORE_POSITION, |
| + BEGIN_SUBMATCH, |
| + ESCAPE_SUBMATCH |
| + }; |
| + static ActionNode* StoreRegister(int reg, int val, RegExpNode* on_success); |
| + static ActionNode* IncrementRegister(int reg, RegExpNode* on_success); |
| + static ActionNode* StorePosition(int reg, RegExpNode* on_success); |
| + static ActionNode* SavePosition(int reg, RegExpNode* on_success); |
| + static ActionNode* RestorePosition(int reg, RegExpNode* on_success); |
| + static ActionNode* BeginSubmatch(int reg, RegExpNode* on_success); |
| + static ActionNode* EscapeSubmatch(int reg, RegExpNode* on_success); |
| + virtual void Accept(NodeVisitor* visitor); |
| + virtual bool Emit(RegExpCompiler* compiler); |
| + virtual RegExpNode* PropagateInterest(NodeInfo* info); |
| + private: |
| + union { |
| + struct { |
| + int reg; |
| + int value; |
| + } u_store_register; |
| + struct { |
| + int reg; |
| + } u_increment_register; |
| + struct { |
| + int reg; |
| + } u_position_register; |
| + struct { |
| + int reg; |
| + } u_submatch_stack_pointer_register; |
| + } data_; |
| + ActionNode(Type type, RegExpNode* on_success) |
| + : SeqRegExpNode(on_success), |
| + type_(type) { } |
| + Type type_; |
| + friend class DotPrinter; |
| +}; |
| + |
| + |
| +class TextNode: public SeqRegExpNode { |
| + public: |
| + TextNode(ZoneList<TextElement>* elms, |
| + RegExpNode* on_success, |
| + RegExpNode* on_failure) |
| + : SeqRegExpNode(on_success), |
| + on_failure_(on_failure), |
| + elms_(elms) { } |
| + virtual void Accept(NodeVisitor* visitor); |
| + virtual RegExpNode* PropagateInterest(NodeInfo* info); |
| + RegExpNode* on_failure() { return on_failure_; } |
| + virtual bool Emit(RegExpCompiler* compiler); |
| + ZoneList<TextElement>* elements() { return elms_; } |
| + private: |
| + RegExpNode* on_failure_; |
| + ZoneList<TextElement>* elms_; |
| +}; |
| + |
| + |
| +class BackReferenceNode: public SeqRegExpNode { |
| + public: |
| + BackReferenceNode(int start_reg, |
| + int end_reg, |
| + RegExpNode* on_success, |
| + RegExpNode* on_failure) |
| + : SeqRegExpNode(on_success), |
| + on_failure_(on_failure), |
| + start_reg_(start_reg), |
| + end_reg_(end_reg) { } |
| + virtual void Accept(NodeVisitor* visitor); |
| + RegExpNode* on_failure() { return on_failure_; } |
| + int start_register() { return start_reg_; } |
| + int end_register() { return end_reg_; } |
| + virtual bool Emit(RegExpCompiler* compiler); |
| + virtual RegExpNode* PropagateInterest(NodeInfo* info); |
| + private: |
| + RegExpNode* on_failure_; |
| + int start_reg_; |
| + int end_reg_; |
| +}; |
| + |
| + |
| +class EndNode: public RegExpNode { |
| + public: |
| + enum Action { ACCEPT, BACKTRACK }; |
| + explicit EndNode(Action action) : action_(action) { } |
| + virtual void Accept(NodeVisitor* visitor); |
| + virtual bool Emit(RegExpCompiler* compiler); |
| + virtual RegExpNode* PropagateInterest(NodeInfo* info); |
| + virtual bool IsBacktrack() { return action_ == BACKTRACK; } |
| + virtual bool GoTo(RegExpCompiler* compiler); |
| + private: |
| + Action action_; |
| +}; |
| + |
| + |
| +class Guard: public ZoneObject { |
| + public: |
| + enum Relation { LT, GEQ }; |
| + Guard(int reg, Relation op, int value) |
| + : reg_(reg), |
| + op_(op), |
| + value_(value) { } |
| + int reg() { return reg_; } |
| + Relation op() { return op_; } |
| + int value() { return value_; } |
| + private: |
| + int reg_; |
| + Relation op_; |
| + int value_; |
| +}; |
| + |
| + |
| +class GuardedAlternative { |
| + public: |
| + explicit GuardedAlternative(RegExpNode* node) : node_(node), guards_(NULL) { } |
| + void AddGuard(Guard* guard); |
| + RegExpNode* node() { return node_; } |
| + void set_node(RegExpNode* node) { node_ = node; } |
| + ZoneList<Guard*>* guards() { return guards_; } |
| + private: |
| + RegExpNode* node_; |
| + ZoneList<Guard*>* guards_; |
| +}; |
| + |
| + |
| +class ChoiceNode: public RegExpNode { |
| + public: |
| + explicit ChoiceNode(int expected_size, RegExpNode* on_failure) |
| + : on_failure_(on_failure), |
| + alternatives_(new ZoneList<GuardedAlternative>(expected_size)), |
| + table_calculated_(false), |
| + being_calculated_(false) { } |
| + virtual void Accept(NodeVisitor* visitor); |
| + void AddAlternative(GuardedAlternative node) { alternatives()->Add(node); } |
| + ZoneList<GuardedAlternative>* alternatives() { return alternatives_; } |
| + DispatchTable* table() { return &table_; } |
| + RegExpNode* on_failure() { return on_failure_; } |
| + virtual bool Emit(RegExpCompiler* compiler); |
| + virtual RegExpNode* PropagateInterest(NodeInfo* info); |
| + bool table_calculated() { return table_calculated_; } |
| + void set_table_calculated(bool b) { table_calculated_ = b; } |
| + bool being_calculated() { return being_calculated_; } |
| + void set_being_calculated(bool b) { being_calculated_ = b; } |
| + private: |
| + void GenerateGuard(RegExpMacroAssembler* macro_assembler, |
| + Guard *guard, |
|
Erik Corry
2008/11/25 11:03:52
Misplaced asterisk.
Mads Ager (chromium)
2008/11/25 21:09:41
This one is still there.
|
| + Label* on_failure); |
| + RegExpNode* on_failure_; |
| + ZoneList<GuardedAlternative>* alternatives_; |
| + DispatchTable table_; |
| + bool table_calculated_; |
| + bool being_calculated_; |
| +}; |
| + |
| + |
| +class NodeVisitor { |
| + public: |
| + virtual ~NodeVisitor() { } |
| +#define DECLARE_VISIT(Type) \ |
| + virtual void Visit##Type(Type##Node* that) = 0; |
| +FOR_EACH_NODE_TYPE(DECLARE_VISIT) |
| +#undef DECLARE_VISIT |
| +}; |
| + |
| + |
| +// Node visitor used to add the start set of the alternatives to the |
| +// dispatch table of a choice node. |
| +class DispatchTableConstructor: public NodeVisitor { |
| + public: |
| + explicit DispatchTableConstructor(DispatchTable* table) |
| + : table_(table), |
| + choice_index_(-1) { } |
| + |
| + void BuildTable(ChoiceNode* node); |
| + |
| + void AddRange(CharacterRange range) { |
| + table()->AddRange(range, choice_index_); |
| + } |
| + |
| + void AddInverse(ZoneList<CharacterRange>* ranges); |
| + |
| +#define DECLARE_VISIT(Type) \ |
| + virtual void Visit##Type(Type##Node* that); |
| +FOR_EACH_NODE_TYPE(DECLARE_VISIT) |
| +#undef DECLARE_VISIT |
| + |
| + DispatchTable* table() { return table_; } |
| + void set_choice_index(int value) { choice_index_ = value; } |
| + |
| + protected: |
| + DispatchTable *table_; |
|
Erik Corry
2008/11/25 11:03:52
Misplaced asterisk.
Mads Ager (chromium)
2008/11/25 21:09:41
This is still there.
|
| + int choice_index_; |
| +}; |
| + |
| + |
| +class Analysis: public NodeVisitor { |
| + public: |
| + void EnsureAnalyzed(RegExpNode* node); |
| + |
| +#define DECLARE_VISIT(Type) \ |
| + virtual void Visit##Type(Type##Node* that); |
| +FOR_EACH_NODE_TYPE(DECLARE_VISIT) |
| +#undef DECLARE_VISIT |
| +}; |
| + |
| + |
| +struct RegExpParseResult { |
| + RegExpTree* tree; |
| + bool has_character_escapes; |
| + Handle<String> error; |
| + int capture_count; |
| +}; |
| + |
| + |
| +class RegExpEngine: public AllStatic { |
| + public: |
| + static Handle<FixedArray> Compile(RegExpParseResult* input, |
| + RegExpNode** node_return, |
| + bool ignore_case); |
| + static void DotPrint(const char* label, RegExpNode* node); |
| +}; |
| + |
| + |
| } } // namespace v8::internal |
| #endif // V8_JSREGEXP_H_ |