Index: src/jsregexp.h |
=================================================================== |
--- src/jsregexp.h (revision 830) |
+++ src/jsregexp.h (working copy) |
@@ -30,6 +30,10 @@ |
namespace v8 { namespace internal { |
+ |
+class RegExpMacroAssembler; |
+ |
+ |
class RegExpImpl { |
public: |
// Creates a regular expression literal in the old space. |
@@ -61,10 +65,28 @@ |
static Handle<Object> ExecGlobal(Handle<JSRegExp> regexp, |
Handle<String> subject); |
+ // Stores an uncompiled RegExp pattern in the JSRegExp object. |
+ // It will be compiled by JSCRE when first executed. |
+ static Handle<Object> JscrePrepare(Handle<JSRegExp> re, |
+ Handle<String> pattern, |
+ JSRegExp::Flags flags); |
+ |
+ // Stores a compiled RegExp pattern in the JSRegExp object. |
+ // The pattern is compiled by Irregexp. |
+ static Handle<Object> IrregexpPrepare(Handle<JSRegExp> re, |
+ Handle<String> pattern, |
+ JSRegExp::Flags flags, |
+ Handle<FixedArray> irregexp_data); |
+ |
+ |
+ // Compile the pattern using JSCRE and store the result in the |
+ // JSRegExp object. |
+ static Handle<Object> JscreCompile(Handle<JSRegExp> re); |
+ |
static Handle<Object> AtomCompile(Handle<JSRegExp> re, |
Handle<String> pattern, |
- JSRegExp::Flags flags); |
- |
+ JSRegExp::Flags flags, |
+ Handle<String> match_pattern); |
static Handle<Object> AtomExec(Handle<JSRegExp> regexp, |
Handle<String> subject, |
Handle<Object> index); |
@@ -72,47 +94,78 @@ |
static Handle<Object> AtomExecGlobal(Handle<JSRegExp> regexp, |
Handle<String> subject); |
- static Handle<Object> JsreCompile(Handle<JSRegExp> re, |
- Handle<String> pattern, |
- JSRegExp::Flags flags); |
+ static Handle<Object> JscreCompile(Handle<JSRegExp> re, |
+ Handle<String> pattern, |
+ JSRegExp::Flags flags); |
- static Handle<Object> JsreExec(Handle<JSRegExp> regexp, |
- Handle<String> subject, |
- Handle<Object> index); |
+ // Execute a compiled JSCRE pattern. |
+ static Handle<Object> JscreExec(Handle<JSRegExp> regexp, |
+ Handle<String> subject, |
+ Handle<Object> index); |
- static Handle<Object> JsreExecGlobal(Handle<JSRegExp> regexp, |
- Handle<String> subject); |
+ // Execute an Irregexp bytecode pattern. |
+ static Handle<Object> IrregexpExec(Handle<JSRegExp> regexp, |
+ Handle<String> subject, |
+ Handle<Object> index); |
+ static Handle<Object> JscreExecGlobal(Handle<JSRegExp> regexp, |
+ Handle<String> subject); |
+ |
+ static Handle<Object> IrregexpExecGlobal(Handle<JSRegExp> regexp, |
+ Handle<String> subject); |
+ |
static void NewSpaceCollectionPrologue(); |
static void OldSpaceCollectionPrologue(); |
- private: |
// Converts a source string to a 16 bit flat string. The string |
// will be either sequential or it will be a SlicedString backed |
// by a flat string. |
static Handle<String> StringToTwoByte(Handle<String> pattern); |
static Handle<String> CachedStringToTwoByte(Handle<String> pattern); |
+ static const int kIrregexpImplementationIndex = 0; |
+ static const int kIrregexpNumberOfCapturesIndex = 1; |
+ static const int kIrregexpNumberOfRegistersIndex = 2; |
+ static const int kIrregexpCodeIndex = 3; |
+ static const int kIrregexpDataLength = 4; |
+ |
+ static const int kJscreNumberOfCapturesIndex = 0; |
+ static const int kJscreInternalIndex = 1; |
+ static const int kJscreDataLength = 2; |
+ |
+ private: |
static String* last_ascii_string_; |
static String* two_byte_cached_string_; |
- // Returns the caputure from the re. |
- static int JsreCapture(Handle<JSRegExp> re); |
- static ByteArray* JsreInternal(Handle<JSRegExp> re); |
+ static int JscreNumberOfCaptures(Handle<JSRegExp> re); |
+ static ByteArray* JscreInternal(Handle<JSRegExp> re); |
+ static int IrregexpNumberOfCaptures(Handle<JSRegExp> re); |
+ static int IrregexpNumberOfRegisters(Handle<JSRegExp> re); |
+ static Handle<ByteArray> IrregexpCode(Handle<JSRegExp> re); |
+ |
// Call jsRegExpExecute once |
- static Handle<Object> JsreExecOnce(Handle<JSRegExp> regexp, |
- int num_captures, |
- Handle<String> subject, |
- int previous_index, |
- const uc16* utf8_subject, |
- int* ovector, |
- int ovector_length); |
+ static Handle<Object> JscreExecOnce(Handle<JSRegExp> regexp, |
+ int num_captures, |
+ Handle<String> subject, |
+ int previous_index, |
+ const uc16* utf8_subject, |
+ int* ovector, |
+ int ovector_length); |
+ static Handle<Object> IrregexpExecOnce(Handle<JSRegExp> regexp, |
+ int num_captures, |
+ Handle<String> subject16, |
+ int previous_index, |
+ int* ovector, |
+ int ovector_length); |
+ |
// Set the subject cache. The previous string buffer is not deleted, so the |
// caller should ensure that it doesn't leak. |
- static void SetSubjectCache(String* subject, char* utf8_subject, |
- int uft8_length, int character_position, |
+ static void SetSubjectCache(String* subject, |
+ char* utf8_subject, |
+ int uft8_length, |
+ int character_position, |
int utf8_position); |
// A one element cache of the last utf8_subject string and its length. The |
@@ -125,6 +178,599 @@ |
}; |
+class CharacterRange { |
iposva
2008/11/26 06:56:22
Please add comments about this class.
|
+ public: |
+ CharacterRange() : from_(0), to_(0) { } |
+ // For compatibility with the CHECK_OK macro |
+ CharacterRange(void* null) { ASSERT_EQ(NULL, null); } //NOLINT |
+ CharacterRange(uc16 from, uc16 to) |
+ : from_(from), |
Mads Ager (chromium)
2008/11/25 21:09:41
Four space indent. This migth all fit on one line
Christian Plesner Hansen
2008/11/26 06:49:56
Fixed.
|
+ to_(to) { |
+ } |
+ static void AddClassEscape(uc16 type, ZoneList<CharacterRange>* ranges); |
+ static inline CharacterRange Singleton(uc16 value) { |
+ return CharacterRange(value, value); |
+ } |
+ static inline CharacterRange Range(uc16 from, uc16 to) { |
+ ASSERT(from <= to); |
+ return CharacterRange(from, to); |
+ } |
+ static inline CharacterRange Everything() { |
+ return CharacterRange(0, 0xFFFF); |
+ } |
+ bool Contains(uc16 i) { return from_ <= i && i <= to_; } |
+ uc16 from() const { return from_; } |
+ void set_from(uc16 value) { from_ = value; } |
+ uc16 to() const { return to_; } |
+ void set_to(uc16 value) { to_ = value; } |
+ bool is_valid() { return from_ <= to_; } |
+ bool IsSingleton() { return (from_ == to_); } |
+ void AddCaseEquivalents(ZoneList<CharacterRange>* ranges); |
+ static const int kRangeCanonicalizeMax = 0x200; |
iposva
2008/11/26 06:56:22
Declaration order: constants before constructors.
Christian Plesner Hansen
2008/11/26 07:49:51
We've never followed that rule. In fact, as far a
|
+ static const int kStartMarker = (1 << 24); |
+ static const int kPayloadMask = (1 << 24) - 1; |
+ private: |
iposva
2008/11/26 06:56:22
Please leave a blank line before "private:" in acc
Christian Plesner Hansen
2008/11/26 07:49:51
Again, that's not a rule we've been consistent abo
|
+ uc16 from_; |
+ uc16 to_; |
+}; |
+ |
+ |
+template <typename Node, class Callback> |
+static void DoForEach(Node* node, Callback* callback); |
+ |
+ |
+// A zone splay tree. The config type parameter encapsulates the |
+// different configurations of a concrete splay tree: |
+// |
+// typedef Key: the key type |
+// typedef Value: the value type |
+// static const kNoKey: the dummy key used when no key is set |
+// static const kNoValue: the dummy value used to initialize nodes |
+// int (Compare)(Key& a, Key& b) -> {-1, 0, 1}: comparison function |
+// |
+template <typename Config> |
+class ZoneSplayTree : public ZoneObject { |
+ public: |
+ typedef typename Config::Key Key; |
+ typedef typename Config::Value Value; |
+ |
+ class Locator; |
+ |
+ ZoneSplayTree() : root_(NULL) { } |
+ |
+ // Inserts the given key in this tree with the given value. Returns |
+ // true if a node was inserted, otherwise false. If found the locator |
+ // is enabled and provides access to the mapping for the key. |
+ bool Insert(const Key& key, Locator* locator); |
+ |
+ // Looks up the key in this tree and returns true if it was found, |
+ // otherwise false. If the node is found the locator is enabled and |
+ // provides access to the mapping for the key. |
+ bool Find(const Key& key, Locator* locator); |
+ |
+ // Finds the mapping with the greatest key less than or equal to the |
+ // given key. |
+ bool FindGreatestLessThan(const Key& key, Locator* locator); |
+ |
+ // Find the mapping with the greatest key in this tree. |
+ bool FindGreatest(Locator* locator); |
+ |
+ // Finds the mapping with the least key greater than or equal to the |
+ // given key. |
+ bool FindLeastGreaterThan(const Key& key, Locator* locator); |
+ |
+ // Find the mapping with the least key in this tree. |
+ bool FindLeast(Locator* locator); |
+ |
+ // Remove the node with the given key from the tree. |
+ bool Remove(const Key& key); |
+ |
+ bool is_empty() { return root_ == NULL; } |
+ |
+ // Perform the splay operation for the given key. Moves the node with |
+ // the given key to the top of the tree. If no node has the given |
+ // key, the last node on the search path is moved to the top of the |
+ // tree. |
+ void Splay(const Key& key); |
+ |
+ class Node : public ZoneObject { |
+ public: |
+ Node(const Key& key, const Value& value) |
+ : key_(key), |
Mads Ager (chromium)
2008/11/25 21:09:41
Four space indent. Many more occurrences below.
Christian Plesner Hansen
2008/11/26 06:49:56
Fixed.
|
+ value_(value), |
+ left_(NULL), |
+ right_(NULL) { } |
+ Key key() { return key_; } |
Mads Ager (chromium)
2008/11/25 21:09:41
Indentation is off for all the accessors.
Christian Plesner Hansen
2008/11/26 06:49:56
Fixed. I wonder why lint didn't catch this?
|
+ Value value() { return value_; } |
+ Node* left() { return left_; } |
+ Node* right() { return right_; } |
+ private: |
+ friend class ZoneSplayTree; |
+ friend class Locator; |
+ Key key_; |
+ Value value_; |
+ Node* left_; |
+ Node* right_; |
+ }; |
+ |
+ // A locator provides access to a node in the tree without actually |
+ // exposing the node. |
+ class Locator { |
+ public: |
+ explicit Locator(Node* node) : node_(node) { } |
+ Locator() : node_(NULL) { } |
+ const Key& key() { return node_->key_; } |
+ Value& value() { return node_->value_; } |
+ void set_value(const Value& value) { node_->value_ = value; } |
+ inline void bind(Node* node) { node_ = node; } |
+ private: |
+ Node* node_; |
+ }; |
+ |
+ template <class Callback> |
+ void ForEach(Callback* c) { |
+ DoForEach<typename ZoneSplayTree<Config>::Node, Callback>(root_, c); |
+ } |
+ |
+ private: |
+ Node* root_; |
+}; |
+ |
+ |
+// A set of unsigned integers that behaves especially well on small |
+// integers (< 32). May do zone-allocation. |
+class OutSet: public ZoneObject { |
+ public: |
+ OutSet() : first_(0), remaining_(NULL), successors_(NULL) { } |
+ OutSet* Extend(unsigned value); |
+ bool Get(unsigned value); |
+ static const unsigned kFirstLimit = 32; |
+ private: |
Mads Ager (chromium)
2008/11/25 21:09:41
Have the empty line before private instead of afte
Christian Plesner Hansen
2008/11/26 06:49:56
Fixed.
|
+ |
+ // Destructively set a value in this set. In most cases you want |
+ // to use Extend instead to ensure that only one instance exists |
+ // that contains the same values. |
+ void Set(unsigned value); |
+ |
+ // The successors are a list of sets that contain the same values |
+ // as this set and the one more value that is not present in this |
+ // set. |
+ ZoneList<OutSet*>* successors() { return successors_; } |
+ |
+ OutSet(uint32_t first, ZoneList<unsigned>* remaining) |
+ : first_(first), remaining_(remaining), successors_(NULL) { } |
+ uint32_t first_; |
+ ZoneList<unsigned>* remaining_; |
+ ZoneList<OutSet*>* successors_; |
+}; |
+ |
+ |
+// A mapping from integers, specified as ranges, to a set of integers. |
+// Used for mapping character ranges to choices. |
+class DispatchTable { |
+ public: |
+ class Entry { |
+ public: |
+ Entry() |
+ : from_(0), to_(0), out_set_(NULL) { } |
Mads Ager (chromium)
2008/11/25 21:09:41
Put this on one line.
Christian Plesner Hansen
2008/11/26 06:49:56
Fixed.
|
+ Entry(uc16 from, uc16 to, OutSet* out_set) |
+ : from_(from), to_(to), out_set_(out_set) { } |
+ uc16 from() { return from_; } |
+ uc16 to() { return to_; } |
+ void set_to(uc16 value) { to_ = value; } |
+ void AddValue(int value) { out_set_ = out_set_->Extend(value); } |
+ OutSet* out_set() { return out_set_; } |
+ private: |
+ uc16 from_; |
+ uc16 to_; |
+ OutSet* out_set_; |
+ }; |
+ |
+ class Config { |
+ public: |
+ typedef uc16 Key; |
+ typedef Entry Value; |
+ static const uc16 kNoKey; |
+ static const Entry kNoValue; |
+ static inline int Compare(uc16 a, uc16 b) { |
+ if (a == b) |
Mads Ager (chromium)
2008/11/25 21:09:41
How about:
if (a == b) return 0;
if (a < b) retur
Christian Plesner Hansen
2008/11/26 06:49:56
That's a religious question: should there be an 'e
|
+ return 0; |
+ else if (a < b) |
+ return -1; |
+ else |
+ return 1; |
+ } |
+ }; |
+ |
+ void AddRange(CharacterRange range, int value); |
+ OutSet* Get(uc16 value); |
+ void Dump(); |
+ |
+ template <typename Callback> |
+ void ForEach(Callback* callback) { return tree()->ForEach(callback); } |
+ private: |
+ // There can't be a static empty set since it allocates its |
+ // successors in a zone and caches them. |
+ OutSet* empty() { return &empty_; } |
+ OutSet empty_; |
+ ZoneSplayTree<Config>* tree() { return &tree_; } |
+ ZoneSplayTree<Config> tree_; |
+}; |
+ |
+ |
+#define FOR_EACH_NODE_TYPE(VISIT) \ |
+ VISIT(End) \ |
+ VISIT(Action) \ |
+ VISIT(Choice) \ |
+ VISIT(BackReference) \ |
+ VISIT(Text) |
+ |
+ |
+#define FOR_EACH_REG_EXP_TREE_TYPE(VISIT) \ |
+ VISIT(Disjunction) \ |
+ VISIT(Alternative) \ |
+ VISIT(Assertion) \ |
+ VISIT(CharacterClass) \ |
+ VISIT(Atom) \ |
+ VISIT(Quantifier) \ |
+ VISIT(Capture) \ |
+ VISIT(Lookahead) \ |
+ VISIT(BackReference) \ |
+ VISIT(Empty) \ |
+ VISIT(Text) |
+ |
+ |
+#define FORWARD_DECLARE(Name) class RegExp##Name; |
+FOR_EACH_REG_EXP_TREE_TYPE(FORWARD_DECLARE) |
+#undef FORWARD_DECLARE |
+ |
+ |
+class TextElement { |
+ public: |
+ enum Type {UNINITIALIZED, ATOM, CHAR_CLASS}; |
+ TextElement() : type(UNINITIALIZED) { } |
+ explicit TextElement(Type t) : type(t) { } |
+ static TextElement Atom(RegExpAtom* atom); |
+ static TextElement CharClass(RegExpCharacterClass* char_class); |
+ Type type; |
+ union { |
+ RegExpAtom* u_atom; |
+ RegExpCharacterClass* u_char_class; |
+ } data; |
+}; |
+ |
+ |
+struct NodeInfo { |
+ NodeInfo() |
+ : being_analyzed(false), |
+ been_analyzed(false), |
+ determine_word(false), |
+ determine_newline(false), |
+ determine_start(false), |
+ follows_word_interest(false), |
+ follows_newline_interest(false), |
+ follows_start_interest(false) { } |
+ bool SameInterests(NodeInfo* that) { |
+ return (follows_word_interest == that->follows_word_interest) |
+ && (follows_newline_interest == that->follows_newline_interest) |
+ && (follows_start_interest == that->follows_start_interest); |
+ } |
+ void AdoptInterests(NodeInfo* that) { |
+ follows_word_interest = that->follows_word_interest; |
+ follows_newline_interest = that->follows_newline_interest; |
+ follows_start_interest = that->follows_start_interest; |
+ } |
+ bool prev_determine_word() { |
+ return determine_word || follows_word_interest; |
+ } |
+ bool prev_determine_newline() { |
+ return determine_newline || follows_newline_interest; |
+ } |
+ bool prev_determine_start() { |
+ return determine_start || follows_start_interest; |
+ } |
+ bool being_analyzed: 1; |
+ bool been_analyzed: 1; |
+ bool determine_word: 1; |
+ bool determine_newline: 1; |
+ bool determine_start: 1; |
+ bool follows_word_interest: 1; |
+ bool follows_newline_interest: 1; |
+ bool follows_start_interest: 1; |
+}; |
+ |
+ |
+STATIC_CHECK(sizeof(NodeInfo) <= sizeof(int)); // NOLINT |
+ |
+ |
+class SiblingList { |
+ public: |
+ SiblingList() : list_(NULL) { } |
+ int length() { |
+ return list_ == NULL ? 0 : list_->length(); |
+ } |
+ void Ensure(RegExpNode* parent) { |
+ if (list_ == NULL) { |
+ list_ = new ZoneList<RegExpNode*>(2); |
+ list_->Add(parent); |
+ } |
+ } |
+ void Add(RegExpNode* node) { list_->Add(node); } |
+ RegExpNode* Get(int index) { return list_->at(index); } |
+ private: |
+ ZoneList<RegExpNode*>* list_; |
+}; |
+ |
+ |
+class RegExpNode: public ZoneObject { |
+ public: |
+ virtual ~RegExpNode() { } |
+ virtual void Accept(NodeVisitor* visitor) = 0; |
+ // Generates a goto to this node or actually generates the code at this point. |
+ // Until the implementation is complete we will return true for success and |
+ // false for failure. |
+ virtual bool GoTo(RegExpCompiler* compiler); |
+ Label* label(); |
+ |
+ // Until the implementation is complete we will return true for success and |
+ // false for failure. |
+ virtual bool Emit(RegExpCompiler* compiler) = 0; |
+ virtual RegExpNode* PropagateInterest(NodeInfo* info) = 0; |
+ NodeInfo* info() { return &info_; } |
+ virtual bool IsBacktrack() { return false; } |
+ RegExpNode* GetSibling(NodeInfo* info); |
+ void EnsureSiblings() { siblings_.Ensure(this); } |
+ void AddSibling(RegExpNode* node) { siblings_.Add(node); } |
+ protected: |
+ inline void Bind(RegExpMacroAssembler* macro); |
+ private: |
+ Label label_; |
+ NodeInfo info_; |
+ SiblingList siblings_; |
+}; |
+ |
+ |
+class SeqRegExpNode: public RegExpNode { |
+ public: |
+ explicit SeqRegExpNode(RegExpNode* on_success) |
+ : on_success_(on_success) { } |
+ RegExpNode* on_success() { return on_success_; } |
+ void set_on_success(RegExpNode* node) { on_success_ = node; } |
+ virtual bool Emit(RegExpCompiler* compiler) { return false; } |
+ private: |
+ RegExpNode* on_success_; |
+}; |
+ |
+ |
+class ActionNode: public SeqRegExpNode { |
+ public: |
+ enum Type { |
+ STORE_REGISTER, |
+ INCREMENT_REGISTER, |
+ STORE_POSITION, |
+ SAVE_POSITION, |
+ RESTORE_POSITION, |
+ BEGIN_SUBMATCH, |
+ ESCAPE_SUBMATCH |
+ }; |
+ static ActionNode* StoreRegister(int reg, int val, RegExpNode* on_success); |
+ static ActionNode* IncrementRegister(int reg, RegExpNode* on_success); |
+ static ActionNode* StorePosition(int reg, RegExpNode* on_success); |
+ static ActionNode* SavePosition(int reg, RegExpNode* on_success); |
+ static ActionNode* RestorePosition(int reg, RegExpNode* on_success); |
+ static ActionNode* BeginSubmatch(int reg, RegExpNode* on_success); |
+ static ActionNode* EscapeSubmatch(int reg, RegExpNode* on_success); |
+ virtual void Accept(NodeVisitor* visitor); |
+ virtual bool Emit(RegExpCompiler* compiler); |
+ virtual RegExpNode* PropagateInterest(NodeInfo* info); |
+ private: |
+ union { |
+ struct { |
+ int reg; |
+ int value; |
+ } u_store_register; |
+ struct { |
+ int reg; |
+ } u_increment_register; |
+ struct { |
+ int reg; |
+ } u_position_register; |
+ struct { |
+ int reg; |
+ } u_submatch_stack_pointer_register; |
+ } data_; |
+ ActionNode(Type type, RegExpNode* on_success) |
+ : SeqRegExpNode(on_success), |
+ type_(type) { } |
+ Type type_; |
+ friend class DotPrinter; |
+}; |
+ |
+ |
+class TextNode: public SeqRegExpNode { |
+ public: |
+ TextNode(ZoneList<TextElement>* elms, |
+ RegExpNode* on_success, |
+ RegExpNode* on_failure) |
+ : SeqRegExpNode(on_success), |
+ on_failure_(on_failure), |
+ elms_(elms) { } |
+ virtual void Accept(NodeVisitor* visitor); |
+ virtual RegExpNode* PropagateInterest(NodeInfo* info); |
+ RegExpNode* on_failure() { return on_failure_; } |
+ virtual bool Emit(RegExpCompiler* compiler); |
+ ZoneList<TextElement>* elements() { return elms_; } |
+ private: |
+ RegExpNode* on_failure_; |
+ ZoneList<TextElement>* elms_; |
+}; |
+ |
+ |
+class BackReferenceNode: public SeqRegExpNode { |
+ public: |
+ BackReferenceNode(int start_reg, |
+ int end_reg, |
+ RegExpNode* on_success, |
+ RegExpNode* on_failure) |
+ : SeqRegExpNode(on_success), |
+ on_failure_(on_failure), |
+ start_reg_(start_reg), |
+ end_reg_(end_reg) { } |
+ virtual void Accept(NodeVisitor* visitor); |
+ RegExpNode* on_failure() { return on_failure_; } |
+ int start_register() { return start_reg_; } |
+ int end_register() { return end_reg_; } |
+ virtual bool Emit(RegExpCompiler* compiler); |
+ virtual RegExpNode* PropagateInterest(NodeInfo* info); |
+ private: |
+ RegExpNode* on_failure_; |
+ int start_reg_; |
+ int end_reg_; |
+}; |
+ |
+ |
+class EndNode: public RegExpNode { |
+ public: |
+ enum Action { ACCEPT, BACKTRACK }; |
+ explicit EndNode(Action action) : action_(action) { } |
+ virtual void Accept(NodeVisitor* visitor); |
+ virtual bool Emit(RegExpCompiler* compiler); |
+ virtual RegExpNode* PropagateInterest(NodeInfo* info); |
+ virtual bool IsBacktrack() { return action_ == BACKTRACK; } |
+ virtual bool GoTo(RegExpCompiler* compiler); |
+ private: |
+ Action action_; |
+}; |
+ |
+ |
+class Guard: public ZoneObject { |
+ public: |
+ enum Relation { LT, GEQ }; |
+ Guard(int reg, Relation op, int value) |
+ : reg_(reg), |
+ op_(op), |
+ value_(value) { } |
+ int reg() { return reg_; } |
+ Relation op() { return op_; } |
+ int value() { return value_; } |
+ private: |
+ int reg_; |
+ Relation op_; |
+ int value_; |
+}; |
+ |
+ |
+class GuardedAlternative { |
+ public: |
+ explicit GuardedAlternative(RegExpNode* node) : node_(node), guards_(NULL) { } |
+ void AddGuard(Guard* guard); |
+ RegExpNode* node() { return node_; } |
+ void set_node(RegExpNode* node) { node_ = node; } |
+ ZoneList<Guard*>* guards() { return guards_; } |
+ private: |
+ RegExpNode* node_; |
+ ZoneList<Guard*>* guards_; |
+}; |
+ |
+ |
+class ChoiceNode: public RegExpNode { |
+ public: |
+ explicit ChoiceNode(int expected_size, RegExpNode* on_failure) |
+ : on_failure_(on_failure), |
+ alternatives_(new ZoneList<GuardedAlternative>(expected_size)), |
+ table_calculated_(false), |
+ being_calculated_(false) { } |
+ virtual void Accept(NodeVisitor* visitor); |
+ void AddAlternative(GuardedAlternative node) { alternatives()->Add(node); } |
+ ZoneList<GuardedAlternative>* alternatives() { return alternatives_; } |
+ DispatchTable* table() { return &table_; } |
+ RegExpNode* on_failure() { return on_failure_; } |
+ virtual bool Emit(RegExpCompiler* compiler); |
+ virtual RegExpNode* PropagateInterest(NodeInfo* info); |
+ bool table_calculated() { return table_calculated_; } |
+ void set_table_calculated(bool b) { table_calculated_ = b; } |
+ bool being_calculated() { return being_calculated_; } |
+ void set_being_calculated(bool b) { being_calculated_ = b; } |
+ private: |
+ void GenerateGuard(RegExpMacroAssembler* macro_assembler, |
+ Guard *guard, |
Erik Corry
2008/11/25 11:03:52
Misplaced asterisk.
Mads Ager (chromium)
2008/11/25 21:09:41
This one is still there.
|
+ Label* on_failure); |
+ RegExpNode* on_failure_; |
+ ZoneList<GuardedAlternative>* alternatives_; |
+ DispatchTable table_; |
+ bool table_calculated_; |
+ bool being_calculated_; |
+}; |
+ |
+ |
+class NodeVisitor { |
+ public: |
+ virtual ~NodeVisitor() { } |
+#define DECLARE_VISIT(Type) \ |
+ virtual void Visit##Type(Type##Node* that) = 0; |
+FOR_EACH_NODE_TYPE(DECLARE_VISIT) |
+#undef DECLARE_VISIT |
+}; |
+ |
+ |
+// Node visitor used to add the start set of the alternatives to the |
+// dispatch table of a choice node. |
+class DispatchTableConstructor: public NodeVisitor { |
+ public: |
+ explicit DispatchTableConstructor(DispatchTable* table) |
+ : table_(table), |
+ choice_index_(-1) { } |
+ |
+ void BuildTable(ChoiceNode* node); |
+ |
+ void AddRange(CharacterRange range) { |
+ table()->AddRange(range, choice_index_); |
+ } |
+ |
+ void AddInverse(ZoneList<CharacterRange>* ranges); |
+ |
+#define DECLARE_VISIT(Type) \ |
+ virtual void Visit##Type(Type##Node* that); |
+FOR_EACH_NODE_TYPE(DECLARE_VISIT) |
+#undef DECLARE_VISIT |
+ |
+ DispatchTable* table() { return table_; } |
+ void set_choice_index(int value) { choice_index_ = value; } |
+ |
+ protected: |
+ DispatchTable *table_; |
Erik Corry
2008/11/25 11:03:52
Misplaced asterisk.
Mads Ager (chromium)
2008/11/25 21:09:41
This is still there.
|
+ int choice_index_; |
+}; |
+ |
+ |
+class Analysis: public NodeVisitor { |
+ public: |
+ void EnsureAnalyzed(RegExpNode* node); |
+ |
+#define DECLARE_VISIT(Type) \ |
+ virtual void Visit##Type(Type##Node* that); |
+FOR_EACH_NODE_TYPE(DECLARE_VISIT) |
+#undef DECLARE_VISIT |
+}; |
+ |
+ |
+struct RegExpParseResult { |
+ RegExpTree* tree; |
+ bool has_character_escapes; |
+ Handle<String> error; |
+ int capture_count; |
+}; |
+ |
+ |
+class RegExpEngine: public AllStatic { |
+ public: |
+ static Handle<FixedArray> Compile(RegExpParseResult* input, |
+ RegExpNode** node_return, |
+ bool ignore_case); |
+ static void DotPrint(const char* label, RegExpNode* node); |
+}; |
+ |
+ |
} } // namespace v8::internal |
#endif // V8_JSREGEXP_H_ |