OLD | NEW |
---|---|
1 // Copyright 2006-2008 the V8 project authors. All rights reserved. | 1 // Copyright 2006-2008 the V8 project authors. All rights reserved. |
2 // Redistribution and use in source and binary forms, with or without | 2 // Redistribution and use in source and binary forms, with or without |
3 // modification, are permitted provided that the following conditions are | 3 // modification, are permitted provided that the following conditions are |
4 // met: | 4 // met: |
5 // | 5 // |
6 // * Redistributions of source code must retain the above copyright | 6 // * Redistributions of source code must retain the above copyright |
7 // notice, this list of conditions and the following disclaimer. | 7 // notice, this list of conditions and the following disclaimer. |
8 // * Redistributions in binary form must reproduce the above | 8 // * Redistributions in binary form must reproduce the above |
9 // copyright notice, this list of conditions and the following | 9 // copyright notice, this list of conditions and the following |
10 // disclaimer in the documentation and/or other materials provided | 10 // disclaimer in the documentation and/or other materials provided |
(...skipping 33 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
44 bool* has_pending_exception); | 44 bool* has_pending_exception); |
45 | 45 |
46 // Returns a string representation of a regular expression. | 46 // Returns a string representation of a regular expression. |
47 // Implements RegExp.prototype.toString, see ECMA-262 section 15.10.6.4. | 47 // Implements RegExp.prototype.toString, see ECMA-262 section 15.10.6.4. |
48 // This function calls the garbage collector if necessary. | 48 // This function calls the garbage collector if necessary. |
49 static Handle<String> ToString(Handle<Object> value); | 49 static Handle<String> ToString(Handle<Object> value); |
50 | 50 |
51 // Parses the RegExp pattern and prepares the JSRegExp object with | 51 // Parses the RegExp pattern and prepares the JSRegExp object with |
52 // generic data and choice of implementation - as well as what | 52 // generic data and choice of implementation - as well as what |
53 // the implementation wants to store in the data field. | 53 // the implementation wants to store in the data field. |
54 // Returns false if compilation fails. | |
54 static Handle<Object> Compile(Handle<JSRegExp> re, | 55 static Handle<Object> Compile(Handle<JSRegExp> re, |
55 Handle<String> pattern, | 56 Handle<String> pattern, |
56 Handle<String> flags); | 57 Handle<String> flags); |
57 | 58 |
58 // See ECMA-262 section 15.10.6.2. | 59 // See ECMA-262 section 15.10.6.2. |
59 // This function calls the garbage collector if necessary. | 60 // This function calls the garbage collector if necessary. |
60 static Handle<Object> Exec(Handle<JSRegExp> regexp, | 61 static Handle<Object> Exec(Handle<JSRegExp> regexp, |
61 Handle<String> subject, | 62 Handle<String> subject, |
62 Handle<Object> index); | 63 int index, |
64 Handle<JSArray> lastMatchInfo); | |
63 | 65 |
64 // Call RegExp.prototyp.exec(string) in a loop. | 66 // Call RegExp.prototyp.exec(string) in a loop. |
65 // Used by String.prototype.match and String.prototype.replace. | 67 // Used by String.prototype.match and String.prototype.replace. |
66 // This function calls the garbage collector if necessary. | 68 // This function calls the garbage collector if necessary. |
67 static Handle<Object> ExecGlobal(Handle<JSRegExp> regexp, | 69 static Handle<Object> ExecGlobal(Handle<JSRegExp> regexp, |
68 Handle<String> subject); | 70 Handle<String> subject, |
71 Handle<JSArray> lastMatchInfo); | |
69 | 72 |
70 // Prepares a JSRegExp object with Irregexp-specific data. | 73 // Prepares a JSRegExp object with Irregexp-specific data. |
71 static Handle<Object> IrregexpPrepare(Handle<JSRegExp> re, | 74 static void IrregexpPrepare(Handle<JSRegExp> re, |
72 Handle<String> pattern, | 75 Handle<String> pattern, |
73 JSRegExp::Flags flags); | 76 JSRegExp::Flags flags, |
77 int capture_register_count); | |
74 | 78 |
75 | 79 |
76 static Handle<Object> AtomCompile(Handle<JSRegExp> re, | 80 static void AtomCompile(Handle<JSRegExp> re, |
77 Handle<String> pattern, | 81 Handle<String> pattern, |
78 JSRegExp::Flags flags, | 82 JSRegExp::Flags flags, |
79 Handle<String> match_pattern); | 83 Handle<String> match_pattern); |
80 static Handle<Object> AtomExec(Handle<JSRegExp> regexp, | 84 static Handle<Object> AtomExec(Handle<JSRegExp> regexp, |
81 Handle<String> subject, | 85 Handle<String> subject, |
82 Handle<Object> index); | 86 int index, |
87 Handle<JSArray> lastMatchInfo); | |
83 | 88 |
84 static Handle<Object> AtomExecGlobal(Handle<JSRegExp> regexp, | 89 static Handle<Object> AtomExecGlobal(Handle<JSRegExp> regexp, |
85 Handle<String> subject); | 90 Handle<String> subject, |
91 Handle<JSArray> lastMatchInfo); | |
86 | 92 |
87 // Execute an Irregexp bytecode pattern. | 93 // Execute an Irregexp bytecode pattern. |
88 static Handle<Object> IrregexpExec(Handle<JSRegExp> regexp, | 94 static Handle<Object> IrregexpExec(Handle<JSRegExp> regexp, |
89 Handle<String> subject, | 95 Handle<String> subject, |
90 Handle<Object> index); | 96 int index, |
97 Handle<JSArray> lastMatchInfo); | |
91 | 98 |
92 static Handle<Object> IrregexpExecGlobal(Handle<JSRegExp> regexp, | 99 static Handle<Object> IrregexpExecGlobal(Handle<JSRegExp> regexp, |
93 Handle<String> subject); | 100 Handle<String> subject, |
101 Handle<JSArray> lastMatchInfo); | |
94 | 102 |
95 static void NewSpaceCollectionPrologue(); | 103 static void NewSpaceCollectionPrologue(); |
96 static void OldSpaceCollectionPrologue(); | 104 static void OldSpaceCollectionPrologue(); |
97 | 105 |
98 // Converts a source string to a 16 bit flat string. The string | 106 // Converts a source string to a 16 bit flat string. The string |
99 // will be either sequential or it will be a SlicedString backed | 107 // will be either sequential or it will be a SlicedString backed |
100 // by a flat string. | 108 // by a flat string. |
101 static Handle<String> StringToTwoByte(Handle<String> pattern); | 109 static Handle<String> StringToTwoByte(Handle<String> pattern); |
102 static Handle<String> CachedStringToTwoByte(Handle<String> pattern); | 110 static Handle<String> CachedStringToTwoByte(Handle<String> pattern); |
103 | 111 |
104 static const int kIrregexpImplementationIndex = 0; | 112 // Offsets in the lastMatchInfo array. |
105 static const int kIrregexpNumberOfCapturesIndex = 1; | 113 static const int kLastCaptureCount = 0; |
106 static const int kIrregexpNumberOfRegistersIndex = 2; | 114 static const int kLastSubject = 1; |
107 static const int kIrregexpCodeIndex = 3; | 115 static const int kLastInput = 2; |
108 static const int kIrregexpDataLength = 4; | 116 static const int kFirstCapture = 1; |
117 static const int kLastMatchOverhead = 3; | |
118 static int GetCapture(FixedArray* array, int index) { | |
Mads Ager (chromium)
2009/03/11 13:49:17
This is a general comment on this code. Don't let
Erik Corry
2009/03/11 14:01:06
Changed here, left alone other places in the file.
| |
119 return Smi::cast(array->get(index + kFirstCapture))->value(); | |
120 } | |
121 static void SetLastCaptureCount(FixedArray* array, int to) { | |
122 array->set(kLastCaptureCount, Smi::FromInt(to)); | |
123 } | |
124 static void SetLastSubject(FixedArray* array, String* to) { | |
125 int capture_count = GetLastCaptureCount(array); | |
126 array->set(capture_count + kLastSubject, to); | |
127 } | |
128 static void SetLastInput(FixedArray* array, String* to) { | |
129 int capture_count = GetLastCaptureCount(array); | |
130 array->set(capture_count + kLastInput, to); | |
131 } | |
132 static void SetCapture(FixedArray* array, int index, int to) { | |
133 array->set(index + kFirstCapture, Smi::FromInt(to)); | |
134 } | |
109 | 135 |
110 private: | 136 private: |
111 static String* last_ascii_string_; | 137 static String* last_ascii_string_; |
112 static String* two_byte_cached_string_; | 138 static String* two_byte_cached_string_; |
113 | 139 |
114 static int IrregexpNumberOfCaptures(Handle<FixedArray> re); | 140 static bool EnsureCompiledIrregexp(Handle<JSRegExp> re, bool is_ascii); |
115 static int IrregexpNumberOfRegisters(Handle<FixedArray> re); | 141 |
116 static Handle<ByteArray> IrregexpByteCode(Handle<FixedArray> re); | 142 static int IrregexpMaxRegisterCount(FixedArray* re); |
117 static Handle<Code> IrregexpNativeCode(Handle<FixedArray> re); | 143 static void SetIrregexpMaxRegisterCount(FixedArray* re, int value); |
144 static int IrregexpNumberOfCaptures(FixedArray* re); | |
145 static int IrregexpNumberOfRegisters(FixedArray* re); | |
146 static ByteArray* IrregexpByteCode(FixedArray* re, bool is_ascii); | |
147 static Code* IrregexpNativeCode(FixedArray* re, bool is_ascii); | |
118 | 148 |
119 // On a successful match, the result is a JSArray containing | 149 // On a successful match, the result is a JSArray containing |
120 // captured positions. On a failure, the result is the null value. | 150 // captured positions. On a failure, the result is the null value. |
121 // Returns an empty handle in case of an exception. | 151 // Returns an empty handle in case of an exception. |
122 static Handle<Object> IrregexpExecOnce(Handle<FixedArray> regexp, | 152 static Handle<Object> IrregexpExecOnce(Handle<FixedArray> regexp, |
123 int num_captures, | 153 int num_captures, |
154 Handle<JSArray> lastMatchInfo, | |
124 Handle<String> subject16, | 155 Handle<String> subject16, |
125 int previous_index, | 156 int previous_index, |
126 int* ovector, | 157 int* ovector, |
127 int ovector_length); | 158 int ovector_length); |
128 | 159 |
129 // Set the subject cache. The previous string buffer is not deleted, so the | 160 // Set the subject cache. The previous string buffer is not deleted, so the |
130 // caller should ensure that it doesn't leak. | 161 // caller should ensure that it doesn't leak. |
131 static void SetSubjectCache(String* subject, | 162 static void SetSubjectCache(String* subject, |
132 char* utf8_subject, | 163 char* utf8_subject, |
133 int uft8_length, | 164 int uft8_length, |
134 int character_position, | 165 int character_position, |
135 int utf8_position); | 166 int utf8_position); |
136 | 167 |
168 // Used to access the lastMatchInfo array. | |
169 static int GetLastCaptureCount(FixedArray* array) { | |
170 return Smi::cast(array->get(kLastCaptureCount))->value(); | |
171 } | |
137 // A one element cache of the last utf8_subject string and its length. The | 172 // A one element cache of the last utf8_subject string and its length. The |
138 // subject JS String object is cached in the heap. We also cache a | 173 // subject JS String object is cached in the heap. We also cache a |
139 // translation between position and utf8 position. | 174 // translation between position and utf8 position. |
140 static char* utf8_subject_cache_; | 175 static char* utf8_subject_cache_; |
141 static int utf8_length_cache_; | 176 static int utf8_length_cache_; |
142 static int utf8_position_; | 177 static int utf8_position_; |
143 static int character_position_; | 178 static int character_position_; |
144 }; | 179 }; |
145 | 180 |
146 | 181 |
(...skipping 1165 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
1312 RegExpNode* node; | 1347 RegExpNode* node; |
1313 bool simple; | 1348 bool simple; |
1314 bool contains_anchor; | 1349 bool contains_anchor; |
1315 Handle<String> error; | 1350 Handle<String> error; |
1316 int capture_count; | 1351 int capture_count; |
1317 }; | 1352 }; |
1318 | 1353 |
1319 | 1354 |
1320 class RegExpEngine: public AllStatic { | 1355 class RegExpEngine: public AllStatic { |
1321 public: | 1356 public: |
1322 static Handle<FixedArray> Compile(RegExpCompileData* input, | 1357 struct CompilationResult { |
1323 bool ignore_case, | 1358 explicit CompilationResult(const char* error_message) |
1324 bool multiline, | 1359 : error_message(error_message), |
1325 Handle<String> pattern, | 1360 code(Heap::the_hole_value()), |
1326 bool is_ascii); | 1361 num_registers(0) {} |
1362 CompilationResult(Object* code, int registers) | |
1363 : error_message(NULL), | |
1364 code(code), | |
1365 num_registers(registers) {} | |
1366 const char* error_message; | |
1367 Object* code; | |
1368 int num_registers; | |
1369 }; | |
1370 | |
1371 static CompilationResult Compile(RegExpCompileData* input, | |
1372 bool ignore_case, | |
1373 bool multiline, | |
1374 Handle<String> pattern, | |
1375 bool is_ascii); | |
1327 | 1376 |
1328 static void DotPrint(const char* label, RegExpNode* node, bool ignore_case); | 1377 static void DotPrint(const char* label, RegExpNode* node, bool ignore_case); |
1329 }; | 1378 }; |
1330 | 1379 |
1331 | 1380 |
1332 } } // namespace v8::internal | 1381 } } // namespace v8::internal |
1333 | 1382 |
1334 #endif // V8_JSREGEXP_H_ | 1383 #endif // V8_JSREGEXP_H_ |
OLD | NEW |