Chromium Code Reviews

| OLD | NEW |
|---|---|
| 1 // Copyright 2008 the V8 project authors. All rights reserved. | 1 // Copyright 2008 the V8 project authors. All rights reserved. |
| 2 // Redistribution and use in source and binary forms, with or without | 2 // Redistribution and use in source and binary forms, with or without |
| 3 // modification, are permitted provided that the following conditions are | 3 // modification, are permitted provided that the following conditions are |
| 4 // met: | 4 // met: |
| 5 // | 5 // |
| 6 // * Redistributions of source code must retain the above copyright | 6 // * Redistributions of source code must retain the above copyright |
| 7 // notice, this list of conditions and the following disclaimer. | 7 // notice, this list of conditions and the following disclaimer. |
| 8 // * Redistributions in binary form must reproduce the above | 8 // * Redistributions in binary form must reproduce the above |
| 9 // copyright notice, this list of conditions and the following | 9 // copyright notice, this list of conditions and the following |
| 10 // disclaimer in the documentation and/or other materials provided | 10 // disclaimer in the documentation and/or other materials provided |
| (...skipping 11 matching lines...) | |
| 22 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, | 22 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
| 23 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY | 23 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
| 24 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | 24 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| 25 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE | 25 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
| 26 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | 26 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| 27 | 27 |
| 28 // A simple interpreter for the Irregexp byte code. | 28 // A simple interpreter for the Irregexp byte code. |
| 29 | 29 |
| 30 | 30 |
| 31 #include "v8.h" | 31 #include "v8.h" |
| 32 #include "unicode.h" | |
| 32 #include "utils.h" | 33 #include "utils.h" |
| 33 #include "ast.h" | 34 #include "ast.h" |
| 34 #include "bytecodes-irregexp.h" | 35 #include "bytecodes-irregexp.h" |
| 35 #include "interpreter-irregexp.h" | 36 #include "interpreter-irregexp.h" |
| 36 | 37 |
| 37 | 38 |
| 38 namespace v8 { namespace internal { | 39 namespace v8 { namespace internal { |
| 39 | 40 |
| 40 | 41 |
| 42 static unibrow::Mapping<unibrow::Ecma262Canonicalize> canonicalize; | |
| 43 | |
| 44 | |
| 45 static bool BackRefMatchesNoCase(int from, | |
| Review comment by Christian Plesner Hansen (2008/11/25 08:18:45): "If we were concerned about performance we could co…" [comment text truncated in the page preview] | |
| 46 int current, | |
| 47 int len, | |
| 48 Vector<const uc16> subject) { | |
| 49 for (int i = 0; i < len; i++) { | |
| 50 unibrow::uchar old_char = subject[from++]; | |
| 51 unibrow::uchar new_char = subject[current++]; | |
| 52 canonicalize.get(old_char, '\0', &old_char); | |
| 53 canonicalize.get(new_char, '\0', &new_char); | |
| 54 if (old_char != new_char) { | |
| 55 return false; | |
| 56 } | |
| 57 } | |
| 58 return true; | |
| 59 } | |
| 60 | |
| 61 | |
| 41 #ifdef DEBUG | 62 #ifdef DEBUG |
| 42 static void TraceInterpreter(const byte* code_base, | 63 static void TraceInterpreter(const byte* code_base, |
| 43 const byte* pc, | 64 const byte* pc, |
| 44 int stack_depth, | 65 int stack_depth, |
| 45 int current_position, | 66 int current_position, |
| 46 int bytecode_length, | 67 int bytecode_length, |
| 47 const char* bytecode_name) { | 68 const char* bytecode_name) { |
| 48 if (FLAG_trace_regexp_bytecodes) { | 69 if (FLAG_trace_regexp_bytecodes) { |
| 49 PrintF("pc = %02x, sp = %d, current = %d, bc = %s", | 70 PrintF("pc = %02x, sp = %d, current = %d, bc = %s", |
| 50 pc - code_base, | 71 pc - code_base, |
| (...skipping 261 matching lines...) | |
| 312 pc = code_base + Load32(pc + 2); | 333 pc = code_base + Load32(pc + 2); |
| 313 break; | 334 break; |
| 314 } | 335 } |
| 315 } | 336 } |
| 316 if (i < len) break; | 337 if (i < len) break; |
| 317 current += len; | 338 current += len; |
| 318 } | 339 } |
| 319 pc += BC_CHECK_NOT_BACK_REF_LENGTH; | 340 pc += BC_CHECK_NOT_BACK_REF_LENGTH; |
| 320 break; | 341 break; |
| 321 } | 342 } |
| 343 BYTECODE(CHECK_NOT_BACK_REF_NO_CASE) { | |
| 344 int from = registers[pc[1]]; | |
| 345 int len = registers[pc[1] + 1] - from; | |
| 346 if (current + len > subject.length()) { | |
| 347 pc = code_base + Load32(pc + 2); | |
| 348 break; | |
| 349 } else { | |
| 350 if (BackRefMatchesNoCase(from, current, len, subject)) { | |
| 351 pc += BC_CHECK_NOT_BACK_REF_NO_CASE_LENGTH; | |
| 352 } else { | |
| 353 pc = code_base + Load32(pc + 2); | |
| 354 } | |
| 355 } | |
| 356 break; | |
| 357 } | |
| 322 default: | 358 default: |
| 323 UNREACHABLE(); | 359 UNREACHABLE(); |
| 324 break; | 360 break; |
| 325 } | 361 } |
| 326 } | 362 } |
| 327 } | 363 } |
| 328 | 364 |
| 329 | 365 |
| 330 bool IrregexpInterpreter::Match(Handle<ByteArray> code_array, | 366 bool IrregexpInterpreter::Match(Handle<ByteArray> code_array, |
| 331 Handle<String> subject16, | 367 Handle<String> subject16, |
| 332 int* registers, | 368 int* registers, |
| 333 int start_position) { | 369 int start_position) { |
| 334 ASSERT(StringShape(*subject16).IsTwoByteRepresentation()); | 370 ASSERT(StringShape(*subject16).IsTwoByteRepresentation()); |
| 335 ASSERT(subject16->IsFlat(StringShape(*subject16))); | 371 ASSERT(subject16->IsFlat(StringShape(*subject16))); |
| 336 | 372 |
| 337 | 373 |
| 338 AssertNoAllocation a; | 374 AssertNoAllocation a; |
| 339 const byte* code_base = code_array->GetDataStartAddress(); | 375 const byte* code_base = code_array->GetDataStartAddress(); |
| 340 return RawMatch(code_base, | 376 return RawMatch(code_base, |
| 341 Vector<const uc16>(subject16->GetTwoByteData(), | 377 Vector<const uc16>(subject16->GetTwoByteData(), |
| 342 subject16->length()), | 378 subject16->length()), |
| 343 registers, | 379 registers, |
| 344 start_position); | 380 start_position); |
| 345 } | 381 } |
| 346 | 382 |
| 347 } } // namespace v8::internal | 383 } } // namespace v8::internal |
| OLD | NEW |