OLD | NEW |
1 // Copyright 2012 the V8 project authors. All rights reserved. | 1 // Copyright 2012 the V8 project authors. All rights reserved. |
2 // Redistribution and use in source and binary forms, with or without | 2 // Redistribution and use in source and binary forms, with or without |
3 // modification, are permitted provided that the following conditions are | 3 // modification, are permitted provided that the following conditions are |
4 // met: | 4 // met: |
5 // | 5 // |
6 // * Redistributions of source code must retain the above copyright | 6 // * Redistributions of source code must retain the above copyright |
7 // notice, this list of conditions and the following disclaimer. | 7 // notice, this list of conditions and the following disclaimer. |
8 // * Redistributions in binary form must reproduce the above | 8 // * Redistributions in binary form must reproduce the above |
9 // copyright notice, this list of conditions and the following | 9 // copyright notice, this list of conditions and the following |
10 // disclaimer in the documentation and/or other materials provided | 10 // disclaimer in the documentation and/or other materials provided |
(...skipping 213 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
224 Handle<FixedArray> data(FixedArray::cast(re->data())); | 224 Handle<FixedArray> data(FixedArray::cast(re->data())); |
225 compilation_cache->PutRegExp(pattern, flags, data); | 225 compilation_cache->PutRegExp(pattern, flags, data); |
226 | 226 |
227 return re; | 227 return re; |
228 } | 228 } |
229 | 229 |
230 | 230 |
231 Handle<Object> RegExpImpl::Exec(Handle<JSRegExp> regexp, | 231 Handle<Object> RegExpImpl::Exec(Handle<JSRegExp> regexp, |
232 Handle<String> subject, | 232 Handle<String> subject, |
233 int index, | 233 int index, |
234 Handle<JSArray> last_match_info) { | 234 Handle<JSArray> last_match_info, |
| 235 Zone* zone) { |
235 switch (regexp->TypeTag()) { | 236 switch (regexp->TypeTag()) { |
236 case JSRegExp::ATOM: | 237 case JSRegExp::ATOM: |
237 return AtomExec(regexp, subject, index, last_match_info); | 238 return AtomExec(regexp, subject, index, last_match_info); |
238 case JSRegExp::IRREGEXP: { | 239 case JSRegExp::IRREGEXP: { |
239 Handle<Object> result = | 240 Handle<Object> result = |
240 IrregexpExec(regexp, subject, index, last_match_info); | 241 IrregexpExec(regexp, subject, index, last_match_info, zone); |
241 ASSERT(!result.is_null() || | 242 ASSERT(!result.is_null() || |
242 regexp->GetIsolate()->has_pending_exception()); | 243 regexp->GetIsolate()->has_pending_exception()); |
243 return result; | 244 return result; |
244 } | 245 } |
245 default: | 246 default: |
246 UNREACHABLE(); | 247 UNREACHABLE(); |
247 return Handle<Object>::null(); | 248 return Handle<Object>::null(); |
248 } | 249 } |
249 } | 250 } |
250 | 251 |
(...skipping 86 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
337 | 338 |
338 // Irregexp implementation. | 339 // Irregexp implementation. |
339 | 340 |
340 // Ensures that the regexp object contains a compiled version of the | 341 // Ensures that the regexp object contains a compiled version of the |
341 // source for either ASCII or non-ASCII strings. | 342 // source for either ASCII or non-ASCII strings. |
342 // If the compiled version doesn't already exist, it is compiled | 343 // If the compiled version doesn't already exist, it is compiled |
343 // from the source pattern. | 344 // from the source pattern. |
344 // If compilation fails, an exception is thrown and this function | 345 // If compilation fails, an exception is thrown and this function |
345 // returns false. | 346 // returns false. |
346 bool RegExpImpl::EnsureCompiledIrregexp( | 347 bool RegExpImpl::EnsureCompiledIrregexp( |
347 Handle<JSRegExp> re, Handle<String> sample_subject, bool is_ascii) { | 348 Handle<JSRegExp> re, Handle<String> sample_subject, bool is_ascii, |
| 349 Zone* zone) { |
348 Object* compiled_code = re->DataAt(JSRegExp::code_index(is_ascii)); | 350 Object* compiled_code = re->DataAt(JSRegExp::code_index(is_ascii)); |
349 #ifdef V8_INTERPRETED_REGEXP | 351 #ifdef V8_INTERPRETED_REGEXP |
350 if (compiled_code->IsByteArray()) return true; | 352 if (compiled_code->IsByteArray()) return true; |
351 #else // V8_INTERPRETED_REGEXP (RegExp native code) | 353 #else // V8_INTERPRETED_REGEXP (RegExp native code) |
352 if (compiled_code->IsCode()) return true; | 354 if (compiled_code->IsCode()) return true; |
353 #endif | 355 #endif |
354 // We could potentially have marked this as flushable, but have kept | 356 // We could potentially have marked this as flushable, but have kept |
355 // a saved version if we did not flush it yet. | 357 // a saved version if we did not flush it yet. |
356 Object* saved_code = re->DataAt(JSRegExp::saved_code_index(is_ascii)); | 358 Object* saved_code = re->DataAt(JSRegExp::saved_code_index(is_ascii)); |
357 if (saved_code->IsCode()) { | 359 if (saved_code->IsCode()) { |
358 // Reinstate the code in the original place. | 360 // Reinstate the code in the original place. |
359 re->SetDataAt(JSRegExp::code_index(is_ascii), saved_code); | 361 re->SetDataAt(JSRegExp::code_index(is_ascii), saved_code); |
360 ASSERT(compiled_code->IsSmi()); | 362 ASSERT(compiled_code->IsSmi()); |
361 return true; | 363 return true; |
362 } | 364 } |
363 return CompileIrregexp(re, sample_subject, is_ascii); | 365 return CompileIrregexp(re, sample_subject, is_ascii, zone); |
364 } | 366 } |
365 | 367 |
366 | 368 |
367 static bool CreateRegExpErrorObjectAndThrow(Handle<JSRegExp> re, | 369 static bool CreateRegExpErrorObjectAndThrow(Handle<JSRegExp> re, |
368 bool is_ascii, | 370 bool is_ascii, |
369 Handle<String> error_message, | 371 Handle<String> error_message, |
370 Isolate* isolate) { | 372 Isolate* isolate) { |
371 Factory* factory = isolate->factory(); | 373 Factory* factory = isolate->factory(); |
372 Handle<FixedArray> elements = factory->NewFixedArray(2); | 374 Handle<FixedArray> elements = factory->NewFixedArray(2); |
373 elements->set(0, re->Pattern()); | 375 elements->set(0, re->Pattern()); |
374 elements->set(1, *error_message); | 376 elements->set(1, *error_message); |
375 Handle<JSArray> array = factory->NewJSArrayWithElements(elements); | 377 Handle<JSArray> array = factory->NewJSArrayWithElements(elements); |
376 Handle<Object> regexp_err = | 378 Handle<Object> regexp_err = |
377 factory->NewSyntaxError("malformed_regexp", array); | 379 factory->NewSyntaxError("malformed_regexp", array); |
378 isolate->Throw(*regexp_err); | 380 isolate->Throw(*regexp_err); |
379 return false; | 381 return false; |
380 } | 382 } |
381 | 383 |
382 | 384 |
383 bool RegExpImpl::CompileIrregexp(Handle<JSRegExp> re, | 385 bool RegExpImpl::CompileIrregexp(Handle<JSRegExp> re, |
384 Handle<String> sample_subject, | 386 Handle<String> sample_subject, |
385 bool is_ascii) { | 387 bool is_ascii, |
| 388 Zone* zone) { |
386 // Compile the RegExp. | 389 // Compile the RegExp. |
387 Isolate* isolate = re->GetIsolate(); | 390 Isolate* isolate = re->GetIsolate(); |
388 ZoneScope zone_scope(isolate, DELETE_ON_EXIT); | 391 ZoneScope zone_scope(isolate, DELETE_ON_EXIT); |
389 PostponeInterruptsScope postpone(isolate); | 392 PostponeInterruptsScope postpone(isolate); |
390 // If we had a compilation error the last time this is saved at the | 393 // If we had a compilation error the last time this is saved at the |
391 // saved code index. | 394 // saved code index. |
392 Object* entry = re->DataAt(JSRegExp::code_index(is_ascii)); | 395 Object* entry = re->DataAt(JSRegExp::code_index(is_ascii)); |
393 // When arriving here entry can only be a smi, either representing an | 396 // When arriving here entry can only be a smi, either representing an |
394 // uncompiled regexp, a previous compilation error, or code that has | 397 // uncompiled regexp, a previous compilation error, or code that has |
395 // been flushed. | 398 // been flushed. |
(...skipping 30 matching lines...) Expand all Loading... |
426 "malformed_regexp"); | 429 "malformed_regexp"); |
427 return false; | 430 return false; |
428 } | 431 } |
429 RegExpEngine::CompilationResult result = | 432 RegExpEngine::CompilationResult result = |
430 RegExpEngine::Compile(&compile_data, | 433 RegExpEngine::Compile(&compile_data, |
431 flags.is_ignore_case(), | 434 flags.is_ignore_case(), |
432 flags.is_global(), | 435 flags.is_global(), |
433 flags.is_multiline(), | 436 flags.is_multiline(), |
434 pattern, | 437 pattern, |
435 sample_subject, | 438 sample_subject, |
436 is_ascii); | 439 is_ascii, |
| 440 zone); |
437 if (result.error_message != NULL) { | 441 if (result.error_message != NULL) { |
438 // Unable to compile regexp. | 442 // Unable to compile regexp. |
439 Handle<String> error_message = | 443 Handle<String> error_message = |
440 isolate->factory()->NewStringFromUtf8(CStrVector(result.error_message)); | 444 isolate->factory()->NewStringFromUtf8(CStrVector(result.error_message)); |
441 CreateRegExpErrorObjectAndThrow(re, is_ascii, error_message, isolate); | 445 CreateRegExpErrorObjectAndThrow(re, is_ascii, error_message, isolate); |
442 return false; | 446 return false; |
443 } | 447 } |
444 | 448 |
445 Handle<FixedArray> data = Handle<FixedArray>(FixedArray::cast(re->data())); | 449 Handle<FixedArray> data = Handle<FixedArray>(FixedArray::cast(re->data())); |
446 data->set(JSRegExp::code_index(is_ascii), result.code); | 450 data->set(JSRegExp::code_index(is_ascii), result.code); |
(...skipping 44 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
491 // Initialize compiled code entries to null. | 495 // Initialize compiled code entries to null. |
492 re->GetIsolate()->factory()->SetRegExpIrregexpData(re, | 496 re->GetIsolate()->factory()->SetRegExpIrregexpData(re, |
493 JSRegExp::IRREGEXP, | 497 JSRegExp::IRREGEXP, |
494 pattern, | 498 pattern, |
495 flags, | 499 flags, |
496 capture_count); | 500 capture_count); |
497 } | 501 } |
498 | 502 |
499 | 503 |
500 int RegExpImpl::IrregexpPrepare(Handle<JSRegExp> regexp, | 504 int RegExpImpl::IrregexpPrepare(Handle<JSRegExp> regexp, |
501 Handle<String> subject) { | 505 Handle<String> subject, |
| 506 Zone* zone) { |
502 if (!subject->IsFlat()) FlattenString(subject); | 507 if (!subject->IsFlat()) FlattenString(subject); |
503 | 508 |
504 // Check the asciiness of the underlying storage. | 509 // Check the asciiness of the underlying storage. |
505 bool is_ascii = subject->IsAsciiRepresentationUnderneath(); | 510 bool is_ascii = subject->IsAsciiRepresentationUnderneath(); |
506 if (!EnsureCompiledIrregexp(regexp, subject, is_ascii)) return -1; | 511 if (!EnsureCompiledIrregexp(regexp, subject, is_ascii, zone)) return -1; |
507 | 512 |
508 #ifdef V8_INTERPRETED_REGEXP | 513 #ifdef V8_INTERPRETED_REGEXP |
509 // Byte-code regexp needs space allocated for all its registers. | 514 // Byte-code regexp needs space allocated for all its registers. |
510 return IrregexpNumberOfRegisters(FixedArray::cast(regexp->data())); | 515 return IrregexpNumberOfRegisters(FixedArray::cast(regexp->data())); |
511 #else // V8_INTERPRETED_REGEXP | 516 #else // V8_INTERPRETED_REGEXP |
512 // Native regexp only needs room to output captures. Registers are handled | 517 // Native regexp only needs room to output captures. Registers are handled |
513 // internally. | 518 // internally. |
514 return (IrregexpNumberOfCaptures(FixedArray::cast(regexp->data())) + 1) * 2; | 519 return (IrregexpNumberOfCaptures(FixedArray::cast(regexp->data())) + 1) * 2; |
515 #endif // V8_INTERPRETED_REGEXP | 520 #endif // V8_INTERPRETED_REGEXP |
516 } | 521 } |
(...skipping 12 matching lines...) Expand all Loading... |
529 *max_matches = size / registers_per_match; | 534 *max_matches = size / registers_per_match; |
530 return size; | 535 return size; |
531 #endif // V8_INTERPRETED_REGEXP | 536 #endif // V8_INTERPRETED_REGEXP |
532 } | 537 } |
533 | 538 |
534 | 539 |
535 int RegExpImpl::IrregexpExecRaw( | 540 int RegExpImpl::IrregexpExecRaw( |
536 Handle<JSRegExp> regexp, | 541 Handle<JSRegExp> regexp, |
537 Handle<String> subject, | 542 Handle<String> subject, |
538 int index, | 543 int index, |
539 Vector<int> output) { | 544 Vector<int> output, |
| 545 Zone* zone) { |
540 Isolate* isolate = regexp->GetIsolate(); | 546 Isolate* isolate = regexp->GetIsolate(); |
541 | 547 |
542 Handle<FixedArray> irregexp(FixedArray::cast(regexp->data()), isolate); | 548 Handle<FixedArray> irregexp(FixedArray::cast(regexp->data()), isolate); |
543 | 549 |
544 ASSERT(index >= 0); | 550 ASSERT(index >= 0); |
545 ASSERT(index <= subject->length()); | 551 ASSERT(index <= subject->length()); |
546 ASSERT(subject->IsFlat()); | 552 ASSERT(subject->IsFlat()); |
547 | 553 |
548 bool is_ascii = subject->IsAsciiRepresentationUnderneath(); | 554 bool is_ascii = subject->IsAsciiRepresentationUnderneath(); |
549 | 555 |
550 #ifndef V8_INTERPRETED_REGEXP | 556 #ifndef V8_INTERPRETED_REGEXP |
551 ASSERT(output.length() >= (IrregexpNumberOfCaptures(*irregexp) + 1) * 2); | 557 ASSERT(output.length() >= (IrregexpNumberOfCaptures(*irregexp) + 1) * 2); |
552 do { | 558 do { |
553 EnsureCompiledIrregexp(regexp, subject, is_ascii); | 559 EnsureCompiledIrregexp(regexp, subject, is_ascii, zone); |
554 Handle<Code> code(IrregexpNativeCode(*irregexp, is_ascii), isolate); | 560 Handle<Code> code(IrregexpNativeCode(*irregexp, is_ascii), isolate); |
555 NativeRegExpMacroAssembler::Result res = | 561 NativeRegExpMacroAssembler::Result res = |
556 NativeRegExpMacroAssembler::Match(code, | 562 NativeRegExpMacroAssembler::Match(code, |
557 subject, | 563 subject, |
558 output.start(), | 564 output.start(), |
559 output.length(), | 565 output.length(), |
560 index, | 566 index, |
561 isolate); | 567 isolate); |
562 if (res != NativeRegExpMacroAssembler::RETRY) { | 568 if (res != NativeRegExpMacroAssembler::RETRY) { |
563 ASSERT(res != NativeRegExpMacroAssembler::EXCEPTION || | 569 ASSERT(res != NativeRegExpMacroAssembler::EXCEPTION || |
564 isolate->has_pending_exception()); | 570 isolate->has_pending_exception()); |
565 STATIC_ASSERT( | 571 STATIC_ASSERT( |
566 static_cast<int>(NativeRegExpMacroAssembler::SUCCESS) == RE_SUCCESS); | 572 static_cast<int>(NativeRegExpMacroAssembler::SUCCESS) == RE_SUCCESS); |
567 STATIC_ASSERT( | 573 STATIC_ASSERT( |
568 static_cast<int>(NativeRegExpMacroAssembler::FAILURE) == RE_FAILURE); | 574 static_cast<int>(NativeRegExpMacroAssembler::FAILURE) == RE_FAILURE); |
569 STATIC_ASSERT(static_cast<int>(NativeRegExpMacroAssembler::EXCEPTION) | 575 STATIC_ASSERT(static_cast<int>(NativeRegExpMacroAssembler::EXCEPTION) |
570 == RE_EXCEPTION); | 576 == RE_EXCEPTION); |
571 return static_cast<IrregexpResult>(res); | 577 return static_cast<IrregexpResult>(res); |
572 } | 578 } |
573 // If result is RETRY, the string has changed representation, and we | 579 // If result is RETRY, the string has changed representation, and we |
574 // must restart from scratch. | 580 // must restart from scratch. |
575 // In this case, it means we must make sure we are prepared to handle | 581 // In this case, it means we must make sure we are prepared to handle |
576 // the, potentially, different subject (the string can switch between | 582 // the, potentially, different subject (the string can switch between |
577 // being internal and external, and even between being ASCII and UC16, | 583 // being internal and external, and even between being ASCII and UC16, |
578 // but the characters are always the same). | 584 // but the characters are always the same). |
579 IrregexpPrepare(regexp, subject); | 585 IrregexpPrepare(regexp, subject, zone); |
580 is_ascii = subject->IsAsciiRepresentationUnderneath(); | 586 is_ascii = subject->IsAsciiRepresentationUnderneath(); |
581 } while (true); | 587 } while (true); |
582 UNREACHABLE(); | 588 UNREACHABLE(); |
583 return RE_EXCEPTION; | 589 return RE_EXCEPTION; |
584 #else // V8_INTERPRETED_REGEXP | 590 #else // V8_INTERPRETED_REGEXP |
585 | 591 |
586 ASSERT(output.length() >= IrregexpNumberOfRegisters(*irregexp)); | 592 ASSERT(output.length() >= IrregexpNumberOfRegisters(*irregexp)); |
587 // We must have done EnsureCompiledIrregexp, so we can get the number of | 593 // We must have done EnsureCompiledIrregexp, so we can get the number of |
588 // registers. | 594 // registers. |
589 int* register_vector = output.start(); | 595 int* register_vector = output.start(); |
(...skipping 14 matching lines...) Expand all Loading... |
604 isolate->StackOverflow(); | 610 isolate->StackOverflow(); |
605 } | 611 } |
606 return result; | 612 return result; |
607 #endif // V8_INTERPRETED_REGEXP | 613 #endif // V8_INTERPRETED_REGEXP |
608 } | 614 } |
609 | 615 |
610 | 616 |
611 Handle<Object> RegExpImpl::IrregexpExec(Handle<JSRegExp> jsregexp, | 617 Handle<Object> RegExpImpl::IrregexpExec(Handle<JSRegExp> jsregexp, |
612 Handle<String> subject, | 618 Handle<String> subject, |
613 int previous_index, | 619 int previous_index, |
614 Handle<JSArray> last_match_info) { | 620 Handle<JSArray> last_match_info, |
| 621 Zone* zone) { |
615 Isolate* isolate = jsregexp->GetIsolate(); | 622 Isolate* isolate = jsregexp->GetIsolate(); |
616 ASSERT_EQ(jsregexp->TypeTag(), JSRegExp::IRREGEXP); | 623 ASSERT_EQ(jsregexp->TypeTag(), JSRegExp::IRREGEXP); |
617 | 624 |
618 // Prepare space for the return values. | 625 // Prepare space for the return values. |
619 #ifdef V8_INTERPRETED_REGEXP | 626 #ifdef V8_INTERPRETED_REGEXP |
620 #ifdef DEBUG | 627 #ifdef DEBUG |
621 if (FLAG_trace_regexp_bytecodes) { | 628 if (FLAG_trace_regexp_bytecodes) { |
622 String* pattern = jsregexp->Pattern(); | 629 String* pattern = jsregexp->Pattern(); |
623 PrintF("\n\nRegexp match: /%s/\n\n", *(pattern->ToCString())); | 630 PrintF("\n\nRegexp match: /%s/\n\n", *(pattern->ToCString())); |
624 PrintF("\n\nSubject string: '%s'\n\n", *(subject->ToCString())); | 631 PrintF("\n\nSubject string: '%s'\n\n", *(subject->ToCString())); |
625 } | 632 } |
626 #endif | 633 #endif |
627 #endif | 634 #endif |
628 int required_registers = RegExpImpl::IrregexpPrepare(jsregexp, subject); | 635 int required_registers = RegExpImpl::IrregexpPrepare(jsregexp, subject, zone); |
629 if (required_registers < 0) { | 636 if (required_registers < 0) { |
630 // Compiling failed with an exception. | 637 // Compiling failed with an exception. |
631 ASSERT(isolate->has_pending_exception()); | 638 ASSERT(isolate->has_pending_exception()); |
632 return Handle<Object>::null(); | 639 return Handle<Object>::null(); |
633 } | 640 } |
634 | 641 |
635 OffsetsVector registers(required_registers, isolate); | 642 OffsetsVector registers(required_registers, isolate); |
636 | 643 |
637 int res = RegExpImpl::IrregexpExecRaw( | 644 int res = RegExpImpl::IrregexpExecRaw( |
638 jsregexp, subject, previous_index, Vector<int>(registers.vector(), | 645 jsregexp, subject, previous_index, Vector<int>(registers.vector(), |
639 registers.length())); | 646 registers.length()), |
| 647 zone); |
640 if (res == RE_SUCCESS) { | 648 if (res == RE_SUCCESS) { |
641 int capture_register_count = | 649 int capture_register_count = |
642 (IrregexpNumberOfCaptures(FixedArray::cast(jsregexp->data())) + 1) * 2; | 650 (IrregexpNumberOfCaptures(FixedArray::cast(jsregexp->data())) + 1) * 2; |
643 last_match_info->EnsureSize(capture_register_count + kLastMatchOverhead); | 651 last_match_info->EnsureSize(capture_register_count + kLastMatchOverhead); |
644 AssertNoAllocation no_gc; | 652 AssertNoAllocation no_gc; |
645 int* register_vector = registers.vector(); | 653 int* register_vector = registers.vector(); |
646 FixedArray* array = FixedArray::cast(last_match_info->elements()); | 654 FixedArray* array = FixedArray::cast(last_match_info->elements()); |
647 for (int i = 0; i < capture_register_count; i += 2) { | 655 for (int i = 0; i < capture_register_count; i += 2) { |
648 SetCapture(array, i, register_vector[i]); | 656 SetCapture(array, i, register_vector[i]); |
649 SetCapture(array, i + 1, register_vector[i + 1]); | 657 SetCapture(array, i + 1, register_vector[i + 1]); |
(...skipping 260 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
910 | 918 |
911 | 919 |
912 private: | 920 private: |
913 CharacterFrequency frequencies_[RegExpMacroAssembler::kTableSize]; | 921 CharacterFrequency frequencies_[RegExpMacroAssembler::kTableSize]; |
914 int total_samples_; | 922 int total_samples_; |
915 }; | 923 }; |
916 | 924 |
917 | 925 |
918 class RegExpCompiler { | 926 class RegExpCompiler { |
919 public: | 927 public: |
920 RegExpCompiler(int capture_count, bool ignore_case, bool is_ascii); | 928 RegExpCompiler(int capture_count, bool ignore_case, bool is_ascii, |
| 929 Zone* zone); |
921 | 930 |
922 int AllocateRegister() { | 931 int AllocateRegister() { |
923 if (next_register_ >= RegExpMacroAssembler::kMaxRegister) { | 932 if (next_register_ >= RegExpMacroAssembler::kMaxRegister) { |
924 reg_exp_too_big_ = true; | 933 reg_exp_too_big_ = true; |
925 return next_register_; | 934 return next_register_; |
926 } | 935 } |
927 return next_register_++; | 936 return next_register_++; |
928 } | 937 } |
929 | 938 |
930 RegExpEngine::CompilationResult Assemble(RegExpMacroAssembler* assembler, | 939 RegExpEngine::CompilationResult Assemble(RegExpMacroAssembler* assembler, |
(...skipping 19 matching lines...) Expand all Loading... |
950 | 959 |
951 inline bool ignore_case() { return ignore_case_; } | 960 inline bool ignore_case() { return ignore_case_; } |
952 inline bool ascii() { return ascii_; } | 961 inline bool ascii() { return ascii_; } |
953 FrequencyCollator* frequency_collator() { return &frequency_collator_; } | 962 FrequencyCollator* frequency_collator() { return &frequency_collator_; } |
954 | 963 |
955 int current_expansion_factor() { return current_expansion_factor_; } | 964 int current_expansion_factor() { return current_expansion_factor_; } |
956 void set_current_expansion_factor(int value) { | 965 void set_current_expansion_factor(int value) { |
957 current_expansion_factor_ = value; | 966 current_expansion_factor_ = value; |
958 } | 967 } |
959 | 968 |
| 969 Zone* zone() { return zone_; } |
| 970 |
960 static const int kNoRegister = -1; | 971 static const int kNoRegister = -1; |
961 | 972 |
962 private: | 973 private: |
963 EndNode* accept_; | 974 EndNode* accept_; |
964 int next_register_; | 975 int next_register_; |
965 List<RegExpNode*>* work_list_; | 976 List<RegExpNode*>* work_list_; |
966 int recursion_depth_; | 977 int recursion_depth_; |
967 RegExpMacroAssembler* macro_assembler_; | 978 RegExpMacroAssembler* macro_assembler_; |
968 bool ignore_case_; | 979 bool ignore_case_; |
969 bool ascii_; | 980 bool ascii_; |
970 bool reg_exp_too_big_; | 981 bool reg_exp_too_big_; |
971 int current_expansion_factor_; | 982 int current_expansion_factor_; |
972 FrequencyCollator frequency_collator_; | 983 FrequencyCollator frequency_collator_; |
| 984 Zone* zone_; |
973 }; | 985 }; |
974 | 986 |
975 | 987 |
976 class RecursionCheck { | 988 class RecursionCheck { |
977 public: | 989 public: |
978 explicit RecursionCheck(RegExpCompiler* compiler) : compiler_(compiler) { | 990 explicit RecursionCheck(RegExpCompiler* compiler) : compiler_(compiler) { |
979 compiler->IncrementRecursionDepth(); | 991 compiler->IncrementRecursionDepth(); |
980 } | 992 } |
981 ~RecursionCheck() { compiler_->DecrementRecursionDepth(); } | 993 ~RecursionCheck() { compiler_->DecrementRecursionDepth(); } |
982 private: | 994 private: |
983 RegExpCompiler* compiler_; | 995 RegExpCompiler* compiler_; |
984 }; | 996 }; |
985 | 997 |
986 | 998 |
987 static RegExpEngine::CompilationResult IrregexpRegExpTooBig() { | 999 static RegExpEngine::CompilationResult IrregexpRegExpTooBig() { |
988 return RegExpEngine::CompilationResult("RegExp too big"); | 1000 return RegExpEngine::CompilationResult("RegExp too big"); |
989 } | 1001 } |
990 | 1002 |
991 | 1003 |
992 // Attempts to compile the regexp using an Irregexp code generator. Returns | 1004 // Attempts to compile the regexp using an Irregexp code generator. Returns |
993 // a fixed array or a null handle depending on whether it succeeded. | 1005 // a fixed array or a null handle depending on whether it succeeded. |
994 RegExpCompiler::RegExpCompiler(int capture_count, bool ignore_case, bool ascii) | 1006 RegExpCompiler::RegExpCompiler(int capture_count, bool ignore_case, bool ascii, |
| 1007 Zone* zone) |
995 : next_register_(2 * (capture_count + 1)), | 1008 : next_register_(2 * (capture_count + 1)), |
996 work_list_(NULL), | 1009 work_list_(NULL), |
997 recursion_depth_(0), | 1010 recursion_depth_(0), |
998 ignore_case_(ignore_case), | 1011 ignore_case_(ignore_case), |
999 ascii_(ascii), | 1012 ascii_(ascii), |
1000 reg_exp_too_big_(false), | 1013 reg_exp_too_big_(false), |
1001 current_expansion_factor_(1), | 1014 current_expansion_factor_(1), |
1002 frequency_collator_() { | 1015 frequency_collator_(), |
1003 accept_ = new EndNode(EndNode::ACCEPT); | 1016 zone_(zone) { |
| 1017 accept_ = new EndNode(EndNode::ACCEPT, zone); |
1004 ASSERT(next_register_ - 1 <= RegExpMacroAssembler::kMaxRegister); | 1018 ASSERT(next_register_ - 1 <= RegExpMacroAssembler::kMaxRegister); |
1005 } | 1019 } |
1006 | 1020 |
1007 | 1021 |
1008 RegExpEngine::CompilationResult RegExpCompiler::Assemble( | 1022 RegExpEngine::CompilationResult RegExpCompiler::Assemble( |
1009 RegExpMacroAssembler* macro_assembler, | 1023 RegExpMacroAssembler* macro_assembler, |
1010 RegExpNode* start, | 1024 RegExpNode* start, |
1011 int capture_count, | 1025 int capture_count, |
1012 Handle<String> pattern) { | 1026 Handle<String> pattern) { |
1013 Heap* heap = pattern->GetHeap(); | 1027 Heap* heap = pattern->GetHeap(); |
(...skipping 1896 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
2910 RegExpMacroAssembler* assembler = compiler->macro_assembler(); | 2924 RegExpMacroAssembler* assembler = compiler->macro_assembler(); |
2911 Trace::TriBool next_is_word_character = Trace::UNKNOWN; | 2925 Trace::TriBool next_is_word_character = Trace::UNKNOWN; |
2912 bool not_at_start = (trace->at_start() == Trace::FALSE); | 2926 bool not_at_start = (trace->at_start() == Trace::FALSE); |
2913 BoyerMooreLookahead* lookahead = bm_info(not_at_start); | 2927 BoyerMooreLookahead* lookahead = bm_info(not_at_start); |
2914 if (lookahead == NULL) { | 2928 if (lookahead == NULL) { |
2915 int eats_at_least = | 2929 int eats_at_least = |
2916 Min(kMaxLookaheadForBoyerMoore, | 2930 Min(kMaxLookaheadForBoyerMoore, |
2917 EatsAtLeast(kMaxLookaheadForBoyerMoore, 0, not_at_start)); | 2931 EatsAtLeast(kMaxLookaheadForBoyerMoore, 0, not_at_start)); |
2918 if (eats_at_least >= 1) { | 2932 if (eats_at_least >= 1) { |
2919 BoyerMooreLookahead* bm = | 2933 BoyerMooreLookahead* bm = |
2920 new BoyerMooreLookahead(eats_at_least, compiler); | 2934 new BoyerMooreLookahead(eats_at_least, compiler, zone()); |
2921 FillInBMInfo(0, 0, bm, not_at_start); | 2935 FillInBMInfo(0, 0, bm, not_at_start); |
2922 if (bm->at(0)->is_non_word()) next_is_word_character = Trace::FALSE; | 2936 if (bm->at(0)->is_non_word()) next_is_word_character = Trace::FALSE; |
2923 if (bm->at(0)->is_word()) next_is_word_character = Trace::TRUE; | 2937 if (bm->at(0)->is_word()) next_is_word_character = Trace::TRUE; |
2924 } | 2938 } |
2925 } else { | 2939 } else { |
2926 if (lookahead->at(0)->is_non_word()) next_is_word_character = Trace::FALSE; | 2940 if (lookahead->at(0)->is_non_word()) next_is_word_character = Trace::FALSE; |
2927 if (lookahead->at(0)->is_word()) next_is_word_character = Trace::TRUE; | 2941 if (lookahead->at(0)->is_word()) next_is_word_character = Trace::TRUE; |
2928 } | 2942 } |
2929 bool at_boundary = (type_ == AssertionNode::AT_BOUNDARY); | 2943 bool at_boundary = (type_ == AssertionNode::AT_BOUNDARY); |
2930 if (next_is_word_character == Trace::UNKNOWN) { | 2944 if (next_is_word_character == Trace::UNKNOWN) { |
(...skipping 560 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
3491 void BoyerMoorePositionInfo::SetAll() { | 3505 void BoyerMoorePositionInfo::SetAll() { |
3492 s_ = w_ = d_ = kLatticeUnknown; | 3506 s_ = w_ = d_ = kLatticeUnknown; |
3493 if (map_count_ != kMapSize) { | 3507 if (map_count_ != kMapSize) { |
3494 map_count_ = kMapSize; | 3508 map_count_ = kMapSize; |
3495 for (int i = 0; i < kMapSize; i++) map_->at(i) = true; | 3509 for (int i = 0; i < kMapSize; i++) map_->at(i) = true; |
3496 } | 3510 } |
3497 } | 3511 } |
3498 | 3512 |
3499 | 3513 |
3500 BoyerMooreLookahead::BoyerMooreLookahead( | 3514 BoyerMooreLookahead::BoyerMooreLookahead( |
3501 int length, RegExpCompiler* compiler) | 3515 int length, RegExpCompiler* compiler, Zone* zone) |
3502 : length_(length), | 3516 : length_(length), |
3503 compiler_(compiler) { | 3517 compiler_(compiler) { |
3504 if (compiler->ascii()) { | 3518 if (compiler->ascii()) { |
3505 max_char_ = String::kMaxAsciiCharCode; | 3519 max_char_ = String::kMaxAsciiCharCode; |
3506 } else { | 3520 } else { |
3507 max_char_ = String::kMaxUtf16CodeUnit; | 3521 max_char_ = String::kMaxUtf16CodeUnit; |
3508 } | 3522 } |
3509 bitmaps_ = new ZoneList<BoyerMoorePositionInfo*>(length); | 3523 bitmaps_ = new ZoneList<BoyerMoorePositionInfo*>(length); |
3510 for (int i = 0; i < length; i++) { | 3524 for (int i = 0; i < length; i++) { |
3511 bitmaps_->Add(new BoyerMoorePositionInfo()); | 3525 bitmaps_->Add(new BoyerMoorePositionInfo(zone)); |
3512 } | 3526 } |
3513 } | 3527 } |
3514 | 3528 |
3515 | 3529 |
3516 // Find the longest range of lookahead that has the fewest number of different | 3530 // Find the longest range of lookahead that has the fewest number of different |
3517 // characters that can occur at a given position. Since we are optimizing two | 3531 // characters that can occur at a given position. Since we are optimizing two |
3518 // different parameters at once this is a tradeoff. | 3532 // different parameters at once this is a tradeoff. |
3519 bool BoyerMooreLookahead::FindWorthwhileInterval(int* from, int* to) { | 3533 bool BoyerMooreLookahead::FindWorthwhileInterval(int* from, int* to) { |
3520 int biggest_points = 0; | 3534 int biggest_points = 0; |
3521 // If more than 32 characters out of 128 can occur it is unlikely that we can | 3535 // If more than 32 characters out of 128 can occur it is unlikely that we can |
(...skipping 325 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
3847 // not be atoms, they can be any reasonably limited character class or | 3861 // not be atoms, they can be any reasonably limited character class or |
3848 // small alternation. | 3862 // small alternation. |
3849 ASSERT(trace->is_trivial()); // This is the case on LoopChoiceNodes. | 3863 ASSERT(trace->is_trivial()); // This is the case on LoopChoiceNodes. |
3850 BoyerMooreLookahead* lookahead = bm_info(not_at_start); | 3864 BoyerMooreLookahead* lookahead = bm_info(not_at_start); |
3851 if (lookahead == NULL) { | 3865 if (lookahead == NULL) { |
3852 eats_at_least = | 3866 eats_at_least = |
3853 Min(kMaxLookaheadForBoyerMoore, | 3867 Min(kMaxLookaheadForBoyerMoore, |
3854 EatsAtLeast(kMaxLookaheadForBoyerMoore, 0, not_at_start)); | 3868 EatsAtLeast(kMaxLookaheadForBoyerMoore, 0, not_at_start)); |
3855 if (eats_at_least >= 1) { | 3869 if (eats_at_least >= 1) { |
3856 BoyerMooreLookahead* bm = | 3870 BoyerMooreLookahead* bm = |
3857 new BoyerMooreLookahead(eats_at_least, compiler); | 3871 new BoyerMooreLookahead(eats_at_least, compiler, zone()); |
3858 GuardedAlternative alt0 = alternatives_->at(0); | 3872 GuardedAlternative alt0 = alternatives_->at(0); |
3859 alt0.node()->FillInBMInfo(0, 0, bm, not_at_start); | 3873 alt0.node()->FillInBMInfo(0, 0, bm, not_at_start); |
3860 skip_was_emitted = bm->EmitSkipInstructions(macro_assembler); | 3874 skip_was_emitted = bm->EmitSkipInstructions(macro_assembler); |
3861 } | 3875 } |
3862 } else { | 3876 } else { |
3863 skip_was_emitted = lookahead->EmitSkipInstructions(macro_assembler); | 3877 skip_was_emitted = lookahead->EmitSkipInstructions(macro_assembler); |
3864 } | 3878 } |
3865 } | 3879 } |
3866 } | 3880 } |
3867 } | 3881 } |
(...skipping 767 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
4635 RegExpNode* RegExpCharacterClass::ToNode(RegExpCompiler* compiler, | 4649 RegExpNode* RegExpCharacterClass::ToNode(RegExpCompiler* compiler, |
4636 RegExpNode* on_success) { | 4650 RegExpNode* on_success) { |
4637 return new TextNode(this, on_success); | 4651 return new TextNode(this, on_success); |
4638 } | 4652 } |
4639 | 4653 |
4640 | 4654 |
4641 RegExpNode* RegExpDisjunction::ToNode(RegExpCompiler* compiler, | 4655 RegExpNode* RegExpDisjunction::ToNode(RegExpCompiler* compiler, |
4642 RegExpNode* on_success) { | 4656 RegExpNode* on_success) { |
4643 ZoneList<RegExpTree*>* alternatives = this->alternatives(); | 4657 ZoneList<RegExpTree*>* alternatives = this->alternatives(); |
4644 int length = alternatives->length(); | 4658 int length = alternatives->length(); |
4645 ChoiceNode* result = new ChoiceNode(length); | 4659 ChoiceNode* result = new ChoiceNode(length, compiler->zone()); |
4646 for (int i = 0; i < length; i++) { | 4660 for (int i = 0; i < length; i++) { |
4647 GuardedAlternative alternative(alternatives->at(i)->ToNode(compiler, | 4661 GuardedAlternative alternative(alternatives->at(i)->ToNode(compiler, |
4648 on_success)); | 4662 on_success)); |
4649 result->AddAlternative(alternative); | 4663 result->AddAlternative(alternative); |
4650 } | 4664 } |
4651 return result; | 4665 return result; |
4652 } | 4666 } |
4653 | 4667 |
4654 | 4668 |
4655 RegExpNode* RegExpQuantifier::ToNode(RegExpCompiler* compiler, | 4669 RegExpNode* RegExpQuantifier::ToNode(RegExpCompiler* compiler, |
(...skipping 102 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
4758 return answer; | 4772 return answer; |
4759 } | 4773 } |
4760 } | 4774 } |
4761 if (max <= kMaxUnrolledMaxMatches && min == 0) { | 4775 if (max <= kMaxUnrolledMaxMatches && min == 0) { |
4762 ASSERT(max > 0); // Due to the 'if' above. | 4776 ASSERT(max > 0); // Due to the 'if' above. |
4763 RegExpExpansionLimiter limiter(compiler, max); | 4777 RegExpExpansionLimiter limiter(compiler, max); |
4764 if (limiter.ok_to_expand()) { | 4778 if (limiter.ok_to_expand()) { |
4765 // Unroll the optional matches up to max. | 4779 // Unroll the optional matches up to max. |
4766 RegExpNode* answer = on_success; | 4780 RegExpNode* answer = on_success; |
4767 for (int i = 0; i < max; i++) { | 4781 for (int i = 0; i < max; i++) { |
4768 ChoiceNode* alternation = new ChoiceNode(2); | 4782 ChoiceNode* alternation = new ChoiceNode(2, compiler->zone()); |
4769 if (is_greedy) { | 4783 if (is_greedy) { |
4770 alternation->AddAlternative( | 4784 alternation->AddAlternative( |
4771 GuardedAlternative(body->ToNode(compiler, answer))); | 4785 GuardedAlternative(body->ToNode(compiler, answer))); |
4772 alternation->AddAlternative(GuardedAlternative(on_success)); | 4786 alternation->AddAlternative(GuardedAlternative(on_success)); |
4773 } else { | 4787 } else { |
4774 alternation->AddAlternative(GuardedAlternative(on_success)); | 4788 alternation->AddAlternative(GuardedAlternative(on_success)); |
4775 alternation->AddAlternative( | 4789 alternation->AddAlternative( |
4776 GuardedAlternative(body->ToNode(compiler, answer))); | 4790 GuardedAlternative(body->ToNode(compiler, answer))); |
4777 } | 4791 } |
4778 answer = alternation; | 4792 answer = alternation; |
4779 if (not_at_start) alternation->set_not_at_start(); | 4793 if (not_at_start) alternation->set_not_at_start(); |
4780 } | 4794 } |
4781 return answer; | 4795 return answer; |
4782 } | 4796 } |
4783 } | 4797 } |
4784 } | 4798 } |
4785 bool has_min = min > 0; | 4799 bool has_min = min > 0; |
4786 bool has_max = max < RegExpTree::kInfinity; | 4800 bool has_max = max < RegExpTree::kInfinity; |
4787 bool needs_counter = has_min || has_max; | 4801 bool needs_counter = has_min || has_max; |
4788 int reg_ctr = needs_counter | 4802 int reg_ctr = needs_counter |
4789 ? compiler->AllocateRegister() | 4803 ? compiler->AllocateRegister() |
4790 : RegExpCompiler::kNoRegister; | 4804 : RegExpCompiler::kNoRegister; |
4791 LoopChoiceNode* center = new LoopChoiceNode(body->min_match() == 0); | 4805 LoopChoiceNode* center = new LoopChoiceNode(body->min_match() == 0, |
| 4806 compiler->zone()); |
4792 if (not_at_start) center->set_not_at_start(); | 4807 if (not_at_start) center->set_not_at_start(); |
4793 RegExpNode* loop_return = needs_counter | 4808 RegExpNode* loop_return = needs_counter |
4794 ? static_cast<RegExpNode*>(ActionNode::IncrementRegister(reg_ctr, center)) | 4809 ? static_cast<RegExpNode*>(ActionNode::IncrementRegister(reg_ctr, center)) |
4795 : static_cast<RegExpNode*>(center); | 4810 : static_cast<RegExpNode*>(center); |
4796 if (body_can_be_empty) { | 4811 if (body_can_be_empty) { |
4797 // If the body can be empty we need to check if it was and then | 4812 // If the body can be empty we need to check if it was and then |
4798 // backtrack. | 4813 // backtrack. |
4799 loop_return = ActionNode::EmptyMatchCheck(body_start_reg, | 4814 loop_return = ActionNode::EmptyMatchCheck(body_start_reg, |
4800 reg_ctr, | 4815 reg_ctr, |
4801 min, | 4816 min, |
(...skipping 48 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
4850 return AssertionNode::AtNonBoundary(on_success); | 4865 return AssertionNode::AtNonBoundary(on_success); |
4851 case END_OF_INPUT: | 4866 case END_OF_INPUT: |
4852 return AssertionNode::AtEnd(on_success); | 4867 return AssertionNode::AtEnd(on_success); |
4853 case END_OF_LINE: { | 4868 case END_OF_LINE: { |
4854 // Compile $ in multiline regexps as an alternation with a positive | 4869 // Compile $ in multiline regexps as an alternation with a positive |
4855 // lookahead in one side and an end-of-input on the other side. | 4870 // lookahead in one side and an end-of-input on the other side. |
4856 // We need two registers for the lookahead. | 4871 // We need two registers for the lookahead. |
4857 int stack_pointer_register = compiler->AllocateRegister(); | 4872 int stack_pointer_register = compiler->AllocateRegister(); |
4858 int position_register = compiler->AllocateRegister(); | 4873 int position_register = compiler->AllocateRegister(); |
4859 // The ChoiceNode to distinguish between a newline and end-of-input. | 4874 // The ChoiceNode to distinguish between a newline and end-of-input. |
4860 ChoiceNode* result = new ChoiceNode(2); | 4875 ChoiceNode* result = new ChoiceNode(2, compiler->zone()); |
4861 // Create a newline atom. | 4876 // Create a newline atom. |
4862 ZoneList<CharacterRange>* newline_ranges = | 4877 ZoneList<CharacterRange>* newline_ranges = |
4863 new ZoneList<CharacterRange>(3); | 4878 new ZoneList<CharacterRange>(3); |
4864 CharacterRange::AddClassEscape('n', newline_ranges); | 4879 CharacterRange::AddClassEscape('n', newline_ranges); |
4865 RegExpCharacterClass* newline_atom = new RegExpCharacterClass('n'); | 4880 RegExpCharacterClass* newline_atom = new RegExpCharacterClass('n'); |
4866 TextNode* newline_matcher = new TextNode( | 4881 TextNode* newline_matcher = new TextNode( |
4867 newline_atom, | 4882 newline_atom, |
4868 ActionNode::PositiveSubmatchSuccess(stack_pointer_register, | 4883 ActionNode::PositiveSubmatchSuccess(stack_pointer_register, |
4869 position_register, | 4884 position_register, |
4870 0, // No captures inside. | 4885 0, // No captures inside. |
(...skipping 66 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
4937 // the second alternative is tried, which is exactly the desired result | 4952 // the second alternative is tried, which is exactly the desired result |
4938 // for a negative lookahead. The NegativeLookaheadChoiceNode is a special | 4953 // for a negative lookahead. The NegativeLookaheadChoiceNode is a special |
4939 // ChoiceNode that knows to ignore the first exit when calculating quick | 4954 // ChoiceNode that knows to ignore the first exit when calculating quick |
4940 // checks. | 4955 // checks. |
4941 GuardedAlternative body_alt( | 4956 GuardedAlternative body_alt( |
4942 body()->ToNode( | 4957 body()->ToNode( |
4943 compiler, | 4958 compiler, |
4944 success = new NegativeSubmatchSuccess(stack_pointer_register, | 4959 success = new NegativeSubmatchSuccess(stack_pointer_register, |
4945 position_register, | 4960 position_register, |
4946 register_count, | 4961 register_count, |
4947 register_start))); | 4962 register_start, |
| 4963 compiler->zone()))); |
4948 ChoiceNode* choice_node = | 4964 ChoiceNode* choice_node = |
4949 new NegativeLookaheadChoiceNode(body_alt, | 4965 new NegativeLookaheadChoiceNode(body_alt, |
4950 GuardedAlternative(on_success)); | 4966 GuardedAlternative(on_success), |
| 4967 compiler->zone()); |
4951 return ActionNode::BeginSubmatch(stack_pointer_register, | 4968 return ActionNode::BeginSubmatch(stack_pointer_register, |
4952 position_register, | 4969 position_register, |
4953 choice_node); | 4970 choice_node); |
4954 } | 4971 } |
4955 } | 4972 } |
4956 | 4973 |
4957 | 4974 |
4958 RegExpNode* RegExpCapture::ToNode(RegExpCompiler* compiler, | 4975 RegExpNode* RegExpCapture::ToNode(RegExpCompiler* compiler, |
4959 RegExpNode* on_success) { | 4976 RegExpNode* on_success) { |
4960 return ToNode(body(), index(), compiler, on_success); | 4977 return ToNode(body(), index(), compiler, on_success); |
(...skipping 846 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
5807 } | 5824 } |
5808 | 5825 |
5809 | 5826 |
5810 RegExpEngine::CompilationResult RegExpEngine::Compile( | 5827 RegExpEngine::CompilationResult RegExpEngine::Compile( |
5811 RegExpCompileData* data, | 5828 RegExpCompileData* data, |
5812 bool ignore_case, | 5829 bool ignore_case, |
5813 bool is_global, | 5830 bool is_global, |
5814 bool is_multiline, | 5831 bool is_multiline, |
5815 Handle<String> pattern, | 5832 Handle<String> pattern, |
5816 Handle<String> sample_subject, | 5833 Handle<String> sample_subject, |
5817 bool is_ascii) { | 5834 bool is_ascii, |
| 5835 Zone* zone) { |
5818 if ((data->capture_count + 1) * 2 - 1 > RegExpMacroAssembler::kMaxRegister) { | 5836 if ((data->capture_count + 1) * 2 - 1 > RegExpMacroAssembler::kMaxRegister) { |
5819 return IrregexpRegExpTooBig(); | 5837 return IrregexpRegExpTooBig(); |
5820 } | 5838 } |
5821 RegExpCompiler compiler(data->capture_count, ignore_case, is_ascii); | 5839 RegExpCompiler compiler(data->capture_count, ignore_case, is_ascii, zone); |
5822 | 5840 |
5823 // Sample some characters from the middle of the string. | 5841 // Sample some characters from the middle of the string. |
5824 static const int kSampleSize = 128; | 5842 static const int kSampleSize = 128; |
5825 | 5843 |
5826 FlattenString(sample_subject); | 5844 FlattenString(sample_subject); |
5827 int chars_sampled = 0; | 5845 int chars_sampled = 0; |
5828 int half_way = (sample_subject->length() - kSampleSize) / 2; | 5846 int half_way = (sample_subject->length() - kSampleSize) / 2; |
5829 for (int i = Max(0, half_way); | 5847 for (int i = Max(0, half_way); |
5830 i < sample_subject->length() && chars_sampled < kSampleSize; | 5848 i < sample_subject->length() && chars_sampled < kSampleSize; |
5831 i++, chars_sampled++) { | 5849 i++, chars_sampled++) { |
(...skipping 17 matching lines...) Expand all Loading... |
5849 RegExpTree::kInfinity, | 5867 RegExpTree::kInfinity, |
5850 false, | 5868 false, |
5851 new RegExpCharacterClass('*'), | 5869 new RegExpCharacterClass('*'), |
5852 &compiler, | 5870 &compiler, |
5853 captured_body, | 5871 captured_body, |
5854 data->contains_anchor); | 5872 data->contains_anchor); |
5855 | 5873 |
5856 if (data->contains_anchor) { | 5874 if (data->contains_anchor) { |
5857 // Unroll loop once, to take care of the case that might start | 5875 // Unroll loop once, to take care of the case that might start |
5858 // at the start of input. | 5876 // at the start of input. |
5859 ChoiceNode* first_step_node = new ChoiceNode(2); | 5877 ChoiceNode* first_step_node = new ChoiceNode(2, zone); |
5860 first_step_node->AddAlternative(GuardedAlternative(captured_body)); | 5878 first_step_node->AddAlternative(GuardedAlternative(captured_body)); |
5861 first_step_node->AddAlternative(GuardedAlternative( | 5879 first_step_node->AddAlternative(GuardedAlternative( |
5862 new TextNode(new RegExpCharacterClass('*'), loop_node))); | 5880 new TextNode(new RegExpCharacterClass('*'), loop_node))); |
5863 node = first_step_node; | 5881 node = first_step_node; |
5864 } else { | 5882 } else { |
5865 node = loop_node; | 5883 node = loop_node; |
5866 } | 5884 } |
5867 } | 5885 } |
5868 if (is_ascii) { | 5886 if (is_ascii) { |
5869 node = node->FilterASCII(RegExpCompiler::kMaxRecursion); | 5887 node = node->FilterASCII(RegExpCompiler::kMaxRecursion); |
5870 // Do it again to propagate the new nodes to places where they were not | 5888 // Do it again to propagate the new nodes to places where they were not |
5871 // put because they had not been calculated yet. | 5889 // put because they had not been calculated yet. |
5872 if (node != NULL) node = node->FilterASCII(RegExpCompiler::kMaxRecursion); | 5890 if (node != NULL) node = node->FilterASCII(RegExpCompiler::kMaxRecursion); |
5873 } | 5891 } |
5874 | 5892 |
5875 if (node == NULL) node = new EndNode(EndNode::BACKTRACK); | 5893 if (node == NULL) node = new EndNode(EndNode::BACKTRACK, zone); |
5876 data->node = node; | 5894 data->node = node; |
5877 Analysis analysis(ignore_case, is_ascii); | 5895 Analysis analysis(ignore_case, is_ascii); |
5878 analysis.EnsureAnalyzed(node); | 5896 analysis.EnsureAnalyzed(node); |
5879 if (analysis.has_failed()) { | 5897 if (analysis.has_failed()) { |
5880 const char* error_message = analysis.error_message(); | 5898 const char* error_message = analysis.error_message(); |
5881 return CompilationResult(error_message); | 5899 return CompilationResult(error_message); |
5882 } | 5900 } |
5883 | 5901 |
5884 // Create the correct assembler for the architecture. | 5902 // Create the correct assembler for the architecture. |
5885 #ifndef V8_INTERPRETED_REGEXP | 5903 #ifndef V8_INTERPRETED_REGEXP |
(...skipping 31 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
5917 macro_assembler.set_global(is_global); | 5935 macro_assembler.set_global(is_global); |
5918 | 5936 |
5919 return compiler.Assemble(¯o_assembler, | 5937 return compiler.Assemble(¯o_assembler, |
5920 node, | 5938 node, |
5921 data->capture_count, | 5939 data->capture_count, |
5922 pattern); | 5940 pattern); |
5923 } | 5941 } |
5924 | 5942 |
5925 | 5943 |
5926 }} // namespace v8::internal | 5944 }} // namespace v8::internal |
OLD | NEW |