Chromium Code Reviews| OLD | NEW |
|---|---|
| 1 // Copyright 2006-2009 the V8 project authors. All rights reserved. | 1 // Copyright 2006-2009 the V8 project authors. All rights reserved. |
| 2 // Redistribution and use in source and binary forms, with or without | 2 // Redistribution and use in source and binary forms, with or without |
| 3 // modification, are permitted provided that the following conditions are | 3 // modification, are permitted provided that the following conditions are |
| 4 // met: | 4 // met: |
| 5 // | 5 // |
| 6 // * Redistributions of source code must retain the above copyright | 6 // * Redistributions of source code must retain the above copyright |
| 7 // notice, this list of conditions and the following disclaimer. | 7 // notice, this list of conditions and the following disclaimer. |
| 8 // * Redistributions in binary form must reproduce the above | 8 // * Redistributions in binary form must reproduce the above |
| 9 // copyright notice, this list of conditions and the following | 9 // copyright notice, this list of conditions and the following |
| 10 // disclaimer in the documentation and/or other materials provided | 10 // disclaimer in the documentation and/or other materials provided |
| (...skipping 141 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
| 152 if (%_ArgumentsLength() === 0) return 0; | 152 if (%_ArgumentsLength() === 0) return 0; |
| 153 return %StringLocaleCompare(TO_STRING_INLINE(this), | 153 return %StringLocaleCompare(TO_STRING_INLINE(this), |
| 154 TO_STRING_INLINE(other)); | 154 TO_STRING_INLINE(other)); |
| 155 } | 155 } |
| 156 | 156 |
| 157 | 157 |
| 158 // ECMA-262 section 15.5.4.10 | 158 // ECMA-262 section 15.5.4.10 |
| 159 function StringMatch(regexp) { | 159 function StringMatch(regexp) { |
| 160 var subject = TO_STRING_INLINE(this); | 160 var subject = TO_STRING_INLINE(this); |
| 161 if (IS_REGEXP(regexp)) { | 161 if (IS_REGEXP(regexp)) { |
| 162 if (!regexp.global) return regexp.exec(subject); | 162 if (!regexp.global) return RegExpExecNoTests(regexp, subject, 0); |
| 163 %_Log('regexp', 'regexp-match,%0S,%1r', [subject, regexp]); | 163 %_Log('regexp', 'regexp-match,%0S,%1r', [subject, regexp]); |
| 164 // lastMatchInfo is defined in regexp.js. | 164 // lastMatchInfo is defined in regexp.js. |
| 165 return %StringMatch(subject, regexp, lastMatchInfo); | 165 return %StringMatch(subject, regexp, lastMatchInfo); |
| 166 } | 166 } |
| 167 // Non-regexp argument. | 167 // Non-regexp argument. |
| 168 regexp = new $RegExp(regexp); | 168 regexp = new $RegExp(regexp); |
| 169 return RegExpExecNoTests(regexp, subject, 0); | 169 return RegExpExecNoTests(regexp, subject, 0); |
| 170 } | 170 } |
| 171 | 171 |
| 172 | 172 |
| (...skipping 67 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
| 240 | 240 |
| 241 return builder.generate(); | 241 return builder.generate(); |
| 242 } | 242 } |
| 243 | 243 |
| 244 | 244 |
| 245 // Expand the $-expressions in the string and return a new string with | 245 // Expand the $-expressions in the string and return a new string with |
| 246 // the result. | 246 // the result. |
| 247 function ExpandReplacement(string, subject, matchInfo, builder) { | 247 function ExpandReplacement(string, subject, matchInfo, builder) { |
| 248 var next = %StringIndexOf(string, '$', 0); | 248 var next = %StringIndexOf(string, '$', 0); |
| 249 if (next < 0) { | 249 if (next < 0) { |
| 250 builder.add(string); | 250 builder.addString(string); |
| 251 return; | 251 return; |
| 252 } | 252 } |
| 253 | 253 |
| 254 // Compute the number of captures; see ECMA-262, 15.5.4.11, p. 102. | 254 // Compute the number of captures; see ECMA-262, 15.5.4.11, p. 102. |
| 255 var m = NUMBER_OF_CAPTURES(matchInfo) >> 1; // Includes the match. | 255 var m = NUMBER_OF_CAPTURES(matchInfo) >> 1; // Includes the match. |
| 256 | 256 |
| 257 if (next > 0) builder.add(SubString(string, 0, next)); | 257 if (next > 0) builder.elements.push(SubString(string, 0, next)); |
|
Lasse Reichstein
2010/12/17 10:38:30
Consider extracting elements from builder, so you
sandholm
2010/12/17 11:50:24
Done.
| |
| 258 var length = string.length; | 258 var length = string.length; |
| 259 | 259 |
| 260 while (true) { | 260 while (true) { |
| 261 var expansion = '$'; | 261 var expansion = '$'; |
| 262 var position = next + 1; | 262 var position = next + 1; |
| 263 if (position < length) { | 263 if (position < length) { |
| 264 var peek = %_StringCharCodeAt(string, position); | 264 var peek = %_StringCharCodeAt(string, position); |
| 265 if (peek == 36) { // $$ | 265 if (peek == 36) { // $$ |
| 266 ++position; | 266 ++position; |
| 267 builder.add('$'); | 267 builder.elements.push('$'); |
| 268 } else if (peek == 38) { // $& - match | 268 } else if (peek == 38) { // $& - match |
| 269 ++position; | 269 ++position; |
| 270 builder.addSpecialSlice(matchInfo[CAPTURE0], | 270 builder.addSpecialSlice(matchInfo[CAPTURE0], |
| 271 matchInfo[CAPTURE1]); | 271 matchInfo[CAPTURE1]); |
| 272 } else if (peek == 96) { // $` - prefix | 272 } else if (peek == 96) { // $` - prefix |
| 273 ++position; | 273 ++position; |
| 274 builder.addSpecialSlice(0, matchInfo[CAPTURE0]); | 274 builder.addSpecialSlice(0, matchInfo[CAPTURE0]); |
| 275 } else if (peek == 39) { // $' - suffix | 275 } else if (peek == 39) { // $' - suffix |
| 276 ++position; | 276 ++position; |
| 277 builder.addSpecialSlice(matchInfo[CAPTURE1], subject.length); | 277 builder.addSpecialSlice(matchInfo[CAPTURE1], subject.length); |
| (...skipping 16 matching lines...) Expand all Loading... | |
| 294 } | 294 } |
| 295 } | 295 } |
| 296 } | 296 } |
| 297 if (0 < n && n < m) { | 297 if (0 < n && n < m) { |
| 298 addCaptureString(builder, matchInfo, n); | 298 addCaptureString(builder, matchInfo, n); |
| 299 } else { | 299 } else { |
| 300 // Because of the captures range check in the parsing of two | 300 // Because of the captures range check in the parsing of two |
| 301 // digit capture references, we can only enter here when a | 301 // digit capture references, we can only enter here when a |
| 302 // single digit capture reference is outside the range of | 302 // single digit capture reference is outside the range of |
| 303 // captures. | 303 // captures. |
| 304 builder.add('$'); | 304 builder.elements.push('$'); |
| 305 --position; | 305 --position; |
| 306 } | 306 } |
| 307 } else { | 307 } else { |
| 308 builder.add('$'); | 308 builder.elements.push('$'); |
| 309 } | 309 } |
| 310 } else { | 310 } else { |
| 311 builder.add('$'); | 311 builder.elements.push('$'); |
| 312 } | 312 } |
| 313 | 313 |
| 314 // Go the the next $ in the string. | 314 // Go the the next $ in the string. |
| 315 next = %StringIndexOf(string, '$', position); | 315 next = %StringIndexOf(string, '$', position); |
| 316 | 316 |
| 317 // Return if there are no more $ characters in the string. If we | 317 // Return if there are no more $ characters in the string. If we |
| 318 // haven't reached the end, we need to append the suffix. | 318 // haven't reached the end, we need to append the suffix. |
| 319 if (next < 0) { | 319 if (next < 0) { |
| 320 if (position < length) { | 320 if (position < length) { |
| 321 builder.add(SubString(string, position, length)); | 321 builder.elements.push(SubString(string, position, length)); |
| 322 } | 322 } |
| 323 return; | 323 return; |
| 324 } | 324 } |
| 325 | 325 |
| 326 // Append substring between the previous and the next $ character. | 326 // Append substring between the previous and the next $ character. |
| 327 builder.add(SubString(string, position, next)); | 327 builder.addString(SubString(string, position, next)); |
| 328 } | 328 } |
| 329 }; | 329 }; |
| 330 | 330 |
| 331 | 331 |
| 332 // Compute the string of a given regular expression capture. | 332 // Compute the string of a given regular expression capture. |
| 333 function CaptureString(string, lastCaptureInfo, index) { | 333 function CaptureString(string, lastCaptureInfo, index) { |
| 334 // Scale the index. | 334 // Scale the index. |
| 335 var scaled = index << 1; | 335 var scaled = index << 1; |
| 336 // Compute start and end. | 336 // Compute start and end. |
| 337 var start = lastCaptureInfo[CAPTURE(scaled)]; | 337 var start = lastCaptureInfo[CAPTURE(scaled)]; |
| (...skipping 214 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
| 552 | 552 |
| 553 if (length === 0) { | 553 if (length === 0) { |
| 554 if (DoRegExpExec(separator, subject, 0, 0) != null) { | 554 if (DoRegExpExec(separator, subject, 0, 0) != null) { |
| 555 return []; | 555 return []; |
| 556 } | 556 } |
| 557 return [subject]; | 557 return [subject]; |
| 558 } | 558 } |
| 559 | 559 |
| 560 var currentIndex = 0; | 560 var currentIndex = 0; |
| 561 var startIndex = 0; | 561 var startIndex = 0; |
| 562 var startMatch = 0; | |
| 562 var result = []; | 563 var result = []; |
| 563 | 564 |
| 564 outer_loop: | 565 outer_loop: |
| 565 while (true) { | 566 while (true) { |
| 566 | 567 |
| 567 if (startIndex === length) { | 568 if (startIndex === length) { |
| 568 result.push(subject.slice(currentIndex, length)); | 569 result.push(SubString(subject, currentIndex, length)); |
| 569 break; | 570 break; |
| 570 } | 571 } |
| 571 | 572 |
| 572 var matchInfo = splitMatch(separator, subject, currentIndex, startIndex); | 573 var matchInfo = DoRegExpExec(separator, subject, startIndex); |
| 573 | 574 if (IS_NULL_OR_UNDEFINED(matchInfo) |
|
Lasse Reichstein
2010/12/17 10:38:30
Why accept undefined?
sandholm
2010/12/17 11:50:24
I am just applying the same semantics as the inlin
| |
| 574 if (IS_NULL(matchInfo)) { | 575 || length === (startMatch = matchInfo[CAPTURE0])) { |
| 575 result.push(subject.slice(currentIndex, length)); | 576 result.push(SubString(subject, currentIndex, length)); |
| 576 break; | 577 break; |
| 577 } | 578 } |
| 578 | |
| 579 var endIndex = matchInfo[CAPTURE1]; | 579 var endIndex = matchInfo[CAPTURE1]; |
| 580 | 580 |
| 581 // We ignore a zero-length match at the currentIndex. | 581 // We ignore a zero-length match at the currentIndex. |
| 582 if (startIndex === endIndex && endIndex === currentIndex) { | 582 if (startIndex === endIndex && endIndex === currentIndex) { |
| 583 startIndex++; | 583 startIndex++; |
| 584 continue; | 584 continue; |
| 585 } | 585 } |
| 586 | 586 |
| 587 result.push(SubString(subject, currentIndex, matchInfo[CAPTURE0])); | 587 if (currentIndex + 1 == startMatch) { |
|
Lasse Reichstein
2010/12/17 10:38:30
Does this really pay off? It seems to be simply in
sandholm
2010/12/17 11:50:24
It is faster. I generally only inline call sites w
| |
| 588 result.push(%_StringCharAt(subject, currentIndex)); | |
| 589 } else { | |
| 590 result.push(%_SubString(subject, currentIndex, startMatch)); | |
| 591 } | |
| 592 | |
| 588 if (result.length === limit) break; | 593 if (result.length === limit) break; |
| 589 | 594 |
| 590 var matchinfo_len = NUMBER_OF_CAPTURES(matchInfo) + REGEXP_FIRST_CAPTURE; | 595 var matchinfo_len = NUMBER_OF_CAPTURES(matchInfo) + REGEXP_FIRST_CAPTURE; |
| 591 for (var i = REGEXP_FIRST_CAPTURE + 2; i < matchinfo_len; ) { | 596 for (var i = REGEXP_FIRST_CAPTURE + 2; i < matchinfo_len; ) { |
| 592 var start = matchInfo[i++]; | 597 var start = matchInfo[i++]; |
| 593 var end = matchInfo[i++]; | 598 var end = matchInfo[i++]; |
| 594 if (end != -1) { | 599 if (end != -1) { |
| 595 if (start + 1 == end) { | 600 if (start + 1 == end) { |
| 596 result.push(%_StringCharAt(subject, start)); | 601 result.push(%_StringCharAt(subject, start)); |
| 597 } else { | 602 } else { |
| 598 result.push(%_SubString(subject, start, end)); | 603 result.push(%_SubString(subject, start, end)); |
| 599 } | 604 } |
| 600 } else { | 605 } else { |
| 601 result.push(void 0); | 606 result.push(void 0); |
| 602 } | 607 } |
| 603 if (result.length === limit) break outer_loop; | 608 if (result.length === limit) break outer_loop; |
| 604 } | 609 } |
| 605 | 610 |
| 606 startIndex = currentIndex = endIndex; | 611 startIndex = currentIndex = endIndex; |
| 607 } | 612 } |
| 608 return result; | 613 return result; |
| 609 } | 614 } |
| 610 | 615 |
| 611 | 616 |
| 612 // ECMA-262 section 15.5.4.14 | |
| 613 // Helper function used by split. This version returns the matchInfo | |
| 614 // instead of allocating a new array with basically the same information. | |
| 615 function splitMatch(separator, subject, current_index, start_index) { | |
| 616 var matchInfo = DoRegExpExec(separator, subject, start_index); | |
| 617 if (matchInfo == null) return null; | |
| 618 // Section 15.5.4.14 paragraph two says that we do not allow zero length | |
| 619 // matches at the end of the string. | |
| 620 if (matchInfo[CAPTURE0] === subject.length) return null; | |
| 621 return matchInfo; | |
| 622 } | |
| 623 | |
| 624 | |
| 625 // ECMA-262 section 15.5.4.15 | 617 // ECMA-262 section 15.5.4.15 |
| 626 function StringSubstring(start, end) { | 618 function StringSubstring(start, end) { |
| 627 var s = TO_STRING_INLINE(this); | 619 var s = TO_STRING_INLINE(this); |
| 628 var s_len = s.length; | 620 var s_len = s.length; |
| 629 | 621 |
| 630 var start_i = TO_INTEGER(start); | 622 var start_i = TO_INTEGER(start); |
| 631 if (start_i < 0) { | 623 if (start_i < 0) { |
| 632 start_i = 0; | 624 start_i = 0; |
| 633 } else if (start_i > s_len) { | 625 } else if (start_i > s_len) { |
| 634 start_i = s_len; | 626 start_i = s_len; |
| (...skipping 202 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
| 837 this.elements = %_Arguments(1); | 829 this.elements = %_Arguments(1); |
| 838 } else { | 830 } else { |
| 839 this.elements = new $Array(); | 831 this.elements = new $Array(); |
| 840 } | 832 } |
| 841 this.special_string = str; | 833 this.special_string = str; |
| 842 } | 834 } |
| 843 | 835 |
| 844 | 836 |
| 845 ReplaceResultBuilder.prototype.add = function(str) { | 837 ReplaceResultBuilder.prototype.add = function(str) { |
| 846 str = TO_STRING_INLINE(str); | 838 str = TO_STRING_INLINE(str); |
| 847 if (str.length > 0) { | 839 if (str.length > 0) this.elements.push(str); |
| 848 var elements = this.elements; | 840 } |
| 849 elements[elements.length] = str; | 841 |
| 850 } | 842 |
| 843 ReplaceResultBuilder.prototype.addString = function(str) { | |
| 844 if (str.length > 0) this.elements.push(str); | |
| 851 } | 845 } |
| 852 | 846 |
| 853 | 847 |
| 854 ReplaceResultBuilder.prototype.addSpecialSlice = function(start, end) { | 848 ReplaceResultBuilder.prototype.addSpecialSlice = function(start, end) { |
| 855 var len = end - start; | 849 var len = end - start; |
| 856 if (start < 0 || len <= 0) return; | 850 if (start < 0 || len <= 0) return; |
| 857 var elements = this.elements; | |
| 858 if (start < 0x80000 && len < 0x800) { | 851 if (start < 0x80000 && len < 0x800) { |
| 859 elements[elements.length] = (start << 11) | len; | 852 this.elements.push((start << 11) | len); |
| 860 } else { | 853 } else { |
| 861 // 0 < len <= String::kMaxLength and Smi::kMaxValue >= String::kMaxLength, | 854 // 0 < len <= String::kMaxLength and Smi::kMaxValue >= String::kMaxLength, |
| 862 // so -len is a smi. | 855 // so -len is a smi. |
| 863 elements[elements.length] = -len; | 856 var elements = this.elements; |
| 864 elements[elements.length] = start; | 857 elements.push(-len); |
| 858 elements.push(start); | |
| 865 } | 859 } |
| 866 } | 860 } |
| 867 | 861 |
| 868 | 862 |
| 869 ReplaceResultBuilder.prototype.generate = function() { | 863 ReplaceResultBuilder.prototype.generate = function() { |
| 870 var elements = this.elements; | 864 var elements = this.elements; |
| 871 return %StringBuilderConcat(elements, elements.length, this.special_string); | 865 return %StringBuilderConcat(elements, elements.length, this.special_string); |
| 872 } | 866 } |
| 873 | 867 |
| 874 | 868 |
| (...skipping 45 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
| 920 "italics", StringItalics, | 914 "italics", StringItalics, |
| 921 "small", StringSmall, | 915 "small", StringSmall, |
| 922 "strike", StringStrike, | 916 "strike", StringStrike, |
| 923 "sub", StringSub, | 917 "sub", StringSub, |
| 924 "sup", StringSup | 918 "sup", StringSup |
| 925 )); | 919 )); |
| 926 } | 920 } |
| 927 | 921 |
| 928 | 922 |
| 929 SetupString(); | 923 SetupString(); |
| OLD | NEW |