OLD | NEW |
| (Empty) |
1 // Copyright 2012 the V8 project authors. All rights reserved. | |
2 // Use of this source code is governed by a BSD-style license that can be | |
3 // found in the LICENSE file. | |
4 | |
5 #include "src/v8.h" | |
6 | |
7 #if V8_TARGET_ARCH_X64 | |
8 | |
9 #include "src/cpu-profiler.h" | |
10 #include "src/log.h" | |
11 #include "src/macro-assembler.h" | |
12 #include "src/regexp-macro-assembler.h" | |
13 #include "src/regexp-stack.h" | |
14 #include "src/unicode.h" | |
15 #include "src/x64/regexp-macro-assembler-x64.h" | |
16 | |
17 namespace v8 { | |
18 namespace internal { | |
19 | |
20 #ifndef V8_INTERPRETED_REGEXP | |
21 | |
22 /* | |
23 * This assembler uses the following register assignment convention | |
24 * - rdx : Currently loaded character(s) as Latin1 or UC16. Must be loaded | |
25 * using LoadCurrentCharacter before using any of the dispatch methods. | |
26 * Temporarily stores the index of capture start after a matching pass | |
27 * for a global regexp. | |
28 * - rdi : Current position in input, as negative offset from end of string. | |
29 * Please notice that this is the byte offset, not the character | |
30 * offset! Is always a 32-bit signed (negative) offset, but must be | |
31 * maintained sign-extended to 64 bits, since it is used as index. | |
32 * - rsi : End of input (points to byte after last character in input), | |
33 * so that rsi+rdi points to the current character. | |
34 * - rbp : Frame pointer. Used to access arguments, local variables and | |
35 * RegExp registers. | |
36 * - rsp : Points to tip of C stack. | |
37 * - rcx : Points to tip of backtrack stack. The backtrack stack contains | |
38 * only 32-bit values. Most are offsets from some base (e.g., character | |
39 * positions from end of string or code location from Code* pointer). | |
40 * - r8 : Code object pointer. Used to convert between absolute and | |
41 * code-object-relative addresses. | |
42 * | |
43 * The registers rax, rbx, r9 and r11 are free to use for computations. | |
44 * If changed to use r12+, they should be saved as callee-save registers. | |
45 * The macro assembler special register r13 (kRootRegister) isn't special | |
46 * during execution of RegExp code (it doesn't hold the value assumed when | |
47 * creating JS code), so Root related macro operations can be used. | |
48 * | |
49 * Each call to a C++ method should retain these registers. | |
50 * | |
51 * The stack will have the following content, in some order, indexable from the | |
52 * frame pointer (see, e.g., kStackHighEnd): | |
53 * - Isolate* isolate (address of the current isolate) | |
54 * - direct_call (if 1, direct call from JavaScript code, if 0 call | |
55 * through the runtime system) | |
56 * - stack_area_base (high end of the memory area to use as | |
57 * backtracking stack) | |
58 * - capture array size (may fit multiple sets of matches) | |
59 * - int* capture_array (int[num_saved_registers_], for output). | |
60 * - end of input (address of end of string) | |
61 * - start of input (address of first character in string) | |
62 * - start index (character index of start) | |
63 * - String* input_string (input string) | |
64 * - return address | |
65 * - backup of callee save registers (rbx, possibly rsi and rdi). | |
66 * - success counter (only useful for global regexp to count matches) | |
67 * - Offset of location before start of input (effectively character | |
68 * position -1). Used to initialize capture registers to a non-position. | |
69 * - At start of string (if 1, we are starting at the start of the | |
70 * string, otherwise 0) | |
71 * - register 0 rbp[-n] (Only positions must be stored in the first | |
72 * - register 1 rbp[-n-8] num_saved_registers_ registers) | |
73 * - ... | |
74 * | |
75 * The first num_saved_registers_ registers are initialized to point to | |
76 * "character -1" in the string (i.e., char_size() bytes before the first | |
77 * character of the string). The remaining registers starts out uninitialized. | |
78 * | |
79 * The first seven values must be provided by the calling code by | |
80 * calling the code's entry address cast to a function pointer with the | |
81 * following signature: | |
82 * int (*match)(String* input_string, | |
83 * int start_index, | |
84 * Address start, | |
85 * Address end, | |
86 * int* capture_output_array, | |
87 * bool at_start, | |
88 * byte* stack_area_base, | |
89 * bool direct_call) | |
90 */ | |
91 | |
92 #define __ ACCESS_MASM((&masm_)) | |
93 | |
94 RegExpMacroAssemblerX64::RegExpMacroAssemblerX64(Isolate* isolate, Zone* zone, | |
95 Mode mode, | |
96 int registers_to_save) | |
97 : NativeRegExpMacroAssembler(isolate, zone), | |
98 masm_(isolate, NULL, kRegExpCodeSize), | |
99 no_root_array_scope_(&masm_), | |
100 code_relative_fixup_positions_(4, zone), | |
101 mode_(mode), | |
102 num_registers_(registers_to_save), | |
103 num_saved_registers_(registers_to_save), | |
104 entry_label_(), | |
105 start_label_(), | |
106 success_label_(), | |
107 backtrack_label_(), | |
108 exit_label_() { | |
109 DCHECK_EQ(0, registers_to_save % 2); | |
110 __ jmp(&entry_label_); // We'll write the entry code when we know more. | |
111 __ bind(&start_label_); // And then continue from here. | |
112 } | |
113 | |
114 | |
115 RegExpMacroAssemblerX64::~RegExpMacroAssemblerX64() { | |
116 // Unuse labels in case we throw away the assembler without calling GetCode. | |
117 entry_label_.Unuse(); | |
118 start_label_.Unuse(); | |
119 success_label_.Unuse(); | |
120 backtrack_label_.Unuse(); | |
121 exit_label_.Unuse(); | |
122 check_preempt_label_.Unuse(); | |
123 stack_overflow_label_.Unuse(); | |
124 } | |
125 | |
126 | |
127 int RegExpMacroAssemblerX64::stack_limit_slack() { | |
128 return RegExpStack::kStackLimitSlack; | |
129 } | |
130 | |
131 | |
132 void RegExpMacroAssemblerX64::AdvanceCurrentPosition(int by) { | |
133 if (by != 0) { | |
134 __ addq(rdi, Immediate(by * char_size())); | |
135 } | |
136 } | |
137 | |
138 | |
139 void RegExpMacroAssemblerX64::AdvanceRegister(int reg, int by) { | |
140 DCHECK(reg >= 0); | |
141 DCHECK(reg < num_registers_); | |
142 if (by != 0) { | |
143 __ addp(register_location(reg), Immediate(by)); | |
144 } | |
145 } | |
146 | |
147 | |
148 void RegExpMacroAssemblerX64::Backtrack() { | |
149 CheckPreemption(); | |
150 // Pop Code* offset from backtrack stack, add Code* and jump to location. | |
151 Pop(rbx); | |
152 __ addp(rbx, code_object_pointer()); | |
153 __ jmp(rbx); | |
154 } | |
155 | |
156 | |
157 void RegExpMacroAssemblerX64::Bind(Label* label) { | |
158 __ bind(label); | |
159 } | |
160 | |
161 | |
162 void RegExpMacroAssemblerX64::CheckCharacter(uint32_t c, Label* on_equal) { | |
163 __ cmpl(current_character(), Immediate(c)); | |
164 BranchOrBacktrack(equal, on_equal); | |
165 } | |
166 | |
167 | |
168 void RegExpMacroAssemblerX64::CheckCharacterGT(uc16 limit, Label* on_greater) { | |
169 __ cmpl(current_character(), Immediate(limit)); | |
170 BranchOrBacktrack(greater, on_greater); | |
171 } | |
172 | |
173 | |
174 void RegExpMacroAssemblerX64::CheckAtStart(Label* on_at_start) { | |
175 Label not_at_start; | |
176 // Did we start the match at the start of the string at all? | |
177 __ cmpl(Operand(rbp, kStartIndex), Immediate(0)); | |
178 BranchOrBacktrack(not_equal, ¬_at_start); | |
179 // If we did, are we still at the start of the input? | |
180 __ leap(rax, Operand(rsi, rdi, times_1, 0)); | |
181 __ cmpp(rax, Operand(rbp, kInputStart)); | |
182 BranchOrBacktrack(equal, on_at_start); | |
183 __ bind(¬_at_start); | |
184 } | |
185 | |
186 | |
187 void RegExpMacroAssemblerX64::CheckNotAtStart(Label* on_not_at_start) { | |
188 // Did we start the match at the start of the string at all? | |
189 __ cmpl(Operand(rbp, kStartIndex), Immediate(0)); | |
190 BranchOrBacktrack(not_equal, on_not_at_start); | |
191 // If we did, are we still at the start of the input? | |
192 __ leap(rax, Operand(rsi, rdi, times_1, 0)); | |
193 __ cmpp(rax, Operand(rbp, kInputStart)); | |
194 BranchOrBacktrack(not_equal, on_not_at_start); | |
195 } | |
196 | |
197 | |
198 void RegExpMacroAssemblerX64::CheckCharacterLT(uc16 limit, Label* on_less) { | |
199 __ cmpl(current_character(), Immediate(limit)); | |
200 BranchOrBacktrack(less, on_less); | |
201 } | |
202 | |
203 | |
204 void RegExpMacroAssemblerX64::CheckGreedyLoop(Label* on_equal) { | |
205 Label fallthrough; | |
206 __ cmpl(rdi, Operand(backtrack_stackpointer(), 0)); | |
207 __ j(not_equal, &fallthrough); | |
208 Drop(); | |
209 BranchOrBacktrack(no_condition, on_equal); | |
210 __ bind(&fallthrough); | |
211 } | |
212 | |
213 | |
214 void RegExpMacroAssemblerX64::CheckNotBackReferenceIgnoreCase( | |
215 int start_reg, | |
216 Label* on_no_match) { | |
217 Label fallthrough; | |
218 ReadPositionFromRegister(rdx, start_reg); // Offset of start of capture | |
219 ReadPositionFromRegister(rbx, start_reg + 1); // Offset of end of capture | |
220 __ subp(rbx, rdx); // Length of capture. | |
221 | |
222 // ----------------------- | |
223 // rdx = Start offset of capture. | |
224 // rbx = Length of capture | |
225 | |
226 // If length is negative, this code will fail (it's a symptom of a partial or | |
227 // illegal capture where start of capture after end of capture). | |
228 // This must not happen (no back-reference can reference a capture that wasn't | |
229 // closed before in the reg-exp, and we must not generate code that can cause | |
230 // this condition). | |
231 | |
232 // If length is zero, either the capture is empty or it is nonparticipating. | |
233 // In either case succeed immediately. | |
234 __ j(equal, &fallthrough); | |
235 | |
236 // ----------------------- | |
237 // rdx - Start of capture | |
238 // rbx - length of capture | |
239 // Check that there are sufficient characters left in the input. | |
240 __ movl(rax, rdi); | |
241 __ addl(rax, rbx); | |
242 BranchOrBacktrack(greater, on_no_match); | |
243 | |
244 if (mode_ == LATIN1) { | |
245 Label loop_increment; | |
246 if (on_no_match == NULL) { | |
247 on_no_match = &backtrack_label_; | |
248 } | |
249 | |
250 __ leap(r9, Operand(rsi, rdx, times_1, 0)); | |
251 __ leap(r11, Operand(rsi, rdi, times_1, 0)); | |
252 __ addp(rbx, r9); // End of capture | |
253 // --------------------- | |
254 // r11 - current input character address | |
255 // r9 - current capture character address | |
256 // rbx - end of capture | |
257 | |
258 Label loop; | |
259 __ bind(&loop); | |
260 __ movzxbl(rdx, Operand(r9, 0)); | |
261 __ movzxbl(rax, Operand(r11, 0)); | |
262 // al - input character | |
263 // dl - capture character | |
264 __ cmpb(rax, rdx); | |
265 __ j(equal, &loop_increment); | |
266 | |
267 // Mismatch, try case-insensitive match (converting letters to lower-case). | |
268 // I.e., if or-ing with 0x20 makes values equal and in range 'a'-'z', it's | |
269 // a match. | |
270 __ orp(rax, Immediate(0x20)); // Convert match character to lower-case. | |
271 __ orp(rdx, Immediate(0x20)); // Convert capture character to lower-case. | |
272 __ cmpb(rax, rdx); | |
273 __ j(not_equal, on_no_match); // Definitely not equal. | |
274 __ subb(rax, Immediate('a')); | |
275 __ cmpb(rax, Immediate('z' - 'a')); | |
276 __ j(below_equal, &loop_increment); // In range 'a'-'z'. | |
277 // Latin-1: Check for values in range [224,254] but not 247. | |
278 __ subb(rax, Immediate(224 - 'a')); | |
279 __ cmpb(rax, Immediate(254 - 224)); | |
280 __ j(above, on_no_match); // Weren't Latin-1 letters. | |
281 __ cmpb(rax, Immediate(247 - 224)); // Check for 247. | |
282 __ j(equal, on_no_match); | |
283 __ bind(&loop_increment); | |
284 // Increment pointers into match and capture strings. | |
285 __ addp(r11, Immediate(1)); | |
286 __ addp(r9, Immediate(1)); | |
287 // Compare to end of capture, and loop if not done. | |
288 __ cmpp(r9, rbx); | |
289 __ j(below, &loop); | |
290 | |
291 // Compute new value of character position after the matched part. | |
292 __ movp(rdi, r11); | |
293 __ subq(rdi, rsi); | |
294 } else { | |
295 DCHECK(mode_ == UC16); | |
296 // Save important/volatile registers before calling C function. | |
297 #ifndef _WIN64 | |
298 // Caller save on Linux and callee save in Windows. | |
299 __ pushq(rsi); | |
300 __ pushq(rdi); | |
301 #endif | |
302 __ pushq(backtrack_stackpointer()); | |
303 | |
304 static const int num_arguments = 4; | |
305 __ PrepareCallCFunction(num_arguments); | |
306 | |
307 // Put arguments into parameter registers. Parameters are | |
308 // Address byte_offset1 - Address captured substring's start. | |
309 // Address byte_offset2 - Address of current character position. | |
310 // size_t byte_length - length of capture in bytes(!) | |
311 // Isolate* isolate | |
312 #ifdef _WIN64 | |
313 // Compute and set byte_offset1 (start of capture). | |
314 __ leap(rcx, Operand(rsi, rdx, times_1, 0)); | |
315 // Set byte_offset2. | |
316 __ leap(rdx, Operand(rsi, rdi, times_1, 0)); | |
317 // Set byte_length. | |
318 __ movp(r8, rbx); | |
319 // Isolate. | |
320 __ LoadAddress(r9, ExternalReference::isolate_address(isolate())); | |
321 #else // AMD64 calling convention | |
322 // Compute byte_offset2 (current position = rsi+rdi). | |
323 __ leap(rax, Operand(rsi, rdi, times_1, 0)); | |
324 // Compute and set byte_offset1 (start of capture). | |
325 __ leap(rdi, Operand(rsi, rdx, times_1, 0)); | |
326 // Set byte_offset2. | |
327 __ movp(rsi, rax); | |
328 // Set byte_length. | |
329 __ movp(rdx, rbx); | |
330 // Isolate. | |
331 __ LoadAddress(rcx, ExternalReference::isolate_address(isolate())); | |
332 #endif | |
333 | |
334 { // NOLINT: Can't find a way to open this scope without confusing the | |
335 // linter. | |
336 AllowExternalCallThatCantCauseGC scope(&masm_); | |
337 ExternalReference compare = | |
338 ExternalReference::re_case_insensitive_compare_uc16(isolate()); | |
339 __ CallCFunction(compare, num_arguments); | |
340 } | |
341 | |
342 // Restore original values before reacting on result value. | |
343 __ Move(code_object_pointer(), masm_.CodeObject()); | |
344 __ popq(backtrack_stackpointer()); | |
345 #ifndef _WIN64 | |
346 __ popq(rdi); | |
347 __ popq(rsi); | |
348 #endif | |
349 | |
350 // Check if function returned non-zero for success or zero for failure. | |
351 __ testp(rax, rax); | |
352 BranchOrBacktrack(zero, on_no_match); | |
353 // On success, increment position by length of capture. | |
354 // Requires that rbx is callee save (true for both Win64 and AMD64 ABIs). | |
355 __ addq(rdi, rbx); | |
356 } | |
357 __ bind(&fallthrough); | |
358 } | |
359 | |
360 | |
361 void RegExpMacroAssemblerX64::CheckNotBackReference( | |
362 int start_reg, | |
363 Label* on_no_match) { | |
364 Label fallthrough; | |
365 | |
366 // Find length of back-referenced capture. | |
367 ReadPositionFromRegister(rdx, start_reg); // Offset of start of capture | |
368 ReadPositionFromRegister(rax, start_reg + 1); // Offset of end of capture | |
369 __ subp(rax, rdx); // Length to check. | |
370 | |
371 // Fail on partial or illegal capture (start of capture after end of capture). | |
372 // This must not happen (no back-reference can reference a capture that wasn't | |
373 // closed before in the reg-exp). | |
374 __ Check(greater_equal, kInvalidCaptureReferenced); | |
375 | |
376 // Succeed on empty capture (including non-participating capture) | |
377 __ j(equal, &fallthrough); | |
378 | |
379 // ----------------------- | |
380 // rdx - Start of capture | |
381 // rax - length of capture | |
382 | |
383 // Check that there are sufficient characters left in the input. | |
384 __ movl(rbx, rdi); | |
385 __ addl(rbx, rax); | |
386 BranchOrBacktrack(greater, on_no_match); | |
387 | |
388 // Compute pointers to match string and capture string | |
389 __ leap(rbx, Operand(rsi, rdi, times_1, 0)); // Start of match. | |
390 __ addp(rdx, rsi); // Start of capture. | |
391 __ leap(r9, Operand(rdx, rax, times_1, 0)); // End of capture | |
392 | |
393 // ----------------------- | |
394 // rbx - current capture character address. | |
395 // rbx - current input character address . | |
396 // r9 - end of input to match (capture length after rbx). | |
397 | |
398 Label loop; | |
399 __ bind(&loop); | |
400 if (mode_ == LATIN1) { | |
401 __ movzxbl(rax, Operand(rdx, 0)); | |
402 __ cmpb(rax, Operand(rbx, 0)); | |
403 } else { | |
404 DCHECK(mode_ == UC16); | |
405 __ movzxwl(rax, Operand(rdx, 0)); | |
406 __ cmpw(rax, Operand(rbx, 0)); | |
407 } | |
408 BranchOrBacktrack(not_equal, on_no_match); | |
409 // Increment pointers into capture and match string. | |
410 __ addp(rbx, Immediate(char_size())); | |
411 __ addp(rdx, Immediate(char_size())); | |
412 // Check if we have reached end of match area. | |
413 __ cmpp(rdx, r9); | |
414 __ j(below, &loop); | |
415 | |
416 // Success. | |
417 // Set current character position to position after match. | |
418 __ movp(rdi, rbx); | |
419 __ subq(rdi, rsi); | |
420 | |
421 __ bind(&fallthrough); | |
422 } | |
423 | |
424 | |
425 void RegExpMacroAssemblerX64::CheckNotCharacter(uint32_t c, | |
426 Label* on_not_equal) { | |
427 __ cmpl(current_character(), Immediate(c)); | |
428 BranchOrBacktrack(not_equal, on_not_equal); | |
429 } | |
430 | |
431 | |
432 void RegExpMacroAssemblerX64::CheckCharacterAfterAnd(uint32_t c, | |
433 uint32_t mask, | |
434 Label* on_equal) { | |
435 if (c == 0) { | |
436 __ testl(current_character(), Immediate(mask)); | |
437 } else { | |
438 __ movl(rax, Immediate(mask)); | |
439 __ andp(rax, current_character()); | |
440 __ cmpl(rax, Immediate(c)); | |
441 } | |
442 BranchOrBacktrack(equal, on_equal); | |
443 } | |
444 | |
445 | |
446 void RegExpMacroAssemblerX64::CheckNotCharacterAfterAnd(uint32_t c, | |
447 uint32_t mask, | |
448 Label* on_not_equal) { | |
449 if (c == 0) { | |
450 __ testl(current_character(), Immediate(mask)); | |
451 } else { | |
452 __ movl(rax, Immediate(mask)); | |
453 __ andp(rax, current_character()); | |
454 __ cmpl(rax, Immediate(c)); | |
455 } | |
456 BranchOrBacktrack(not_equal, on_not_equal); | |
457 } | |
458 | |
459 | |
460 void RegExpMacroAssemblerX64::CheckNotCharacterAfterMinusAnd( | |
461 uc16 c, | |
462 uc16 minus, | |
463 uc16 mask, | |
464 Label* on_not_equal) { | |
465 DCHECK(minus < String::kMaxUtf16CodeUnit); | |
466 __ leap(rax, Operand(current_character(), -minus)); | |
467 __ andp(rax, Immediate(mask)); | |
468 __ cmpl(rax, Immediate(c)); | |
469 BranchOrBacktrack(not_equal, on_not_equal); | |
470 } | |
471 | |
472 | |
473 void RegExpMacroAssemblerX64::CheckCharacterInRange( | |
474 uc16 from, | |
475 uc16 to, | |
476 Label* on_in_range) { | |
477 __ leal(rax, Operand(current_character(), -from)); | |
478 __ cmpl(rax, Immediate(to - from)); | |
479 BranchOrBacktrack(below_equal, on_in_range); | |
480 } | |
481 | |
482 | |
483 void RegExpMacroAssemblerX64::CheckCharacterNotInRange( | |
484 uc16 from, | |
485 uc16 to, | |
486 Label* on_not_in_range) { | |
487 __ leal(rax, Operand(current_character(), -from)); | |
488 __ cmpl(rax, Immediate(to - from)); | |
489 BranchOrBacktrack(above, on_not_in_range); | |
490 } | |
491 | |
492 | |
493 void RegExpMacroAssemblerX64::CheckBitInTable( | |
494 Handle<ByteArray> table, | |
495 Label* on_bit_set) { | |
496 __ Move(rax, table); | |
497 Register index = current_character(); | |
498 if (mode_ != LATIN1 || kTableMask != String::kMaxOneByteCharCode) { | |
499 __ movp(rbx, current_character()); | |
500 __ andp(rbx, Immediate(kTableMask)); | |
501 index = rbx; | |
502 } | |
503 __ cmpb(FieldOperand(rax, index, times_1, ByteArray::kHeaderSize), | |
504 Immediate(0)); | |
505 BranchOrBacktrack(not_equal, on_bit_set); | |
506 } | |
507 | |
508 | |
509 bool RegExpMacroAssemblerX64::CheckSpecialCharacterClass(uc16 type, | |
510 Label* on_no_match) { | |
511 // Range checks (c in min..max) are generally implemented by an unsigned | |
512 // (c - min) <= (max - min) check, using the sequence: | |
513 // leap(rax, Operand(current_character(), -min)) or sub(rax, Immediate(min)) | |
514 // cmp(rax, Immediate(max - min)) | |
515 switch (type) { | |
516 case 's': | |
517 // Match space-characters | |
518 if (mode_ == LATIN1) { | |
519 // One byte space characters are '\t'..'\r', ' ' and \u00a0. | |
520 Label success; | |
521 __ cmpl(current_character(), Immediate(' ')); | |
522 __ j(equal, &success, Label::kNear); | |
523 // Check range 0x09..0x0d | |
524 __ leap(rax, Operand(current_character(), -'\t')); | |
525 __ cmpl(rax, Immediate('\r' - '\t')); | |
526 __ j(below_equal, &success, Label::kNear); | |
527 // \u00a0 (NBSP). | |
528 __ cmpl(rax, Immediate(0x00a0 - '\t')); | |
529 BranchOrBacktrack(not_equal, on_no_match); | |
530 __ bind(&success); | |
531 return true; | |
532 } | |
533 return false; | |
534 case 'S': | |
535 // The emitted code for generic character classes is good enough. | |
536 return false; | |
537 case 'd': | |
538 // Match ASCII digits ('0'..'9') | |
539 __ leap(rax, Operand(current_character(), -'0')); | |
540 __ cmpl(rax, Immediate('9' - '0')); | |
541 BranchOrBacktrack(above, on_no_match); | |
542 return true; | |
543 case 'D': | |
544 // Match non ASCII-digits | |
545 __ leap(rax, Operand(current_character(), -'0')); | |
546 __ cmpl(rax, Immediate('9' - '0')); | |
547 BranchOrBacktrack(below_equal, on_no_match); | |
548 return true; | |
549 case '.': { | |
550 // Match non-newlines (not 0x0a('\n'), 0x0d('\r'), 0x2028 and 0x2029) | |
551 __ movl(rax, current_character()); | |
552 __ xorp(rax, Immediate(0x01)); | |
553 // See if current character is '\n'^1 or '\r'^1, i.e., 0x0b or 0x0c | |
554 __ subl(rax, Immediate(0x0b)); | |
555 __ cmpl(rax, Immediate(0x0c - 0x0b)); | |
556 BranchOrBacktrack(below_equal, on_no_match); | |
557 if (mode_ == UC16) { | |
558 // Compare original value to 0x2028 and 0x2029, using the already | |
559 // computed (current_char ^ 0x01 - 0x0b). I.e., check for | |
560 // 0x201d (0x2028 - 0x0b) or 0x201e. | |
561 __ subl(rax, Immediate(0x2028 - 0x0b)); | |
562 __ cmpl(rax, Immediate(0x2029 - 0x2028)); | |
563 BranchOrBacktrack(below_equal, on_no_match); | |
564 } | |
565 return true; | |
566 } | |
567 case 'n': { | |
568 // Match newlines (0x0a('\n'), 0x0d('\r'), 0x2028 and 0x2029) | |
569 __ movl(rax, current_character()); | |
570 __ xorp(rax, Immediate(0x01)); | |
571 // See if current character is '\n'^1 or '\r'^1, i.e., 0x0b or 0x0c | |
572 __ subl(rax, Immediate(0x0b)); | |
573 __ cmpl(rax, Immediate(0x0c - 0x0b)); | |
574 if (mode_ == LATIN1) { | |
575 BranchOrBacktrack(above, on_no_match); | |
576 } else { | |
577 Label done; | |
578 BranchOrBacktrack(below_equal, &done); | |
579 // Compare original value to 0x2028 and 0x2029, using the already | |
580 // computed (current_char ^ 0x01 - 0x0b). I.e., check for | |
581 // 0x201d (0x2028 - 0x0b) or 0x201e. | |
582 __ subl(rax, Immediate(0x2028 - 0x0b)); | |
583 __ cmpl(rax, Immediate(0x2029 - 0x2028)); | |
584 BranchOrBacktrack(above, on_no_match); | |
585 __ bind(&done); | |
586 } | |
587 return true; | |
588 } | |
589 case 'w': { | |
590 if (mode_ != LATIN1) { | |
591 // Table is 256 entries, so all Latin1 characters can be tested. | |
592 __ cmpl(current_character(), Immediate('z')); | |
593 BranchOrBacktrack(above, on_no_match); | |
594 } | |
595 __ Move(rbx, ExternalReference::re_word_character_map()); | |
596 DCHECK_EQ(0, word_character_map[0]); // Character '\0' is not a word char. | |
597 __ testb(Operand(rbx, current_character(), times_1, 0), | |
598 current_character()); | |
599 BranchOrBacktrack(zero, on_no_match); | |
600 return true; | |
601 } | |
602 case 'W': { | |
603 Label done; | |
604 if (mode_ != LATIN1) { | |
605 // Table is 256 entries, so all Latin1 characters can be tested. | |
606 __ cmpl(current_character(), Immediate('z')); | |
607 __ j(above, &done); | |
608 } | |
609 __ Move(rbx, ExternalReference::re_word_character_map()); | |
610 DCHECK_EQ(0, word_character_map[0]); // Character '\0' is not a word char. | |
611 __ testb(Operand(rbx, current_character(), times_1, 0), | |
612 current_character()); | |
613 BranchOrBacktrack(not_zero, on_no_match); | |
614 if (mode_ != LATIN1) { | |
615 __ bind(&done); | |
616 } | |
617 return true; | |
618 } | |
619 | |
620 case '*': | |
621 // Match any character. | |
622 return true; | |
623 // No custom implementation (yet): s(UC16), S(UC16). | |
624 default: | |
625 return false; | |
626 } | |
627 } | |
628 | |
629 | |
630 void RegExpMacroAssemblerX64::Fail() { | |
631 STATIC_ASSERT(FAILURE == 0); // Return value for failure is zero. | |
632 if (!global()) { | |
633 __ Set(rax, FAILURE); | |
634 } | |
635 __ jmp(&exit_label_); | |
636 } | |
637 | |
638 | |
639 Handle<HeapObject> RegExpMacroAssemblerX64::GetCode(Handle<String> source) { | |
640 Label return_rax; | |
641 // Finalize code - write the entry point code now we know how many | |
642 // registers we need. | |
643 // Entry code: | |
644 __ bind(&entry_label_); | |
645 | |
646 // Tell the system that we have a stack frame. Because the type is MANUAL, no | |
647 // is generated. | |
648 FrameScope scope(&masm_, StackFrame::MANUAL); | |
649 | |
650 // Actually emit code to start a new stack frame. | |
651 __ pushq(rbp); | |
652 __ movp(rbp, rsp); | |
653 // Save parameters and callee-save registers. Order here should correspond | |
654 // to order of kBackup_ebx etc. | |
655 #ifdef _WIN64 | |
656 // MSVC passes arguments in rcx, rdx, r8, r9, with backing stack slots. | |
657 // Store register parameters in pre-allocated stack slots, | |
658 __ movq(Operand(rbp, kInputString), rcx); | |
659 __ movq(Operand(rbp, kStartIndex), rdx); // Passed as int32 in edx. | |
660 __ movq(Operand(rbp, kInputStart), r8); | |
661 __ movq(Operand(rbp, kInputEnd), r9); | |
662 // Callee-save on Win64. | |
663 __ pushq(rsi); | |
664 __ pushq(rdi); | |
665 __ pushq(rbx); | |
666 #else | |
667 // GCC passes arguments in rdi, rsi, rdx, rcx, r8, r9 (and then on stack). | |
668 // Push register parameters on stack for reference. | |
669 DCHECK_EQ(kInputString, -1 * kRegisterSize); | |
670 DCHECK_EQ(kStartIndex, -2 * kRegisterSize); | |
671 DCHECK_EQ(kInputStart, -3 * kRegisterSize); | |
672 DCHECK_EQ(kInputEnd, -4 * kRegisterSize); | |
673 DCHECK_EQ(kRegisterOutput, -5 * kRegisterSize); | |
674 DCHECK_EQ(kNumOutputRegisters, -6 * kRegisterSize); | |
675 __ pushq(rdi); | |
676 __ pushq(rsi); | |
677 __ pushq(rdx); | |
678 __ pushq(rcx); | |
679 __ pushq(r8); | |
680 __ pushq(r9); | |
681 | |
682 __ pushq(rbx); // Callee-save | |
683 #endif | |
684 | |
685 __ Push(Immediate(0)); // Number of successful matches in a global regexp. | |
686 __ Push(Immediate(0)); // Make room for "input start - 1" constant. | |
687 | |
688 // Check if we have space on the stack for registers. | |
689 Label stack_limit_hit; | |
690 Label stack_ok; | |
691 | |
692 ExternalReference stack_limit = | |
693 ExternalReference::address_of_stack_limit(isolate()); | |
694 __ movp(rcx, rsp); | |
695 __ Move(kScratchRegister, stack_limit); | |
696 __ subp(rcx, Operand(kScratchRegister, 0)); | |
697 // Handle it if the stack pointer is already below the stack limit. | |
698 __ j(below_equal, &stack_limit_hit); | |
699 // Check if there is room for the variable number of registers above | |
700 // the stack limit. | |
701 __ cmpp(rcx, Immediate(num_registers_ * kPointerSize)); | |
702 __ j(above_equal, &stack_ok); | |
703 // Exit with OutOfMemory exception. There is not enough space on the stack | |
704 // for our working registers. | |
705 __ Set(rax, EXCEPTION); | |
706 __ jmp(&return_rax); | |
707 | |
708 __ bind(&stack_limit_hit); | |
709 __ Move(code_object_pointer(), masm_.CodeObject()); | |
710 CallCheckStackGuardState(); // Preserves no registers beside rbp and rsp. | |
711 __ testp(rax, rax); | |
712 // If returned value is non-zero, we exit with the returned value as result. | |
713 __ j(not_zero, &return_rax); | |
714 | |
715 __ bind(&stack_ok); | |
716 | |
717 // Allocate space on stack for registers. | |
718 __ subp(rsp, Immediate(num_registers_ * kPointerSize)); | |
719 // Load string length. | |
720 __ movp(rsi, Operand(rbp, kInputEnd)); | |
721 // Load input position. | |
722 __ movp(rdi, Operand(rbp, kInputStart)); | |
723 // Set up rdi to be negative offset from string end. | |
724 __ subq(rdi, rsi); | |
725 // Set rax to address of char before start of the string | |
726 // (effectively string position -1). | |
727 __ movp(rbx, Operand(rbp, kStartIndex)); | |
728 __ negq(rbx); | |
729 if (mode_ == UC16) { | |
730 __ leap(rax, Operand(rdi, rbx, times_2, -char_size())); | |
731 } else { | |
732 __ leap(rax, Operand(rdi, rbx, times_1, -char_size())); | |
733 } | |
734 // Store this value in a local variable, for use when clearing | |
735 // position registers. | |
736 __ movp(Operand(rbp, kInputStartMinusOne), rax); | |
737 | |
738 #if V8_OS_WIN | |
739 // Ensure that we have written to each stack page, in order. Skipping a page | |
740 // on Windows can cause segmentation faults. Assuming page size is 4k. | |
741 const int kPageSize = 4096; | |
742 const int kRegistersPerPage = kPageSize / kPointerSize; | |
743 for (int i = num_saved_registers_ + kRegistersPerPage - 1; | |
744 i < num_registers_; | |
745 i += kRegistersPerPage) { | |
746 __ movp(register_location(i), rax); // One write every page. | |
747 } | |
748 #endif // V8_OS_WIN | |
749 | |
750 // Initialize code object pointer. | |
751 __ Move(code_object_pointer(), masm_.CodeObject()); | |
752 | |
753 Label load_char_start_regexp, start_regexp; | |
754 // Load newline if index is at start, previous character otherwise. | |
755 __ cmpl(Operand(rbp, kStartIndex), Immediate(0)); | |
756 __ j(not_equal, &load_char_start_regexp, Label::kNear); | |
757 __ Set(current_character(), '\n'); | |
758 __ jmp(&start_regexp, Label::kNear); | |
759 | |
760 // Global regexp restarts matching here. | |
761 __ bind(&load_char_start_regexp); | |
762 // Load previous char as initial value of current character register. | |
763 LoadCurrentCharacterUnchecked(-1, 1); | |
764 __ bind(&start_regexp); | |
765 | |
766 // Initialize on-stack registers. | |
767 if (num_saved_registers_ > 0) { | |
768 // Fill saved registers with initial value = start offset - 1 | |
769 // Fill in stack push order, to avoid accessing across an unwritten | |
770 // page (a problem on Windows). | |
771 if (num_saved_registers_ > 8) { | |
772 __ Set(rcx, kRegisterZero); | |
773 Label init_loop; | |
774 __ bind(&init_loop); | |
775 __ movp(Operand(rbp, rcx, times_1, 0), rax); | |
776 __ subq(rcx, Immediate(kPointerSize)); | |
777 __ cmpq(rcx, | |
778 Immediate(kRegisterZero - num_saved_registers_ * kPointerSize)); | |
779 __ j(greater, &init_loop); | |
780 } else { // Unroll the loop. | |
781 for (int i = 0; i < num_saved_registers_; i++) { | |
782 __ movp(register_location(i), rax); | |
783 } | |
784 } | |
785 } | |
786 | |
787 // Initialize backtrack stack pointer. | |
788 __ movp(backtrack_stackpointer(), Operand(rbp, kStackHighEnd)); | |
789 | |
790 __ jmp(&start_label_); | |
791 | |
792 // Exit code: | |
793 if (success_label_.is_linked()) { | |
794 // Save captures when successful. | |
795 __ bind(&success_label_); | |
796 if (num_saved_registers_ > 0) { | |
797 // copy captures to output | |
798 __ movp(rdx, Operand(rbp, kStartIndex)); | |
799 __ movp(rbx, Operand(rbp, kRegisterOutput)); | |
800 __ movp(rcx, Operand(rbp, kInputEnd)); | |
801 __ subp(rcx, Operand(rbp, kInputStart)); | |
802 if (mode_ == UC16) { | |
803 __ leap(rcx, Operand(rcx, rdx, times_2, 0)); | |
804 } else { | |
805 __ addp(rcx, rdx); | |
806 } | |
807 for (int i = 0; i < num_saved_registers_; i++) { | |
808 __ movp(rax, register_location(i)); | |
809 if (i == 0 && global_with_zero_length_check()) { | |
810 // Keep capture start in rdx for the zero-length check later. | |
811 __ movp(rdx, rax); | |
812 } | |
813 __ addp(rax, rcx); // Convert to index from start, not end. | |
814 if (mode_ == UC16) { | |
815 __ sarp(rax, Immediate(1)); // Convert byte index to character index. | |
816 } | |
817 __ movl(Operand(rbx, i * kIntSize), rax); | |
818 } | |
819 } | |
820 | |
821 if (global()) { | |
822 // Restart matching if the regular expression is flagged as global. | |
823 // Increment success counter. | |
824 __ incp(Operand(rbp, kSuccessfulCaptures)); | |
825 // Capture results have been stored, so the number of remaining global | |
826 // output registers is reduced by the number of stored captures. | |
827 __ movsxlq(rcx, Operand(rbp, kNumOutputRegisters)); | |
828 __ subp(rcx, Immediate(num_saved_registers_)); | |
829 // Check whether we have enough room for another set of capture results. | |
830 __ cmpp(rcx, Immediate(num_saved_registers_)); | |
831 __ j(less, &exit_label_); | |
832 | |
833 __ movp(Operand(rbp, kNumOutputRegisters), rcx); | |
834 // Advance the location for output. | |
835 __ addp(Operand(rbp, kRegisterOutput), | |
836 Immediate(num_saved_registers_ * kIntSize)); | |
837 | |
838 // Prepare rax to initialize registers with its value in the next run. | |
839 __ movp(rax, Operand(rbp, kInputStartMinusOne)); | |
840 | |
841 if (global_with_zero_length_check()) { | |
842 // Special case for zero-length matches. | |
843 // rdx: capture start index | |
844 __ cmpp(rdi, rdx); | |
845 // Not a zero-length match, restart. | |
846 __ j(not_equal, &load_char_start_regexp); | |
847 // rdi (offset from the end) is zero if we already reached the end. | |
848 __ testp(rdi, rdi); | |
849 __ j(zero, &exit_label_, Label::kNear); | |
850 // Advance current position after a zero-length match. | |
851 if (mode_ == UC16) { | |
852 __ addq(rdi, Immediate(2)); | |
853 } else { | |
854 __ incq(rdi); | |
855 } | |
856 } | |
857 | |
858 __ jmp(&load_char_start_regexp); | |
859 } else { | |
860 __ movp(rax, Immediate(SUCCESS)); | |
861 } | |
862 } | |
863 | |
864 __ bind(&exit_label_); | |
865 if (global()) { | |
866 // Return the number of successful captures. | |
867 __ movp(rax, Operand(rbp, kSuccessfulCaptures)); | |
868 } | |
869 | |
870 __ bind(&return_rax); | |
871 #ifdef _WIN64 | |
872 // Restore callee save registers. | |
873 __ leap(rsp, Operand(rbp, kLastCalleeSaveRegister)); | |
874 __ popq(rbx); | |
875 __ popq(rdi); | |
876 __ popq(rsi); | |
877 // Stack now at rbp. | |
878 #else | |
879 // Restore callee save register. | |
880 __ movp(rbx, Operand(rbp, kBackup_rbx)); | |
881 // Skip rsp to rbp. | |
882 __ movp(rsp, rbp); | |
883 #endif | |
884 // Exit function frame, restore previous one. | |
885 __ popq(rbp); | |
886 __ ret(0); | |
887 | |
888 // Backtrack code (branch target for conditional backtracks). | |
889 if (backtrack_label_.is_linked()) { | |
890 __ bind(&backtrack_label_); | |
891 Backtrack(); | |
892 } | |
893 | |
894 Label exit_with_exception; | |
895 | |
896 // Preempt-code | |
897 if (check_preempt_label_.is_linked()) { | |
898 SafeCallTarget(&check_preempt_label_); | |
899 | |
900 __ pushq(backtrack_stackpointer()); | |
901 __ pushq(rdi); | |
902 | |
903 CallCheckStackGuardState(); | |
904 __ testp(rax, rax); | |
905 // If returning non-zero, we should end execution with the given | |
906 // result as return value. | |
907 __ j(not_zero, &return_rax); | |
908 | |
909 // Restore registers. | |
910 __ Move(code_object_pointer(), masm_.CodeObject()); | |
911 __ popq(rdi); | |
912 __ popq(backtrack_stackpointer()); | |
913 // String might have moved: Reload esi from frame. | |
914 __ movp(rsi, Operand(rbp, kInputEnd)); | |
915 SafeReturn(); | |
916 } | |
917 | |
918 // Backtrack stack overflow code. | |
919 if (stack_overflow_label_.is_linked()) { | |
920 SafeCallTarget(&stack_overflow_label_); | |
921 // Reached if the backtrack-stack limit has been hit. | |
922 | |
923 Label grow_failed; | |
924 // Save registers before calling C function | |
925 #ifndef _WIN64 | |
926 // Callee-save in Microsoft 64-bit ABI, but not in AMD64 ABI. | |
927 __ pushq(rsi); | |
928 __ pushq(rdi); | |
929 #endif | |
930 | |
931 // Call GrowStack(backtrack_stackpointer()) | |
932 static const int num_arguments = 3; | |
933 __ PrepareCallCFunction(num_arguments); | |
934 #ifdef _WIN64 | |
935 // Microsoft passes parameters in rcx, rdx, r8. | |
936 // First argument, backtrack stackpointer, is already in rcx. | |
937 __ leap(rdx, Operand(rbp, kStackHighEnd)); // Second argument | |
938 __ LoadAddress(r8, ExternalReference::isolate_address(isolate())); | |
939 #else | |
940 // AMD64 ABI passes parameters in rdi, rsi, rdx. | |
941 __ movp(rdi, backtrack_stackpointer()); // First argument. | |
942 __ leap(rsi, Operand(rbp, kStackHighEnd)); // Second argument. | |
943 __ LoadAddress(rdx, ExternalReference::isolate_address(isolate())); | |
944 #endif | |
945 ExternalReference grow_stack = | |
946 ExternalReference::re_grow_stack(isolate()); | |
947 __ CallCFunction(grow_stack, num_arguments); | |
948 // If return NULL, we have failed to grow the stack, and | |
949 // must exit with a stack-overflow exception. | |
950 __ testp(rax, rax); | |
951 __ j(equal, &exit_with_exception); | |
952 // Otherwise use return value as new stack pointer. | |
953 __ movp(backtrack_stackpointer(), rax); | |
954 // Restore saved registers and continue. | |
955 __ Move(code_object_pointer(), masm_.CodeObject()); | |
956 #ifndef _WIN64 | |
957 __ popq(rdi); | |
958 __ popq(rsi); | |
959 #endif | |
960 SafeReturn(); | |
961 } | |
962 | |
963 if (exit_with_exception.is_linked()) { | |
964 // If any of the code above needed to exit with an exception. | |
965 __ bind(&exit_with_exception); | |
966 // Exit with Result EXCEPTION(-1) to signal thrown exception. | |
967 __ Set(rax, EXCEPTION); | |
968 __ jmp(&return_rax); | |
969 } | |
970 | |
971 FixupCodeRelativePositions(); | |
972 | |
973 CodeDesc code_desc; | |
974 masm_.GetCode(&code_desc); | |
975 Isolate* isolate = this->isolate(); | |
976 Handle<Code> code = isolate->factory()->NewCode( | |
977 code_desc, Code::ComputeFlags(Code::REGEXP), | |
978 masm_.CodeObject()); | |
979 PROFILE(isolate, RegExpCodeCreateEvent(*code, *source)); | |
980 return Handle<HeapObject>::cast(code); | |
981 } | |
982 | |
983 | |
984 void RegExpMacroAssemblerX64::GoTo(Label* to) { | |
985 BranchOrBacktrack(no_condition, to); | |
986 } | |
987 | |
988 | |
989 void RegExpMacroAssemblerX64::IfRegisterGE(int reg, | |
990 int comparand, | |
991 Label* if_ge) { | |
992 __ cmpp(register_location(reg), Immediate(comparand)); | |
993 BranchOrBacktrack(greater_equal, if_ge); | |
994 } | |
995 | |
996 | |
997 void RegExpMacroAssemblerX64::IfRegisterLT(int reg, | |
998 int comparand, | |
999 Label* if_lt) { | |
1000 __ cmpp(register_location(reg), Immediate(comparand)); | |
1001 BranchOrBacktrack(less, if_lt); | |
1002 } | |
1003 | |
1004 | |
1005 void RegExpMacroAssemblerX64::IfRegisterEqPos(int reg, | |
1006 Label* if_eq) { | |
1007 __ cmpp(rdi, register_location(reg)); | |
1008 BranchOrBacktrack(equal, if_eq); | |
1009 } | |
1010 | |
1011 | |
1012 RegExpMacroAssembler::IrregexpImplementation | |
1013 RegExpMacroAssemblerX64::Implementation() { | |
1014 return kX64Implementation; | |
1015 } | |
1016 | |
1017 | |
1018 void RegExpMacroAssemblerX64::LoadCurrentCharacter(int cp_offset, | |
1019 Label* on_end_of_input, | |
1020 bool check_bounds, | |
1021 int characters) { | |
1022 DCHECK(cp_offset >= -1); // ^ and \b can look behind one character. | |
1023 DCHECK(cp_offset < (1<<30)); // Be sane! (And ensure negation works) | |
1024 if (check_bounds) { | |
1025 CheckPosition(cp_offset + characters - 1, on_end_of_input); | |
1026 } | |
1027 LoadCurrentCharacterUnchecked(cp_offset, characters); | |
1028 } | |
1029 | |
1030 | |
1031 void RegExpMacroAssemblerX64::PopCurrentPosition() { | |
1032 Pop(rdi); | |
1033 } | |
1034 | |
1035 | |
1036 void RegExpMacroAssemblerX64::PopRegister(int register_index) { | |
1037 Pop(rax); | |
1038 __ movp(register_location(register_index), rax); | |
1039 } | |
1040 | |
1041 | |
1042 void RegExpMacroAssemblerX64::PushBacktrack(Label* label) { | |
1043 Push(label); | |
1044 CheckStackLimit(); | |
1045 } | |
1046 | |
1047 | |
1048 void RegExpMacroAssemblerX64::PushCurrentPosition() { | |
1049 Push(rdi); | |
1050 } | |
1051 | |
1052 | |
1053 void RegExpMacroAssemblerX64::PushRegister(int register_index, | |
1054 StackCheckFlag check_stack_limit) { | |
1055 __ movp(rax, register_location(register_index)); | |
1056 Push(rax); | |
1057 if (check_stack_limit) CheckStackLimit(); | |
1058 } | |
1059 | |
1060 | |
1061 STATIC_ASSERT(kPointerSize == kInt64Size || kPointerSize == kInt32Size); | |
1062 | |
1063 | |
1064 void RegExpMacroAssemblerX64::ReadCurrentPositionFromRegister(int reg) { | |
1065 if (kPointerSize == kInt64Size) { | |
1066 __ movq(rdi, register_location(reg)); | |
1067 } else { | |
1068 // Need sign extension for x32 as rdi might be used as an index register. | |
1069 __ movsxlq(rdi, register_location(reg)); | |
1070 } | |
1071 } | |
1072 | |
1073 | |
1074 void RegExpMacroAssemblerX64::ReadPositionFromRegister(Register dst, int reg) { | |
1075 if (kPointerSize == kInt64Size) { | |
1076 __ movq(dst, register_location(reg)); | |
1077 } else { | |
1078 // Need sign extension for x32 as dst might be used as an index register. | |
1079 __ movsxlq(dst, register_location(reg)); | |
1080 } | |
1081 } | |
1082 | |
1083 | |
1084 void RegExpMacroAssemblerX64::ReadStackPointerFromRegister(int reg) { | |
1085 __ movp(backtrack_stackpointer(), register_location(reg)); | |
1086 __ addp(backtrack_stackpointer(), Operand(rbp, kStackHighEnd)); | |
1087 } | |
1088 | |
1089 | |
1090 void RegExpMacroAssemblerX64::SetCurrentPositionFromEnd(int by) { | |
1091 Label after_position; | |
1092 __ cmpp(rdi, Immediate(-by * char_size())); | |
1093 __ j(greater_equal, &after_position, Label::kNear); | |
1094 __ movq(rdi, Immediate(-by * char_size())); | |
1095 // On RegExp code entry (where this operation is used), the character before | |
1096 // the current position is expected to be already loaded. | |
1097 // We have advanced the position, so it's safe to read backwards. | |
1098 LoadCurrentCharacterUnchecked(-1, 1); | |
1099 __ bind(&after_position); | |
1100 } | |
1101 | |
1102 | |
1103 void RegExpMacroAssemblerX64::SetRegister(int register_index, int to) { | |
1104 DCHECK(register_index >= num_saved_registers_); // Reserved for positions! | |
1105 __ movp(register_location(register_index), Immediate(to)); | |
1106 } | |
1107 | |
1108 | |
1109 bool RegExpMacroAssemblerX64::Succeed() { | |
1110 __ jmp(&success_label_); | |
1111 return global(); | |
1112 } | |
1113 | |
1114 | |
1115 void RegExpMacroAssemblerX64::WriteCurrentPositionToRegister(int reg, | |
1116 int cp_offset) { | |
1117 if (cp_offset == 0) { | |
1118 __ movp(register_location(reg), rdi); | |
1119 } else { | |
1120 __ leap(rax, Operand(rdi, cp_offset * char_size())); | |
1121 __ movp(register_location(reg), rax); | |
1122 } | |
1123 } | |
1124 | |
1125 | |
1126 void RegExpMacroAssemblerX64::ClearRegisters(int reg_from, int reg_to) { | |
1127 DCHECK(reg_from <= reg_to); | |
1128 __ movp(rax, Operand(rbp, kInputStartMinusOne)); | |
1129 for (int reg = reg_from; reg <= reg_to; reg++) { | |
1130 __ movp(register_location(reg), rax); | |
1131 } | |
1132 } | |
1133 | |
1134 | |
1135 void RegExpMacroAssemblerX64::WriteStackPointerToRegister(int reg) { | |
1136 __ movp(rax, backtrack_stackpointer()); | |
1137 __ subp(rax, Operand(rbp, kStackHighEnd)); | |
1138 __ movp(register_location(reg), rax); | |
1139 } | |
1140 | |
1141 | |
1142 // Private methods: | |
1143 | |
1144 void RegExpMacroAssemblerX64::CallCheckStackGuardState() { | |
1145 // This function call preserves no register values. Caller should | |
1146 // store anything volatile in a C call or overwritten by this function. | |
1147 static const int num_arguments = 3; | |
1148 __ PrepareCallCFunction(num_arguments); | |
1149 #ifdef _WIN64 | |
1150 // Second argument: Code* of self. (Do this before overwriting r8). | |
1151 __ movp(rdx, code_object_pointer()); | |
1152 // Third argument: RegExp code frame pointer. | |
1153 __ movp(r8, rbp); | |
1154 // First argument: Next address on the stack (will be address of | |
1155 // return address). | |
1156 __ leap(rcx, Operand(rsp, -kPointerSize)); | |
1157 #else | |
1158 // Third argument: RegExp code frame pointer. | |
1159 __ movp(rdx, rbp); | |
1160 // Second argument: Code* of self. | |
1161 __ movp(rsi, code_object_pointer()); | |
1162 // First argument: Next address on the stack (will be address of | |
1163 // return address). | |
1164 __ leap(rdi, Operand(rsp, -kRegisterSize)); | |
1165 #endif | |
1166 ExternalReference stack_check = | |
1167 ExternalReference::re_check_stack_guard_state(isolate()); | |
1168 __ CallCFunction(stack_check, num_arguments); | |
1169 } | |
1170 | |
1171 | |
1172 // Helper function for reading a value out of a stack frame. | |
1173 template <typename T> | |
1174 static T& frame_entry(Address re_frame, int frame_offset) { | |
1175 return reinterpret_cast<T&>(Memory::int32_at(re_frame + frame_offset)); | |
1176 } | |
1177 | |
1178 | |
1179 template <typename T> | |
1180 static T* frame_entry_address(Address re_frame, int frame_offset) { | |
1181 return reinterpret_cast<T*>(re_frame + frame_offset); | |
1182 } | |
1183 | |
1184 | |
1185 int RegExpMacroAssemblerX64::CheckStackGuardState(Address* return_address, | |
1186 Code* re_code, | |
1187 Address re_frame) { | |
1188 return NativeRegExpMacroAssembler::CheckStackGuardState( | |
1189 frame_entry<Isolate*>(re_frame, kIsolate), | |
1190 frame_entry<int>(re_frame, kStartIndex), | |
1191 frame_entry<int>(re_frame, kDirectCall) == 1, return_address, re_code, | |
1192 frame_entry_address<String*>(re_frame, kInputString), | |
1193 frame_entry_address<const byte*>(re_frame, kInputStart), | |
1194 frame_entry_address<const byte*>(re_frame, kInputEnd)); | |
1195 } | |
1196 | |
1197 | |
1198 Operand RegExpMacroAssemblerX64::register_location(int register_index) { | |
1199 DCHECK(register_index < (1<<30)); | |
1200 if (num_registers_ <= register_index) { | |
1201 num_registers_ = register_index + 1; | |
1202 } | |
1203 return Operand(rbp, kRegisterZero - register_index * kPointerSize); | |
1204 } | |
1205 | |
1206 | |
1207 void RegExpMacroAssemblerX64::CheckPosition(int cp_offset, | |
1208 Label* on_outside_input) { | |
1209 __ cmpl(rdi, Immediate(-cp_offset * char_size())); | |
1210 BranchOrBacktrack(greater_equal, on_outside_input); | |
1211 } | |
1212 | |
1213 | |
1214 void RegExpMacroAssemblerX64::BranchOrBacktrack(Condition condition, | |
1215 Label* to) { | |
1216 if (condition < 0) { // No condition | |
1217 if (to == NULL) { | |
1218 Backtrack(); | |
1219 return; | |
1220 } | |
1221 __ jmp(to); | |
1222 return; | |
1223 } | |
1224 if (to == NULL) { | |
1225 __ j(condition, &backtrack_label_); | |
1226 return; | |
1227 } | |
1228 __ j(condition, to); | |
1229 } | |
1230 | |
1231 | |
1232 void RegExpMacroAssemblerX64::SafeCall(Label* to) { | |
1233 __ call(to); | |
1234 } | |
1235 | |
1236 | |
1237 void RegExpMacroAssemblerX64::SafeCallTarget(Label* label) { | |
1238 __ bind(label); | |
1239 __ subp(Operand(rsp, 0), code_object_pointer()); | |
1240 } | |
1241 | |
1242 | |
1243 void RegExpMacroAssemblerX64::SafeReturn() { | |
1244 __ addp(Operand(rsp, 0), code_object_pointer()); | |
1245 __ ret(0); | |
1246 } | |
1247 | |
1248 | |
1249 void RegExpMacroAssemblerX64::Push(Register source) { | |
1250 DCHECK(!source.is(backtrack_stackpointer())); | |
1251 // Notice: This updates flags, unlike normal Push. | |
1252 __ subp(backtrack_stackpointer(), Immediate(kIntSize)); | |
1253 __ movl(Operand(backtrack_stackpointer(), 0), source); | |
1254 } | |
1255 | |
1256 | |
1257 void RegExpMacroAssemblerX64::Push(Immediate value) { | |
1258 // Notice: This updates flags, unlike normal Push. | |
1259 __ subp(backtrack_stackpointer(), Immediate(kIntSize)); | |
1260 __ movl(Operand(backtrack_stackpointer(), 0), value); | |
1261 } | |
1262 | |
1263 | |
1264 void RegExpMacroAssemblerX64::FixupCodeRelativePositions() { | |
1265 for (int i = 0, n = code_relative_fixup_positions_.length(); i < n; i++) { | |
1266 int position = code_relative_fixup_positions_[i]; | |
1267 // The position succeeds a relative label offset from position. | |
1268 // Patch the relative offset to be relative to the Code object pointer | |
1269 // instead. | |
1270 int patch_position = position - kIntSize; | |
1271 int offset = masm_.long_at(patch_position); | |
1272 masm_.long_at_put(patch_position, | |
1273 offset | |
1274 + position | |
1275 + Code::kHeaderSize | |
1276 - kHeapObjectTag); | |
1277 } | |
1278 code_relative_fixup_positions_.Clear(); | |
1279 } | |
1280 | |
1281 | |
1282 void RegExpMacroAssemblerX64::Push(Label* backtrack_target) { | |
1283 __ subp(backtrack_stackpointer(), Immediate(kIntSize)); | |
1284 __ movl(Operand(backtrack_stackpointer(), 0), backtrack_target); | |
1285 MarkPositionForCodeRelativeFixup(); | |
1286 } | |
1287 | |
1288 | |
1289 void RegExpMacroAssemblerX64::Pop(Register target) { | |
1290 DCHECK(!target.is(backtrack_stackpointer())); | |
1291 __ movsxlq(target, Operand(backtrack_stackpointer(), 0)); | |
1292 // Notice: This updates flags, unlike normal Pop. | |
1293 __ addp(backtrack_stackpointer(), Immediate(kIntSize)); | |
1294 } | |
1295 | |
1296 | |
1297 void RegExpMacroAssemblerX64::Drop() { | |
1298 __ addp(backtrack_stackpointer(), Immediate(kIntSize)); | |
1299 } | |
1300 | |
1301 | |
1302 void RegExpMacroAssemblerX64::CheckPreemption() { | |
1303 // Check for preemption. | |
1304 Label no_preempt; | |
1305 ExternalReference stack_limit = | |
1306 ExternalReference::address_of_stack_limit(isolate()); | |
1307 __ load_rax(stack_limit); | |
1308 __ cmpp(rsp, rax); | |
1309 __ j(above, &no_preempt); | |
1310 | |
1311 SafeCall(&check_preempt_label_); | |
1312 | |
1313 __ bind(&no_preempt); | |
1314 } | |
1315 | |
1316 | |
1317 void RegExpMacroAssemblerX64::CheckStackLimit() { | |
1318 Label no_stack_overflow; | |
1319 ExternalReference stack_limit = | |
1320 ExternalReference::address_of_regexp_stack_limit(isolate()); | |
1321 __ load_rax(stack_limit); | |
1322 __ cmpp(backtrack_stackpointer(), rax); | |
1323 __ j(above, &no_stack_overflow); | |
1324 | |
1325 SafeCall(&stack_overflow_label_); | |
1326 | |
1327 __ bind(&no_stack_overflow); | |
1328 } | |
1329 | |
1330 | |
1331 void RegExpMacroAssemblerX64::LoadCurrentCharacterUnchecked(int cp_offset, | |
1332 int characters) { | |
1333 if (mode_ == LATIN1) { | |
1334 if (characters == 4) { | |
1335 __ movl(current_character(), Operand(rsi, rdi, times_1, cp_offset)); | |
1336 } else if (characters == 2) { | |
1337 __ movzxwl(current_character(), Operand(rsi, rdi, times_1, cp_offset)); | |
1338 } else { | |
1339 DCHECK(characters == 1); | |
1340 __ movzxbl(current_character(), Operand(rsi, rdi, times_1, cp_offset)); | |
1341 } | |
1342 } else { | |
1343 DCHECK(mode_ == UC16); | |
1344 if (characters == 2) { | |
1345 __ movl(current_character(), | |
1346 Operand(rsi, rdi, times_1, cp_offset * sizeof(uc16))); | |
1347 } else { | |
1348 DCHECK(characters == 1); | |
1349 __ movzxwl(current_character(), | |
1350 Operand(rsi, rdi, times_1, cp_offset * sizeof(uc16))); | |
1351 } | |
1352 } | |
1353 } | |
1354 | |
1355 #undef __ | |
1356 | |
1357 #endif // V8_INTERPRETED_REGEXP | |
1358 | |
1359 } // namespace internal | |
1360 } // namespace v8 | |
1361 | |
1362 #endif // V8_TARGET_ARCH_X64 | |
OLD | NEW |