1 // Copyright 2012 the V8 project authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4
5 #include "src/v8.h"
6
7 #if V8_TARGET_ARCH_MIPS64
8
9 #include "src/code-stubs.h"
10 #include "src/log.h"
11 #include "src/macro-assembler.h"
12 #include "src/regexp-macro-assembler.h"
13 #include "src/regexp-stack.h"
14 #include "src/unicode.h"
15
16 #include "src/mips64/regexp-macro-assembler-mips64.h"
17
18 namespace v8 {
19 namespace internal {
20
21 #ifndef V8_INTERPRETED_REGEXP
22 /*
23 * This assembler uses the following register assignment convention
24 * - t3 : Temporarily stores the index of capture start after a matching pass
25 * for a global regexp.
26 * - a5 : Pointer to current code object (Code*) including heap object tag.
27 * - a6 : Current position in input, as negative offset from end of string.
28 * Please notice that this is the byte offset, not the character offset!
29 * - a7 : Currently loaded character. Must be loaded using
30 * LoadCurrentCharacter before using any of the dispatch methods.
31 * - t0 : Points to tip of backtrack stack
32 * - t1 : Unused.
33 * - t2 : End of input (points to byte after last character in input).
34 * - fp : Frame pointer. Used to access arguments, local variables and
35 * RegExp registers.
36 * - sp : Points to tip of C stack.
37 *
38 * The remaining registers are free for computations.
39 * Each call to a public method should retain this convention.
40 *
41 * TODO(plind): O32 documented here with intent of having single 32/64 codebase
42 * in the future.
43 *
44 * The O32 stack will have the following structure:
45 *
46 * - fp[76] Isolate* isolate (address of the current isolate)
47 * - fp[72] direct_call (if 1, direct call from JavaScript code,
48 * if 0, call through the runtime system).
49 * - fp[68] stack_area_base (High end of the memory area to use as
50 * backtracking stack).
51 * - fp[64] capture array size (may fit multiple sets of matches)
52 * - fp[60] int* capture_array (int[num_saved_registers_], for output).
53 * - fp[44..59] MIPS O32 four argument slots
54 * - fp[40] secondary link/return address used by native call.
55 * --- sp when called ---
56 * - fp[36] return address (lr).
57 * - fp[32] old frame pointer (r11).
58 * - fp[0..31] backup of registers s0..s7.
59 * --- frame pointer ----
60 * - fp[-4] end of input (address of end of string).
61 * - fp[-8] start of input (address of first character in string).
62 * - fp[-12] start index (character index of start).
63 * - fp[-16] void* input_string (location of a handle containing the string).
64 * - fp[-20] success counter (only for global regexps to count matches).
65 * - fp[-24] Offset of location before start of input (effectively character
66 * position -1). Used to initialize capture registers to a
67 * non-position.
68 * - fp[-28] At start (if 1, we are starting at the start of the
69 * string, otherwise 0)
70 * - fp[-32] register 0 (Only positions must be stored in the first
71 * - register 1 num_saved_registers_ registers)
72 * - ...
73 * - register num_registers-1
74 * --- sp ---
75 *
76 *
77 * The N64 stack will have the following structure:
78 *
79 * - fp[88] Isolate* isolate (address of the current isolate) kIsolate
80 * - fp[80] secondary link/return address used by exit frame on native call. kSecondaryReturnAddress
81 kStackFrameHeader
82 * --- sp when called ---
83 * - fp[72] ra Return from RegExp code (ra). kReturnAddress
84 * - fp[64] s9, old-fp Old fp, callee saved(s9).
85 * - fp[0..63] s0..s7 Callee-saved registers s0..s7.
86 * --- frame pointer ----
87 * - fp[-8] direct_call (1 = direct call from JS, 0 = from runtime) kDirectCall
88 * - fp[-16] stack_base (Top of backtracking stack). kStackHighEnd
89 * - fp[-24] capture array size (may fit multiple sets of matches) kNumOutputRegisters
90 * - fp[-32] int* capture_array (int[num_saved_registers_], for output). kRegisterOutput
91 * - fp[-40] end of input (address of end of string). kInputEnd
92 * - fp[-48] start of input (address of first character in string). kInputStart
93 * - fp[-56] start index (character index of start). kStartIndex
94 * - fp[-64] void* input_string (location of a handle containing the string). kInputString
95 * - fp[-72] success counter (only for global regexps to count matches). kSuccessfulCaptures
96 * - fp[-80] Offset of location before start of input (effectively character kInputStartMinusOne
97 * position -1). Used to initialize capture registers to a
98 * non-position.
99 * --------- The following output registers are 32-bit values. ---------
100 * - fp[-88] register 0 (Only positions must be stored in the first kRegisterZero
101 * - register 1 num_saved_registers_ registers)
102 * - ...
103 * - register num_registers-1
104 * --- sp ---
105 *
106 * The first num_saved_registers_ registers are initialized to point to
107 * "character -1" in the string (i.e., char_size() bytes before the first
108 * character of the string). The remaining registers start out as garbage.
109 *
110 * The data up to the return address must be placed there by the calling
111 * code and the remaining arguments are passed in registers, e.g. by calling the
112 * code entry as cast to a function with the signature:
113 * int (*match)(String* input_string,
114 * int start_index,
115 * Address start,
116 * Address end,
117 * Address secondary_return_address, // Only used by native call.
118 * int* capture_output_array,
119 * byte* stack_area_base,
120 * bool direct_call = false,
121 * void* return_address,
122 * Isolate* isolate);
123 * The call is performed by NativeRegExpMacroAssembler::Execute()
124 * (in regexp-macro-assembler.cc) via the CALL_GENERATED_REGEXP_CODE macro
125 * in mips/simulator-mips.h.
126 * When calling as a non-direct call (i.e., from C++ code), the return address
127 * area is overwritten with the ra register by the RegExp code. When doing a
128 * direct call from generated code, the return address is placed there by
129 * the calling code, as in a normal exit frame.
130 */
131
132 #define __ ACCESS_MASM(masm_)
133
RegExpMacroAssemblerMIPS(Mode mode,int registers_to_save,Zone * zone)134 RegExpMacroAssemblerMIPS::RegExpMacroAssemblerMIPS(
135 Mode mode,
136 int registers_to_save,
137 Zone* zone)
138 : NativeRegExpMacroAssembler(zone),
139 masm_(new MacroAssembler(zone->isolate(), NULL, kRegExpCodeSize)),
140 mode_(mode),
141 num_registers_(registers_to_save),
142 num_saved_registers_(registers_to_save),
143 entry_label_(),
144 start_label_(),
145 success_label_(),
146 backtrack_label_(),
147 exit_label_(),
148 internal_failure_label_() {
149 DCHECK_EQ(0, registers_to_save % 2);
150 __ jmp(&entry_label_); // We'll write the entry code later.
151 // If the code gets too big or corrupted, an internal exception will be
152 // raised, and we will exit right away.
153 __ bind(&internal_failure_label_);
154 __ li(v0, Operand(FAILURE));
155 __ Ret();
156 __ bind(&start_label_); // And then continue from here.
157 }
158
159
~RegExpMacroAssemblerMIPS()160 RegExpMacroAssemblerMIPS::~RegExpMacroAssemblerMIPS() {
161 delete masm_;
162 // Unuse labels in case we throw away the assembler without calling GetCode.
163 entry_label_.Unuse();
164 start_label_.Unuse();
165 success_label_.Unuse();
166 backtrack_label_.Unuse();
167 exit_label_.Unuse();
168 check_preempt_label_.Unuse();
169 stack_overflow_label_.Unuse();
170 internal_failure_label_.Unuse();
171 }
172
173
stack_limit_slack()174 int RegExpMacroAssemblerMIPS::stack_limit_slack() {
175 return RegExpStack::kStackLimitSlack;
176 }
177
178
AdvanceCurrentPosition(int by)179 void RegExpMacroAssemblerMIPS::AdvanceCurrentPosition(int by) {
180 if (by != 0) {
181 __ Daddu(current_input_offset(),
182 current_input_offset(), Operand(by * char_size()));
183 }
184 }
185
186
AdvanceRegister(int reg,int by)187 void RegExpMacroAssemblerMIPS::AdvanceRegister(int reg, int by) {
188 DCHECK(reg >= 0);
189 DCHECK(reg < num_registers_);
190 if (by != 0) {
191 __ ld(a0, register_location(reg));
192 __ Daddu(a0, a0, Operand(by));
193 __ sd(a0, register_location(reg));
194 }
195 }
196
197
Backtrack()198 void RegExpMacroAssemblerMIPS::Backtrack() {
199 CheckPreemption();
200 // Pop Code* offset from backtrack stack, add Code* and jump to location.
201 Pop(a0);
202 __ Daddu(a0, a0, code_pointer());
203 __ Jump(a0);
204 }
205
206
Bind(Label * label)207 void RegExpMacroAssemblerMIPS::Bind(Label* label) {
208 __ bind(label);
209 }
210
211
CheckCharacter(uint32_t c,Label * on_equal)212 void RegExpMacroAssemblerMIPS::CheckCharacter(uint32_t c, Label* on_equal) {
213 BranchOrBacktrack(on_equal, eq, current_character(), Operand(c));
214 }
215
216
CheckCharacterGT(uc16 limit,Label * on_greater)217 void RegExpMacroAssemblerMIPS::CheckCharacterGT(uc16 limit, Label* on_greater) {
218 BranchOrBacktrack(on_greater, gt, current_character(), Operand(limit));
219 }
220
221
CheckAtStart(Label * on_at_start)222 void RegExpMacroAssemblerMIPS::CheckAtStart(Label* on_at_start) {
223 Label not_at_start;
224 // Did we start the match at the start of the string at all?
225 __ lw(a0, MemOperand(frame_pointer(), kStartIndex));
226 BranchOrBacktrack(¬_at_start, ne, a0, Operand(zero_reg));
227
228 // If we did, are we still at the start of the input?
229 __ ld(a1, MemOperand(frame_pointer(), kInputStart));
230 __ Daddu(a0, end_of_input_address(), Operand(current_input_offset()));
231 BranchOrBacktrack(on_at_start, eq, a0, Operand(a1));
232 __ bind(¬_at_start);
233 }
234
235
CheckNotAtStart(Label * on_not_at_start)236 void RegExpMacroAssemblerMIPS::CheckNotAtStart(Label* on_not_at_start) {
237 // Did we start the match at the start of the string at all?
238 __ lw(a0, MemOperand(frame_pointer(), kStartIndex));
239 BranchOrBacktrack(on_not_at_start, ne, a0, Operand(zero_reg));
240 // If we did, are we still at the start of the input?
241 __ ld(a1, MemOperand(frame_pointer(), kInputStart));
242 __ Daddu(a0, end_of_input_address(), Operand(current_input_offset()));
243 BranchOrBacktrack(on_not_at_start, ne, a0, Operand(a1));
244 }
245
246
CheckCharacterLT(uc16 limit,Label * on_less)247 void RegExpMacroAssemblerMIPS::CheckCharacterLT(uc16 limit, Label* on_less) {
248 BranchOrBacktrack(on_less, lt, current_character(), Operand(limit));
249 }
250
251
CheckGreedyLoop(Label * on_equal)252 void RegExpMacroAssemblerMIPS::CheckGreedyLoop(Label* on_equal) {
253 Label backtrack_non_equal;
254 __ lw(a0, MemOperand(backtrack_stackpointer(), 0));
255 __ Branch(&backtrack_non_equal, ne, current_input_offset(), Operand(a0));
256 __ Daddu(backtrack_stackpointer(),
257 backtrack_stackpointer(),
258 Operand(kIntSize));
259 __ bind(&backtrack_non_equal);
260 BranchOrBacktrack(on_equal, eq, current_input_offset(), Operand(a0));
261 }
262
263
CheckNotBackReferenceIgnoreCase(int start_reg,Label * on_no_match)264 void RegExpMacroAssemblerMIPS::CheckNotBackReferenceIgnoreCase(
265 int start_reg,
266 Label* on_no_match) {
267 Label fallthrough;
268 __ ld(a0, register_location(start_reg)); // Index of start of capture.
269 __ ld(a1, register_location(start_reg + 1)); // Index of end of capture.
270 __ Dsubu(a1, a1, a0); // Length of capture.
271
272 // If length is zero, either the capture is empty or it is not participating.
273 // In either case succeed immediately.
274 __ Branch(&fallthrough, eq, a1, Operand(zero_reg));
275
276 __ Daddu(t1, a1, current_input_offset());
277 // Check that there are enough characters left in the input.
278 BranchOrBacktrack(on_no_match, gt, t1, Operand(zero_reg));
279
280 if (mode_ == LATIN1) {
281 Label success;
282 Label fail;
283 Label loop_check;
284
285 // a0 - offset of start of capture.
286 // a1 - length of capture.
287 __ Daddu(a0, a0, Operand(end_of_input_address()));
288 __ Daddu(a2, end_of_input_address(), Operand(current_input_offset()));
289 __ Daddu(a1, a0, Operand(a1));
290
291 // a0 - Address of start of capture.
292 // a1 - Address of end of capture.
293 // a2 - Address of current input position.
294
295 Label loop;
296 __ bind(&loop);
297 __ lbu(a3, MemOperand(a0, 0));
298 __ daddiu(a0, a0, char_size());
299 __ lbu(a4, MemOperand(a2, 0));
300 __ daddiu(a2, a2, char_size());
301
302 __ Branch(&loop_check, eq, a4, Operand(a3));
303
304 // Mismatch, try case-insensitive match (converting letters to lower-case).
305 __ Or(a3, a3, Operand(0x20)); // Convert capture character to lower-case.
306 __ Or(a4, a4, Operand(0x20)); // Also convert input character.
307 __ Branch(&fail, ne, a4, Operand(a3));
308 __ Dsubu(a3, a3, Operand('a'));
309 __ Branch(&loop_check, ls, a3, Operand('z' - 'a'));
310 // Latin-1: Check for values in range [224,254] but not 247.
311 __ Dsubu(a3, a3, Operand(224 - 'a'));
312 // Weren't Latin-1 letters.
313 __ Branch(&fail, hi, a3, Operand(254 - 224));
314 // Check for 247.
315 __ Branch(&fail, eq, a3, Operand(247 - 224));
316
317 __ bind(&loop_check);
318 __ Branch(&loop, lt, a0, Operand(a1));
319 __ jmp(&success);
320
321 __ bind(&fail);
322 GoTo(on_no_match);
323
324 __ bind(&success);
325 // Compute new value of character position after the matched part.
326 __ Dsubu(current_input_offset(), a2, end_of_input_address());
327 } else {
328 DCHECK(mode_ == UC16);
329 // Put regexp engine registers on stack.
330 RegList regexp_registers_to_retain = current_input_offset().bit() |
331 current_character().bit() | backtrack_stackpointer().bit();
332 __ MultiPush(regexp_registers_to_retain);
333
334 int argument_count = 4;
335 __ PrepareCallCFunction(argument_count, a2);
336
337 // a0 - offset of start of capture.
338 // a1 - length of capture.
339
340 // Put arguments into arguments registers.
341 // Parameters are
342 // a0: Address byte_offset1 - Address captured substring's start.
343 // a1: Address byte_offset2 - Address of current character position.
344 // a2: size_t byte_length - length of capture in bytes(!).
345 // a3: Isolate* isolate.
346
347 // Address of start of capture.
348 __ Daddu(a0, a0, Operand(end_of_input_address()));
349 // Length of capture.
350 __ mov(a2, a1);
351 // Save length in callee-save register for use on return.
352 __ mov(s3, a1);
353 // Address of current input position.
354 __ Daddu(a1, current_input_offset(), Operand(end_of_input_address()));
355 // Isolate.
356 __ li(a3, Operand(ExternalReference::isolate_address(masm_->isolate())));
357
358 {
359 AllowExternalCallThatCantCauseGC scope(masm_);
360 ExternalReference function =
361 ExternalReference::re_case_insensitive_compare_uc16(masm_->isolate());
362 __ CallCFunction(function, argument_count);
363 }
364
365 // Restore regexp engine registers.
366 __ MultiPop(regexp_registers_to_retain);
367 __ li(code_pointer(), Operand(masm_->CodeObject()), CONSTANT_SIZE);
368 __ ld(end_of_input_address(), MemOperand(frame_pointer(), kInputEnd));
369
370 // Check if function returned non-zero for success or zero for failure.
371 BranchOrBacktrack(on_no_match, eq, v0, Operand(zero_reg));
372 // On success, increment position by length of capture.
373 __ Daddu(current_input_offset(), current_input_offset(), Operand(s3));
374 }
375
376 __ bind(&fallthrough);
377 }
378
379
CheckNotBackReference(int start_reg,Label * on_no_match)380 void RegExpMacroAssemblerMIPS::CheckNotBackReference(
381 int start_reg,
382 Label* on_no_match) {
383 Label fallthrough;
384 Label success;
385
386 // Find length of back-referenced capture.
387 __ ld(a0, register_location(start_reg));
388 __ ld(a1, register_location(start_reg + 1));
389 __ Dsubu(a1, a1, a0); // Length to check.
390 // Succeed on empty capture (including no capture).
391 __ Branch(&fallthrough, eq, a1, Operand(zero_reg));
392
393 __ Daddu(t1, a1, current_input_offset());
394 // Check that there are enough characters left in the input.
395 BranchOrBacktrack(on_no_match, gt, t1, Operand(zero_reg));
396
397 // Compute pointers to match string and capture string.
398 __ Daddu(a0, a0, Operand(end_of_input_address()));
399 __ Daddu(a2, end_of_input_address(), Operand(current_input_offset()));
400 __ Daddu(a1, a1, Operand(a0));
401
402 Label loop;
403 __ bind(&loop);
404 if (mode_ == LATIN1) {
405 __ lbu(a3, MemOperand(a0, 0));
406 __ daddiu(a0, a0, char_size());
407 __ lbu(a4, MemOperand(a2, 0));
408 __ daddiu(a2, a2, char_size());
409 } else {
410 DCHECK(mode_ == UC16);
411 __ lhu(a3, MemOperand(a0, 0));
412 __ daddiu(a0, a0, char_size());
413 __ lhu(a4, MemOperand(a2, 0));
414 __ daddiu(a2, a2, char_size());
415 }
416 BranchOrBacktrack(on_no_match, ne, a3, Operand(a4));
417 __ Branch(&loop, lt, a0, Operand(a1));
418
419 // Move current character position to position after match.
420 __ Dsubu(current_input_offset(), a2, end_of_input_address());
421 __ bind(&fallthrough);
422 }
423
424
CheckNotCharacter(uint32_t c,Label * on_not_equal)425 void RegExpMacroAssemblerMIPS::CheckNotCharacter(uint32_t c,
426 Label* on_not_equal) {
427 BranchOrBacktrack(on_not_equal, ne, current_character(), Operand(c));
428 }
429
430
CheckCharacterAfterAnd(uint32_t c,uint32_t mask,Label * on_equal)431 void RegExpMacroAssemblerMIPS::CheckCharacterAfterAnd(uint32_t c,
432 uint32_t mask,
433 Label* on_equal) {
434 __ And(a0, current_character(), Operand(mask));
435 Operand rhs = (c == 0) ? Operand(zero_reg) : Operand(c);
436 BranchOrBacktrack(on_equal, eq, a0, rhs);
437 }
438
439
CheckNotCharacterAfterAnd(uint32_t c,uint32_t mask,Label * on_not_equal)440 void RegExpMacroAssemblerMIPS::CheckNotCharacterAfterAnd(uint32_t c,
441 uint32_t mask,
442 Label* on_not_equal) {
443 __ And(a0, current_character(), Operand(mask));
444 Operand rhs = (c == 0) ? Operand(zero_reg) : Operand(c);
445 BranchOrBacktrack(on_not_equal, ne, a0, rhs);
446 }
447
448
CheckNotCharacterAfterMinusAnd(uc16 c,uc16 minus,uc16 mask,Label * on_not_equal)449 void RegExpMacroAssemblerMIPS::CheckNotCharacterAfterMinusAnd(
450 uc16 c,
451 uc16 minus,
452 uc16 mask,
453 Label* on_not_equal) {
454 DCHECK(minus < String::kMaxUtf16CodeUnit);
455 __ Dsubu(a0, current_character(), Operand(minus));
456 __ And(a0, a0, Operand(mask));
457 BranchOrBacktrack(on_not_equal, ne, a0, Operand(c));
458 }
459
460
CheckCharacterInRange(uc16 from,uc16 to,Label * on_in_range)461 void RegExpMacroAssemblerMIPS::CheckCharacterInRange(
462 uc16 from,
463 uc16 to,
464 Label* on_in_range) {
465 __ Dsubu(a0, current_character(), Operand(from));
466 // Unsigned lower-or-same condition.
467 BranchOrBacktrack(on_in_range, ls, a0, Operand(to - from));
468 }
469
470
CheckCharacterNotInRange(uc16 from,uc16 to,Label * on_not_in_range)471 void RegExpMacroAssemblerMIPS::CheckCharacterNotInRange(
472 uc16 from,
473 uc16 to,
474 Label* on_not_in_range) {
475 __ Dsubu(a0, current_character(), Operand(from));
476 // Unsigned higher condition.
477 BranchOrBacktrack(on_not_in_range, hi, a0, Operand(to - from));
478 }
479
480
CheckBitInTable(Handle<ByteArray> table,Label * on_bit_set)481 void RegExpMacroAssemblerMIPS::CheckBitInTable(
482 Handle<ByteArray> table,
483 Label* on_bit_set) {
484 __ li(a0, Operand(table));
485 if (mode_ != LATIN1 || kTableMask != String::kMaxOneByteCharCode) {
486 __ And(a1, current_character(), Operand(kTableSize - 1));
487 __ Daddu(a0, a0, a1);
488 } else {
489 __ Daddu(a0, a0, current_character());
490 }
491
492 __ lbu(a0, FieldMemOperand(a0, ByteArray::kHeaderSize));
493 BranchOrBacktrack(on_bit_set, ne, a0, Operand(zero_reg));
494 }
495
496
CheckSpecialCharacterClass(uc16 type,Label * on_no_match)497 bool RegExpMacroAssemblerMIPS::CheckSpecialCharacterClass(uc16 type,
498 Label* on_no_match) {
499 // Range checks (c in min..max) are generally implemented by an unsigned
500 // (c - min) <= (max - min) check.
501 switch (type) {
502 case 's':
503 // Match space-characters.
504 if (mode_ == LATIN1) {
505 // One byte space characters are '\t'..'\r', ' ' and \u00a0.
506 Label success;
507 __ Branch(&success, eq, current_character(), Operand(' '));
508 // Check range 0x09..0x0d.
509 __ Dsubu(a0, current_character(), Operand('\t'));
510 __ Branch(&success, ls, a0, Operand('\r' - '\t'));
511 // \u00a0 (NBSP).
512 BranchOrBacktrack(on_no_match, ne, a0, Operand(0x00a0 - '\t'));
513 __ bind(&success);
514 return true;
515 }
516 return false;
517 case 'S':
518 // The emitted code for generic character classes is good enough.
519 return false;
520 case 'd':
521 // Match Latin1 digits ('0'..'9').
522 __ Dsubu(a0, current_character(), Operand('0'));
523 BranchOrBacktrack(on_no_match, hi, a0, Operand('9' - '0'));
524 return true;
525 case 'D':
526 // Match non Latin1-digits.
527 __ Dsubu(a0, current_character(), Operand('0'));
528 BranchOrBacktrack(on_no_match, ls, a0, Operand('9' - '0'));
529 return true;
530 case '.': {
531 // Match non-newlines (not 0x0a('\n'), 0x0d('\r'), 0x2028 and 0x2029).
532 __ Xor(a0, current_character(), Operand(0x01));
533 // See if current character is '\n'^1 or '\r'^1, i.e., 0x0b or 0x0c.
534 __ Dsubu(a0, a0, Operand(0x0b));
535 BranchOrBacktrack(on_no_match, ls, a0, Operand(0x0c - 0x0b));
536 if (mode_ == UC16) {
537 // Compare original value to 0x2028 and 0x2029, using the already
538 // computed (current_char ^ 0x01 - 0x0b). I.e., check for
539 // 0x201d (0x2028 - 0x0b) or 0x201e.
540 __ Dsubu(a0, a0, Operand(0x2028 - 0x0b));
541 BranchOrBacktrack(on_no_match, ls, a0, Operand(1));
542 }
543 return true;
544 }
545 case 'n': {
546 // Match newlines (0x0a('\n'), 0x0d('\r'), 0x2028 and 0x2029).
547 __ Xor(a0, current_character(), Operand(0x01));
548 // See if current character is '\n'^1 or '\r'^1, i.e., 0x0b or 0x0c.
549 __ Dsubu(a0, a0, Operand(0x0b));
550 if (mode_ == LATIN1) {
551 BranchOrBacktrack(on_no_match, hi, a0, Operand(0x0c - 0x0b));
552 } else {
553 Label done;
554 BranchOrBacktrack(&done, ls, a0, Operand(0x0c - 0x0b));
555 // Compare original value to 0x2028 and 0x2029, using the already
556 // computed (current_char ^ 0x01 - 0x0b). I.e., check for
557 // 0x201d (0x2028 - 0x0b) or 0x201e.
558 __ Dsubu(a0, a0, Operand(0x2028 - 0x0b));
559 BranchOrBacktrack(on_no_match, hi, a0, Operand(1));
560 __ bind(&done);
561 }
562 return true;
563 }
564 case 'w': {
565 if (mode_ != LATIN1) {
566 // Table is 256 entries, so all Latin1 characters can be tested.
567 BranchOrBacktrack(on_no_match, hi, current_character(), Operand('z'));
568 }
569 ExternalReference map = ExternalReference::re_word_character_map();
570 __ li(a0, Operand(map));
571 __ Daddu(a0, a0, current_character());
572 __ lbu(a0, MemOperand(a0, 0));
573 BranchOrBacktrack(on_no_match, eq, a0, Operand(zero_reg));
574 return true;
575 }
576 case 'W': {
577 Label done;
578 if (mode_ != LATIN1) {
579 // Table is 256 entries, so all Latin1 characters can be tested.
580 __ Branch(&done, hi, current_character(), Operand('z'));
581 }
582 ExternalReference map = ExternalReference::re_word_character_map();
583 __ li(a0, Operand(map));
584 __ Daddu(a0, a0, current_character());
585 __ lbu(a0, MemOperand(a0, 0));
586 BranchOrBacktrack(on_no_match, ne, a0, Operand(zero_reg));
587 if (mode_ != LATIN1) {
588 __ bind(&done);
589 }
590 return true;
591 }
592 case '*':
593 // Match any character.
594 return true;
595 // No custom implementation (yet): s(UC16), S(UC16).
596 default:
597 return false;
598 }
599 }
600
601
Fail()602 void RegExpMacroAssemblerMIPS::Fail() {
603 __ li(v0, Operand(FAILURE));
604 __ jmp(&exit_label_);
605 }
606
607
GetCode(Handle<String> source)608 Handle<HeapObject> RegExpMacroAssemblerMIPS::GetCode(Handle<String> source) {
609 Label return_v0;
610 if (masm_->has_exception()) {
611 // If the code gets corrupted due to long regular expressions and lack of
612 // space on trampolines, an internal exception flag is set. If this case
613 // is detected, we will jump into exit sequence right away.
614 __ bind_to(&entry_label_, internal_failure_label_.pos());
615 } else {
616 // Finalize code - write the entry point code now we know how many
617 // registers we need.
618
619 // Entry code:
620 __ bind(&entry_label_);
621
622 // Tell the system that we have a stack frame. Because the type is MANUAL,
623 // no is generated.
624 FrameScope scope(masm_, StackFrame::MANUAL);
625
626 // Actually emit code to start a new stack frame.
627 // Push arguments
628 // Save callee-save registers.
629 // Start new stack frame.
630 // Store link register in existing stack-cell.
631 // Order here should correspond to order of offset constants in header file.
632 // TODO(plind): we save s0..s7, but ONLY use s3 here - use the regs
633 // or dont save.
634 RegList registers_to_retain = s0.bit() | s1.bit() | s2.bit() |
635 s3.bit() | s4.bit() | s5.bit() | s6.bit() | s7.bit() | fp.bit();
636 RegList argument_registers = a0.bit() | a1.bit() | a2.bit() | a3.bit();
637
638 if (kMipsAbi == kN64) {
639 // TODO(plind): Should probably alias a4-a7, for clarity.
640 argument_registers |= a4.bit() | a5.bit() | a6.bit() | a7.bit();
641 }
642
643 __ MultiPush(argument_registers | registers_to_retain | ra.bit());
644 // Set frame pointer in space for it if this is not a direct call
645 // from generated code.
646 // TODO(plind): this 8 is the # of argument regs, should have definition.
647 __ Daddu(frame_pointer(), sp, Operand(8 * kPointerSize));
648 __ mov(a0, zero_reg);
649 __ push(a0); // Make room for success counter and initialize it to 0.
650 __ push(a0); // Make room for "position - 1" constant (value irrelevant).
651
652 // Check if we have space on the stack for registers.
653 Label stack_limit_hit;
654 Label stack_ok;
655
656 ExternalReference stack_limit =
657 ExternalReference::address_of_stack_limit(masm_->isolate());
658 __ li(a0, Operand(stack_limit));
659 __ ld(a0, MemOperand(a0));
660 __ Dsubu(a0, sp, a0);
661 // Handle it if the stack pointer is already below the stack limit.
662 __ Branch(&stack_limit_hit, le, a0, Operand(zero_reg));
663 // Check if there is room for the variable number of registers above
664 // the stack limit.
665 __ Branch(&stack_ok, hs, a0, Operand(num_registers_ * kPointerSize));
666 // Exit with OutOfMemory exception. There is not enough space on the stack
667 // for our working registers.
668 __ li(v0, Operand(EXCEPTION));
669 __ jmp(&return_v0);
670
671 __ bind(&stack_limit_hit);
672 CallCheckStackGuardState(a0);
673 // If returned value is non-zero, we exit with the returned value as result.
674 __ Branch(&return_v0, ne, v0, Operand(zero_reg));
675
676 __ bind(&stack_ok);
677 // Allocate space on stack for registers.
678 __ Dsubu(sp, sp, Operand(num_registers_ * kPointerSize));
679 // Load string end.
680 __ ld(end_of_input_address(), MemOperand(frame_pointer(), kInputEnd));
681 // Load input start.
682 __ ld(a0, MemOperand(frame_pointer(), kInputStart));
683 // Find negative length (offset of start relative to end).
684 __ Dsubu(current_input_offset(), a0, end_of_input_address());
685 // Set a0 to address of char before start of the input string
686 // (effectively string position -1).
687 __ ld(a1, MemOperand(frame_pointer(), kStartIndex));
688 __ Dsubu(a0, current_input_offset(), Operand(char_size()));
689 __ dsll(t1, a1, (mode_ == UC16) ? 1 : 0);
690 __ Dsubu(a0, a0, t1);
691 // Store this value in a local variable, for use when clearing
692 // position registers.
693 __ sd(a0, MemOperand(frame_pointer(), kInputStartMinusOne));
694
695 // Initialize code pointer register
696 __ li(code_pointer(), Operand(masm_->CodeObject()), CONSTANT_SIZE);
697
698 Label load_char_start_regexp, start_regexp;
699 // Load newline if index is at start, previous character otherwise.
700 __ Branch(&load_char_start_regexp, ne, a1, Operand(zero_reg));
701 __ li(current_character(), Operand('\n'));
702 __ jmp(&start_regexp);
703
704 // Global regexp restarts matching here.
705 __ bind(&load_char_start_regexp);
706 // Load previous char as initial value of current character register.
707 LoadCurrentCharacterUnchecked(-1, 1);
708 __ bind(&start_regexp);
709
710 // Initialize on-stack registers.
711 if (num_saved_registers_ > 0) { // Always is, if generated from a regexp.
712 // Fill saved registers with initial value = start offset - 1.
713 if (num_saved_registers_ > 8) {
714 // Address of register 0.
715 __ Daddu(a1, frame_pointer(), Operand(kRegisterZero));
716 __ li(a2, Operand(num_saved_registers_));
717 Label init_loop;
718 __ bind(&init_loop);
719 __ sd(a0, MemOperand(a1));
720 __ Daddu(a1, a1, Operand(-kPointerSize));
721 __ Dsubu(a2, a2, Operand(1));
722 __ Branch(&init_loop, ne, a2, Operand(zero_reg));
723 } else {
724 for (int i = 0; i < num_saved_registers_; i++) {
725 __ sd(a0, register_location(i));
726 }
727 }
728 }
729
730 // Initialize backtrack stack pointer.
731 __ ld(backtrack_stackpointer(), MemOperand(frame_pointer(), kStackHighEnd));
732
733 __ jmp(&start_label_);
734
735
736 // Exit code:
737 if (success_label_.is_linked()) {
738 // Save captures when successful.
739 __ bind(&success_label_);
740 if (num_saved_registers_ > 0) {
741 // Copy captures to output.
742 __ ld(a1, MemOperand(frame_pointer(), kInputStart));
743 __ ld(a0, MemOperand(frame_pointer(), kRegisterOutput));
744 __ ld(a2, MemOperand(frame_pointer(), kStartIndex));
745 __ Dsubu(a1, end_of_input_address(), a1);
746 // a1 is length of input in bytes.
747 if (mode_ == UC16) {
748 __ dsrl(a1, a1, 1);
749 }
750 // a1 is length of input in characters.
751 __ Daddu(a1, a1, Operand(a2));
752 // a1 is length of string in characters.
753
754 DCHECK_EQ(0, num_saved_registers_ % 2);
755 // Always an even number of capture registers. This allows us to
756 // unroll the loop once to add an operation between a load of a register
757 // and the following use of that register.
758 for (int i = 0; i < num_saved_registers_; i += 2) {
759 __ ld(a2, register_location(i));
760 __ ld(a3, register_location(i + 1));
761 if (i == 0 && global_with_zero_length_check()) {
762 // Keep capture start in a4 for the zero-length check later.
763 __ mov(t3, a2);
764 }
765 if (mode_ == UC16) {
766 __ dsra(a2, a2, 1);
767 __ Daddu(a2, a2, a1);
768 __ dsra(a3, a3, 1);
769 __ Daddu(a3, a3, a1);
770 } else {
771 __ Daddu(a2, a1, Operand(a2));
772 __ Daddu(a3, a1, Operand(a3));
773 }
774 // V8 expects the output to be an int32_t array.
775 __ sw(a2, MemOperand(a0));
776 __ Daddu(a0, a0, kIntSize);
777 __ sw(a3, MemOperand(a0));
778 __ Daddu(a0, a0, kIntSize);
779 }
780 }
781
782 if (global()) {
783 // Restart matching if the regular expression is flagged as global.
784 __ ld(a0, MemOperand(frame_pointer(), kSuccessfulCaptures));
785 __ lw(a1, MemOperand(frame_pointer(), kNumOutputRegisters));
786 __ ld(a2, MemOperand(frame_pointer(), kRegisterOutput));
787 // Increment success counter.
788 __ Daddu(a0, a0, 1);
789 __ sd(a0, MemOperand(frame_pointer(), kSuccessfulCaptures));
790 // Capture results have been stored, so the number of remaining global
791 // output registers is reduced by the number of stored captures.
792 __ Dsubu(a1, a1, num_saved_registers_);
793 // Check whether we have enough room for another set of capture results.
794 __ mov(v0, a0);
795 __ Branch(&return_v0, lt, a1, Operand(num_saved_registers_));
796
797 __ sd(a1, MemOperand(frame_pointer(), kNumOutputRegisters));
798 // Advance the location for output.
799 __ Daddu(a2, a2, num_saved_registers_ * kIntSize);
800 __ sd(a2, MemOperand(frame_pointer(), kRegisterOutput));
801
802 // Prepare a0 to initialize registers with its value in the next run.
803 __ ld(a0, MemOperand(frame_pointer(), kInputStartMinusOne));
804
805 if (global_with_zero_length_check()) {
806 // Special case for zero-length matches.
807 // t3: capture start index
808 // Not a zero-length match, restart.
809 __ Branch(
810 &load_char_start_regexp, ne, current_input_offset(), Operand(t3));
811 // Offset from the end is zero if we already reached the end.
812 __ Branch(&exit_label_, eq, current_input_offset(),
813 Operand(zero_reg));
814 // Advance current position after a zero-length match.
815 __ Daddu(current_input_offset(),
816 current_input_offset(),
817 Operand((mode_ == UC16) ? 2 : 1));
818 }
819
820 __ Branch(&load_char_start_regexp);
821 } else {
822 __ li(v0, Operand(SUCCESS));
823 }
824 }
825 // Exit and return v0.
826 __ bind(&exit_label_);
827 if (global()) {
828 __ ld(v0, MemOperand(frame_pointer(), kSuccessfulCaptures));
829 }
830
831 __ bind(&return_v0);
832 // Skip sp past regexp registers and local variables..
833 __ mov(sp, frame_pointer());
834 // Restore registers s0..s7 and return (restoring ra to pc).
835 __ MultiPop(registers_to_retain | ra.bit());
836 __ Ret();
837
838 // Backtrack code (branch target for conditional backtracks).
839 if (backtrack_label_.is_linked()) {
840 __ bind(&backtrack_label_);
841 Backtrack();
842 }
843
844 Label exit_with_exception;
845
846 // Preempt-code.
847 if (check_preempt_label_.is_linked()) {
848 SafeCallTarget(&check_preempt_label_);
849 // Put regexp engine registers on stack.
850 RegList regexp_registers_to_retain = current_input_offset().bit() |
851 current_character().bit() | backtrack_stackpointer().bit();
852 __ MultiPush(regexp_registers_to_retain);
853 CallCheckStackGuardState(a0);
854 __ MultiPop(regexp_registers_to_retain);
855 // If returning non-zero, we should end execution with the given
856 // result as return value.
857 __ Branch(&return_v0, ne, v0, Operand(zero_reg));
858
859 // String might have moved: Reload end of string from frame.
860 __ ld(end_of_input_address(), MemOperand(frame_pointer(), kInputEnd));
861 __ li(code_pointer(), Operand(masm_->CodeObject()), CONSTANT_SIZE);
862 SafeReturn();
863 }
864
865 // Backtrack stack overflow code.
866 if (stack_overflow_label_.is_linked()) {
867 SafeCallTarget(&stack_overflow_label_);
868 // Reached if the backtrack-stack limit has been hit.
869 // Put regexp engine registers on stack first.
870 RegList regexp_registers = current_input_offset().bit() |
871 current_character().bit();
872 __ MultiPush(regexp_registers);
873 Label grow_failed;
874 // Call GrowStack(backtrack_stackpointer(), &stack_base)
875 static const int num_arguments = 3;
876 __ PrepareCallCFunction(num_arguments, a0);
877 __ mov(a0, backtrack_stackpointer());
878 __ Daddu(a1, frame_pointer(), Operand(kStackHighEnd));
879 __ li(a2, Operand(ExternalReference::isolate_address(masm_->isolate())));
880 ExternalReference grow_stack =
881 ExternalReference::re_grow_stack(masm_->isolate());
882 __ CallCFunction(grow_stack, num_arguments);
883 // Restore regexp registers.
884 __ MultiPop(regexp_registers);
885 // If return NULL, we have failed to grow the stack, and
886 // must exit with a stack-overflow exception.
887 __ Branch(&exit_with_exception, eq, v0, Operand(zero_reg));
888 // Otherwise use return value as new stack pointer.
889 __ mov(backtrack_stackpointer(), v0);
890 // Restore saved registers and continue.
891 __ li(code_pointer(), Operand(masm_->CodeObject()), CONSTANT_SIZE);
892 __ ld(end_of_input_address(), MemOperand(frame_pointer(), kInputEnd));
893 SafeReturn();
894 }
895
896 if (exit_with_exception.is_linked()) {
897 // If any of the code above needed to exit with an exception.
898 __ bind(&exit_with_exception);
899 // Exit with Result EXCEPTION(-1) to signal thrown exception.
900 __ li(v0, Operand(EXCEPTION));
901 __ jmp(&return_v0);
902 }
903 }
904
905 CodeDesc code_desc;
906 masm_->GetCode(&code_desc);
907 Handle<Code> code = isolate()->factory()->NewCode(
908 code_desc, Code::ComputeFlags(Code::REGEXP), masm_->CodeObject());
909 LOG(masm_->isolate(), RegExpCodeCreateEvent(*code, *source));
910 return Handle<HeapObject>::cast(code);
911 }
912
913
GoTo(Label * to)914 void RegExpMacroAssemblerMIPS::GoTo(Label* to) {
915 if (to == NULL) {
916 Backtrack();
917 return;
918 }
919 __ jmp(to);
920 return;
921 }
922
923
IfRegisterGE(int reg,int comparand,Label * if_ge)924 void RegExpMacroAssemblerMIPS::IfRegisterGE(int reg,
925 int comparand,
926 Label* if_ge) {
927 __ ld(a0, register_location(reg));
928 BranchOrBacktrack(if_ge, ge, a0, Operand(comparand));
929 }
930
931
IfRegisterLT(int reg,int comparand,Label * if_lt)932 void RegExpMacroAssemblerMIPS::IfRegisterLT(int reg,
933 int comparand,
934 Label* if_lt) {
935 __ ld(a0, register_location(reg));
936 BranchOrBacktrack(if_lt, lt, a0, Operand(comparand));
937 }
938
939
IfRegisterEqPos(int reg,Label * if_eq)940 void RegExpMacroAssemblerMIPS::IfRegisterEqPos(int reg,
941 Label* if_eq) {
942 __ ld(a0, register_location(reg));
943 BranchOrBacktrack(if_eq, eq, a0, Operand(current_input_offset()));
944 }
945
946
947 RegExpMacroAssembler::IrregexpImplementation
Implementation()948 RegExpMacroAssemblerMIPS::Implementation() {
949 return kMIPSImplementation;
950 }
951
952
LoadCurrentCharacter(int cp_offset,Label * on_end_of_input,bool check_bounds,int characters)953 void RegExpMacroAssemblerMIPS::LoadCurrentCharacter(int cp_offset,
954 Label* on_end_of_input,
955 bool check_bounds,
956 int characters) {
957 DCHECK(cp_offset >= -1); // ^ and \b can look behind one character.
958 DCHECK(cp_offset < (1<<30)); // Be sane! (And ensure negation works).
959 if (check_bounds) {
960 CheckPosition(cp_offset + characters - 1, on_end_of_input);
961 }
962 LoadCurrentCharacterUnchecked(cp_offset, characters);
963 }
964
965
PopCurrentPosition()966 void RegExpMacroAssemblerMIPS::PopCurrentPosition() {
967 Pop(current_input_offset());
968 }
969
970
PopRegister(int register_index)971 void RegExpMacroAssemblerMIPS::PopRegister(int register_index) {
972 Pop(a0);
973 __ sd(a0, register_location(register_index));
974 }
975
976
PushBacktrack(Label * label)977 void RegExpMacroAssemblerMIPS::PushBacktrack(Label* label) {
978 if (label->is_bound()) {
979 int target = label->pos();
980 __ li(a0, Operand(target + Code::kHeaderSize - kHeapObjectTag));
981 } else {
982 Assembler::BlockTrampolinePoolScope block_trampoline_pool(masm_);
983 Label after_constant;
984 __ Branch(&after_constant);
985 int offset = masm_->pc_offset();
986 int cp_offset = offset + Code::kHeaderSize - kHeapObjectTag;
987 __ emit(0);
988 masm_->label_at_put(label, offset);
989 __ bind(&after_constant);
990 if (is_int16(cp_offset)) {
991 __ lwu(a0, MemOperand(code_pointer(), cp_offset));
992 } else {
993 __ Daddu(a0, code_pointer(), cp_offset);
994 __ lwu(a0, MemOperand(a0, 0));
995 }
996 }
997 Push(a0);
998 CheckStackLimit();
999 }
1000
1001
PushCurrentPosition()1002 void RegExpMacroAssemblerMIPS::PushCurrentPosition() {
1003 Push(current_input_offset());
1004 }
1005
1006
PushRegister(int register_index,StackCheckFlag check_stack_limit)1007 void RegExpMacroAssemblerMIPS::PushRegister(int register_index,
1008 StackCheckFlag check_stack_limit) {
1009 __ ld(a0, register_location(register_index));
1010 Push(a0);
1011 if (check_stack_limit) CheckStackLimit();
1012 }
1013
1014
ReadCurrentPositionFromRegister(int reg)1015 void RegExpMacroAssemblerMIPS::ReadCurrentPositionFromRegister(int reg) {
1016 __ ld(current_input_offset(), register_location(reg));
1017 }
1018
1019
ReadStackPointerFromRegister(int reg)1020 void RegExpMacroAssemblerMIPS::ReadStackPointerFromRegister(int reg) {
1021 __ ld(backtrack_stackpointer(), register_location(reg));
1022 __ ld(a0, MemOperand(frame_pointer(), kStackHighEnd));
1023 __ Daddu(backtrack_stackpointer(), backtrack_stackpointer(), Operand(a0));
1024 }
1025
1026
SetCurrentPositionFromEnd(int by)1027 void RegExpMacroAssemblerMIPS::SetCurrentPositionFromEnd(int by) {
1028 Label after_position;
1029 __ Branch(&after_position,
1030 ge,
1031 current_input_offset(),
1032 Operand(-by * char_size()));
1033 __ li(current_input_offset(), -by * char_size());
1034 // On RegExp code entry (where this operation is used), the character before
1035 // the current position is expected to be already loaded.
1036 // We have advanced the position, so it's safe to read backwards.
1037 LoadCurrentCharacterUnchecked(-1, 1);
1038 __ bind(&after_position);
1039 }
1040
1041
SetRegister(int register_index,int to)1042 void RegExpMacroAssemblerMIPS::SetRegister(int register_index, int to) {
1043 DCHECK(register_index >= num_saved_registers_); // Reserved for positions!
1044 __ li(a0, Operand(to));
1045 __ sd(a0, register_location(register_index));
1046 }
1047
1048
Succeed()1049 bool RegExpMacroAssemblerMIPS::Succeed() {
1050 __ jmp(&success_label_);
1051 return global();
1052 }
1053
1054
WriteCurrentPositionToRegister(int reg,int cp_offset)1055 void RegExpMacroAssemblerMIPS::WriteCurrentPositionToRegister(int reg,
1056 int cp_offset) {
1057 if (cp_offset == 0) {
1058 __ sd(current_input_offset(), register_location(reg));
1059 } else {
1060 __ Daddu(a0, current_input_offset(), Operand(cp_offset * char_size()));
1061 __ sd(a0, register_location(reg));
1062 }
1063 }
1064
1065
ClearRegisters(int reg_from,int reg_to)1066 void RegExpMacroAssemblerMIPS::ClearRegisters(int reg_from, int reg_to) {
1067 DCHECK(reg_from <= reg_to);
1068 __ ld(a0, MemOperand(frame_pointer(), kInputStartMinusOne));
1069 for (int reg = reg_from; reg <= reg_to; reg++) {
1070 __ sd(a0, register_location(reg));
1071 }
1072 }
1073
1074
WriteStackPointerToRegister(int reg)1075 void RegExpMacroAssemblerMIPS::WriteStackPointerToRegister(int reg) {
1076 __ ld(a1, MemOperand(frame_pointer(), kStackHighEnd));
1077 __ Dsubu(a0, backtrack_stackpointer(), a1);
1078 __ sd(a0, register_location(reg));
1079 }
1080
1081
CanReadUnaligned()1082 bool RegExpMacroAssemblerMIPS::CanReadUnaligned() {
1083 return false;
1084 }
1085
1086
1087 // Private methods:
1088
CallCheckStackGuardState(Register scratch)1089 void RegExpMacroAssemblerMIPS::CallCheckStackGuardState(Register scratch) {
1090 int stack_alignment = base::OS::ActivationFrameAlignment();
1091
1092 // Align the stack pointer and save the original sp value on the stack.
1093 __ mov(scratch, sp);
1094 __ Dsubu(sp, sp, Operand(kPointerSize));
1095 DCHECK(base::bits::IsPowerOfTwo32(stack_alignment));
1096 __ And(sp, sp, Operand(-stack_alignment));
1097 __ sd(scratch, MemOperand(sp));
1098
1099 __ mov(a2, frame_pointer());
1100 // Code* of self.
1101 __ li(a1, Operand(masm_->CodeObject()), CONSTANT_SIZE);
1102
1103 // We need to make room for the return address on the stack.
1104 DCHECK(IsAligned(stack_alignment, kPointerSize));
1105 __ Dsubu(sp, sp, Operand(stack_alignment));
1106
1107 // Stack pointer now points to cell where return address is to be written.
1108 // Arguments are in registers, meaning we teat the return address as
1109 // argument 5. Since DirectCEntryStub will handleallocating space for the C
1110 // argument slots, we don't need to care about that here. This is how the
1111 // stack will look (sp meaning the value of sp at this moment):
1112 // [sp + 3] - empty slot if needed for alignment.
1113 // [sp + 2] - saved sp.
1114 // [sp + 1] - second word reserved for return value.
1115 // [sp + 0] - first word reserved for return value.
1116
1117 // a0 will point to the return address, placed by DirectCEntry.
1118 __ mov(a0, sp);
1119
1120 ExternalReference stack_guard_check =
1121 ExternalReference::re_check_stack_guard_state(masm_->isolate());
1122 __ li(t9, Operand(stack_guard_check));
1123 DirectCEntryStub stub(isolate());
1124 stub.GenerateCall(masm_, t9);
1125
1126 // DirectCEntryStub allocated space for the C argument slots so we have to
1127 // drop them with the return address from the stack with loading saved sp.
1128 // At this point stack must look:
1129 // [sp + 7] - empty slot if needed for alignment.
1130 // [sp + 6] - saved sp.
1131 // [sp + 5] - second word reserved for return value.
1132 // [sp + 4] - first word reserved for return value.
1133 // [sp + 3] - C argument slot.
1134 // [sp + 2] - C argument slot.
1135 // [sp + 1] - C argument slot.
1136 // [sp + 0] - C argument slot.
1137 __ ld(sp, MemOperand(sp, stack_alignment + kCArgsSlotsSize));
1138
1139 __ li(code_pointer(), Operand(masm_->CodeObject()));
1140 }
1141
1142
1143 // Helper function for reading a value out of a stack frame.
1144 template <typename T>
frame_entry(Address re_frame,int frame_offset)1145 static T& frame_entry(Address re_frame, int frame_offset) {
1146 return reinterpret_cast<T&>(Memory::int32_at(re_frame + frame_offset));
1147 }
1148
1149
CheckStackGuardState(Address * return_address,Code * re_code,Address re_frame)1150 int RegExpMacroAssemblerMIPS::CheckStackGuardState(Address* return_address,
1151 Code* re_code,
1152 Address re_frame) {
1153 Isolate* isolate = frame_entry<Isolate*>(re_frame, kIsolate);
1154 StackLimitCheck check(isolate);
1155 if (check.JsHasOverflowed()) {
1156 isolate->StackOverflow();
1157 return EXCEPTION;
1158 }
1159
1160 // If not real stack overflow the stack guard was used to interrupt
1161 // execution for another purpose.
1162
1163 // If this is a direct call from JavaScript retry the RegExp forcing the call
1164 // through the runtime system. Currently the direct call cannot handle a GC.
1165 if (frame_entry<int>(re_frame, kDirectCall) == 1) {
1166 return RETRY;
1167 }
1168
1169 // Prepare for possible GC.
1170 HandleScope handles(isolate);
1171 Handle<Code> code_handle(re_code);
1172
1173 Handle<String> subject(frame_entry<String*>(re_frame, kInputString));
1174 // Current string.
1175 bool is_one_byte = subject->IsOneByteRepresentationUnderneath();
1176
1177 DCHECK(re_code->instruction_start() <= *return_address);
1178 DCHECK(*return_address <=
1179 re_code->instruction_start() + re_code->instruction_size());
1180
1181 Object* result = isolate->stack_guard()->HandleInterrupts();
1182
1183 if (*code_handle != re_code) { // Return address no longer valid.
1184 int delta = code_handle->address() - re_code->address();
1185 // Overwrite the return address on the stack.
1186 *return_address += delta;
1187 }
1188
1189 if (result->IsException()) {
1190 return EXCEPTION;
1191 }
1192
1193 Handle<String> subject_tmp = subject;
1194 int slice_offset = 0;
1195
1196 // Extract the underlying string and the slice offset.
1197 if (StringShape(*subject_tmp).IsCons()) {
1198 subject_tmp = Handle<String>(ConsString::cast(*subject_tmp)->first());
1199 } else if (StringShape(*subject_tmp).IsSliced()) {
1200 SlicedString* slice = SlicedString::cast(*subject_tmp);
1201 subject_tmp = Handle<String>(slice->parent());
1202 slice_offset = slice->offset();
1203 }
1204
1205 // String might have changed.
1206 if (subject_tmp->IsOneByteRepresentation() != is_one_byte) {
1207 // If we changed between an Latin1 and an UC16 string, the specialized
1208 // code cannot be used, and we need to restart regexp matching from
1209 // scratch (including, potentially, compiling a new version of the code).
1210 return RETRY;
1211 }
1212
1213 // Otherwise, the content of the string might have moved. It must still
1214 // be a sequential or external string with the same content.
1215 // Update the start and end pointers in the stack frame to the current
1216 // location (whether it has actually moved or not).
1217 DCHECK(StringShape(*subject_tmp).IsSequential() ||
1218 StringShape(*subject_tmp).IsExternal());
1219
1220 // The original start address of the characters to match.
1221 const byte* start_address = frame_entry<const byte*>(re_frame, kInputStart);
1222
1223 // Find the current start address of the same character at the current string
1224 // position.
1225 int start_index = frame_entry<int>(re_frame, kStartIndex);
1226 const byte* new_address = StringCharacterPosition(*subject_tmp,
1227 start_index + slice_offset);
1228
1229 if (start_address != new_address) {
1230 // If there is a difference, update the object pointer and start and end
1231 // addresses in the RegExp stack frame to match the new value.
1232 const byte* end_address = frame_entry<const byte* >(re_frame, kInputEnd);
1233 int byte_length = static_cast<int>(end_address - start_address);
1234 frame_entry<const String*>(re_frame, kInputString) = *subject;
1235 frame_entry<const byte*>(re_frame, kInputStart) = new_address;
1236 frame_entry<const byte*>(re_frame, kInputEnd) = new_address + byte_length;
1237 } else if (frame_entry<const String*>(re_frame, kInputString) != *subject) {
1238 // Subject string might have been a ConsString that underwent
1239 // short-circuiting during GC. That will not change start_address but
1240 // will change pointer inside the subject handle.
1241 frame_entry<const String*>(re_frame, kInputString) = *subject;
1242 }
1243
1244 return 0;
1245 }
1246
1247
register_location(int register_index)1248 MemOperand RegExpMacroAssemblerMIPS::register_location(int register_index) {
1249 DCHECK(register_index < (1<<30));
1250 if (num_registers_ <= register_index) {
1251 num_registers_ = register_index + 1;
1252 }
1253 return MemOperand(frame_pointer(),
1254 kRegisterZero - register_index * kPointerSize);
1255 }
1256
1257
CheckPosition(int cp_offset,Label * on_outside_input)1258 void RegExpMacroAssemblerMIPS::CheckPosition(int cp_offset,
1259 Label* on_outside_input) {
1260 BranchOrBacktrack(on_outside_input,
1261 ge,
1262 current_input_offset(),
1263 Operand(-cp_offset * char_size()));
1264 }
1265
1266
BranchOrBacktrack(Label * to,Condition condition,Register rs,const Operand & rt)1267 void RegExpMacroAssemblerMIPS::BranchOrBacktrack(Label* to,
1268 Condition condition,
1269 Register rs,
1270 const Operand& rt) {
1271 if (condition == al) { // Unconditional.
1272 if (to == NULL) {
1273 Backtrack();
1274 return;
1275 }
1276 __ jmp(to);
1277 return;
1278 }
1279 if (to == NULL) {
1280 __ Branch(&backtrack_label_, condition, rs, rt);
1281 return;
1282 }
1283 __ Branch(to, condition, rs, rt);
1284 }
1285
1286
SafeCall(Label * to,Condition cond,Register rs,const Operand & rt)1287 void RegExpMacroAssemblerMIPS::SafeCall(Label* to,
1288 Condition cond,
1289 Register rs,
1290 const Operand& rt) {
1291 __ BranchAndLink(to, cond, rs, rt);
1292 }
1293
1294
SafeReturn()1295 void RegExpMacroAssemblerMIPS::SafeReturn() {
1296 __ pop(ra);
1297 __ Daddu(t1, ra, Operand(masm_->CodeObject()));
1298 __ Jump(t1);
1299 }
1300
1301
SafeCallTarget(Label * name)1302 void RegExpMacroAssemblerMIPS::SafeCallTarget(Label* name) {
1303 __ bind(name);
1304 __ Dsubu(ra, ra, Operand(masm_->CodeObject()));
1305 __ push(ra);
1306 }
1307
1308
Push(Register source)1309 void RegExpMacroAssemblerMIPS::Push(Register source) {
1310 DCHECK(!source.is(backtrack_stackpointer()));
1311 __ Daddu(backtrack_stackpointer(),
1312 backtrack_stackpointer(),
1313 Operand(-kIntSize));
1314 __ sw(source, MemOperand(backtrack_stackpointer()));
1315 }
1316
1317
Pop(Register target)1318 void RegExpMacroAssemblerMIPS::Pop(Register target) {
1319 DCHECK(!target.is(backtrack_stackpointer()));
1320 __ lw(target, MemOperand(backtrack_stackpointer()));
1321 __ Daddu(backtrack_stackpointer(), backtrack_stackpointer(), kIntSize);
1322 }
1323
1324
CheckPreemption()1325 void RegExpMacroAssemblerMIPS::CheckPreemption() {
1326 // Check for preemption.
1327 ExternalReference stack_limit =
1328 ExternalReference::address_of_stack_limit(masm_->isolate());
1329 __ li(a0, Operand(stack_limit));
1330 __ ld(a0, MemOperand(a0));
1331 SafeCall(&check_preempt_label_, ls, sp, Operand(a0));
1332 }
1333
1334
CheckStackLimit()1335 void RegExpMacroAssemblerMIPS::CheckStackLimit() {
1336 ExternalReference stack_limit =
1337 ExternalReference::address_of_regexp_stack_limit(masm_->isolate());
1338
1339 __ li(a0, Operand(stack_limit));
1340 __ ld(a0, MemOperand(a0));
1341 SafeCall(&stack_overflow_label_, ls, backtrack_stackpointer(), Operand(a0));
1342 }
1343
1344
LoadCurrentCharacterUnchecked(int cp_offset,int characters)1345 void RegExpMacroAssemblerMIPS::LoadCurrentCharacterUnchecked(int cp_offset,
1346 int characters) {
1347 Register offset = current_input_offset();
1348 if (cp_offset != 0) {
1349 // t3 is not being used to store the capture start index at this point.
1350 __ Daddu(t3, current_input_offset(), Operand(cp_offset * char_size()));
1351 offset = t3;
1352 }
1353 // We assume that we cannot do unaligned loads on MIPS, so this function
1354 // must only be used to load a single character at a time.
1355 DCHECK(characters == 1);
1356 __ Daddu(t1, end_of_input_address(), Operand(offset));
1357 if (mode_ == LATIN1) {
1358 __ lbu(current_character(), MemOperand(t1, 0));
1359 } else {
1360 DCHECK(mode_ == UC16);
1361 __ lhu(current_character(), MemOperand(t1, 0));
1362 }
1363 }
1364
1365 #undef __
1366
1367 #endif // V8_INTERPRETED_REGEXP
1368
1369 }} // namespace v8::internal
1370
1371 #endif // V8_TARGET_ARCH_MIPS64
1372