1 // Copyright 2014 the V8 project authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4
5 #if V8_TARGET_ARCH_PPC || V8_TARGET_ARCH_PPC64
6
7 #include "src/regexp/ppc/regexp-macro-assembler-ppc.h"
8
9 #include "src/codegen/macro-assembler.h"
10 #include "src/codegen/ppc/assembler-ppc-inl.h"
11 #include "src/heap/factory.h"
12 #include "src/logging/log.h"
13 #include "src/objects/code-inl.h"
14 #include "src/regexp/regexp-stack.h"
15 #include "src/snapshot/embedded/embedded-data-inl.h"
16
17 namespace v8 {
18 namespace internal {
19
20 /*
21 * This assembler uses the following register assignment convention
22 * - r25: Temporarily stores the index of capture start after a matching pass
23 * for a global regexp.
24 * - r26: Pointer to current Code object including heap object tag.
25 * - r27: Current position in input, as negative offset from end of string.
26 * Please notice that this is the byte offset, not the character offset!
27 * - r28: Currently loaded character. Must be loaded using
28 * LoadCurrentCharacter before using any of the dispatch methods.
29 * - r29: Points to tip of backtrack stack
30 * - r30: End of input (points to byte after last character in input).
31 * - r31: Frame pointer. Used to access arguments, local variables and
32 * RegExp registers.
33 * - r12: IP register, used by assembler. Very volatile.
34 * - r1/sp : Points to tip of C stack.
35 *
36 * The remaining registers are free for computations.
37 * Each call to a public method should retain this convention.
38 *
39 * The stack will have the following structure
40 * - fp[44] Address regexp (address of the JSRegExp object; unused in
41 * native code, passed to match signature of
42 * the interpreter):
43 * - fp[40] Isolate* isolate (address of the current isolate)
44 * - fp[36] lr save area (currently unused)
45 * - fp[32] backchain (currently unused)
46 * --- sp when called ---
47 * - fp[28] return address (lr).
48 * - fp[24] old frame pointer (r31).
49 * - fp[0..20] backup of registers r25..r30
50 * --- frame pointer ----
51 * - fp[-4] direct_call (if 1, direct call from JavaScript code,
52 * if 0, call through the runtime system).
53 * - fp[-8] stack_area_base (high end of the memory area to use as
54 * backtracking stack).
55 * - fp[-12] capture array size (may fit multiple sets of matches)
56 * - fp[-16] int* capture_array (int[num_saved_registers_], for output).
57 * - fp[-20] end of input (address of end of string).
58 * - fp[-24] start of input (address of first character in string).
59 * - fp[-28] start index (character index of start).
60 * - fp[-32] void* input_string (location of a handle containing the string).
61 * - fp[-36] success counter (only for global regexps to count matches).
62 * - fp[-40] Offset of location before start of input (effectively character
63 * string start - 1). Used to initialize capture registers to a
64 * non-position.
65 * - fp[-44] At start (if 1, we are starting at the start of the
66 * string, otherwise 0)
67 * - fp[-48] register 0 (Only positions must be stored in the first
68 * - register 1 num_saved_registers_ registers)
69 * - ...
70 * - register num_registers-1
71 * --- sp ---
72 *
73 * The first num_saved_registers_ registers are initialized to point to
74 * "character -1" in the string (i.e., char_size() bytes before the first
75 * character of the string). The remaining registers start out as garbage.
76 *
77 * The data up to the return address must be placed there by the calling
78 * code and the remaining arguments are passed in registers, e.g. by calling the
79 * code entry as cast to a function with the signature:
80 * int (*match)(String input_string,
81 * int start_index,
82 * Address start,
83 * Address end,
84 * int* capture_output_array,
85 * int num_capture_registers,
86 * byte* stack_area_base,
87 * bool direct_call = false,
88 * Isolate* isolate,
89 * Address regexp);
90 * The call is performed by NativeRegExpMacroAssembler::Execute()
91 * (in regexp-macro-assembler.cc) via the GeneratedCode wrapper.
92 */
93
94 #define __ ACCESS_MASM(masm_)
95
96 const int RegExpMacroAssemblerPPC::kRegExpCodeSize;
97
RegExpMacroAssemblerPPC(Isolate* isolate, Zone* zone, Mode mode, int registers_to_save)98 RegExpMacroAssemblerPPC::RegExpMacroAssemblerPPC(Isolate* isolate, Zone* zone,
99 Mode mode,
100 int registers_to_save)
101 : NativeRegExpMacroAssembler(isolate, zone),
102 masm_(std::make_unique<MacroAssembler>(
103 isolate, CodeObjectRequired::kYes,
104 NewAssemblerBuffer(kRegExpCodeSize))),
105 no_root_array_scope_(masm_.get()),
106 mode_(mode),
107 num_registers_(registers_to_save),
108 num_saved_registers_(registers_to_save),
109 entry_label_(),
110 start_label_(),
111 success_label_(),
112 backtrack_label_(),
113 exit_label_(),
114 internal_failure_label_() {
115 DCHECK_EQ(0, registers_to_save % 2);
116
117
118 __ b(&entry_label_); // We'll write the entry code later.
119 // If the code gets too big or corrupted, an internal exception will be
120 // raised, and we will exit right away.
121 __ bind(&internal_failure_label_);
122 __ li(r3, Operand(FAILURE));
123 __ Ret();
124 __ bind(&start_label_); // And then continue from here.
125 }
126
~RegExpMacroAssemblerPPC()127 RegExpMacroAssemblerPPC::~RegExpMacroAssemblerPPC() {
128 // Unuse labels in case we throw away the assembler without calling GetCode.
129 entry_label_.Unuse();
130 start_label_.Unuse();
131 success_label_.Unuse();
132 backtrack_label_.Unuse();
133 exit_label_.Unuse();
134 check_preempt_label_.Unuse();
135 stack_overflow_label_.Unuse();
136 internal_failure_label_.Unuse();
137 fallback_label_.Unuse();
138 }
139
140
stack_limit_slack()141 int RegExpMacroAssemblerPPC::stack_limit_slack() {
142 return RegExpStack::kStackLimitSlack;
143 }
144
145
AdvanceCurrentPosition(int by)146 void RegExpMacroAssemblerPPC::AdvanceCurrentPosition(int by) {
147 if (by != 0) {
148 if (is_int16(by * char_size())) {
149 __ addi(current_input_offset(), current_input_offset(),
150 Operand(by * char_size()));
151 } else {
152 __ mov(r0, Operand(by * char_size()));
153 __ add(current_input_offset(), r0, current_input_offset());
154 }
155 }
156 }
157
158
AdvanceRegister(int reg, int by)159 void RegExpMacroAssemblerPPC::AdvanceRegister(int reg, int by) {
160 DCHECK_LE(0, reg);
161 DCHECK_GT(num_registers_, reg);
162 if (by != 0) {
163 __ LoadU64(r3, register_location(reg), r0);
164 __ mov(r0, Operand(by));
165 __ add(r3, r3, r0);
166 __ StoreU64(r3, register_location(reg), r0);
167 }
168 }
169
170
Backtrack()171 void RegExpMacroAssemblerPPC::Backtrack() {
172 CheckPreemption();
173 if (has_backtrack_limit()) {
174 Label next;
175 __ LoadU64(r3, MemOperand(frame_pointer(), kBacktrackCount), r0);
176 __ addi(r3, r3, Operand(1));
177 __ StoreU64(r3, MemOperand(frame_pointer(), kBacktrackCount), r0);
178 __ mov(r0, Operand(backtrack_limit()));
179 __ CmpS64(r3, r0);
180 __ bne(&next);
181
182 // Backtrack limit exceeded.
183 if (can_fallback()) {
184 __ b(&fallback_label_);
185 } else {
186 // Can't fallback, so we treat it as a failed match.
187 Fail();
188 }
189
190 __ bind(&next);
191 }
192 // Pop Code offset from backtrack stack, add Code and jump to location.
193 Pop(r3);
194 __ add(r3, r3, code_pointer());
195 __ Jump(r3);
196 }
197
198
Bind(Label* label)199 void RegExpMacroAssemblerPPC::Bind(Label* label) { __ bind(label); }
200
201
CheckCharacter(uint32_t c, Label* on_equal)202 void RegExpMacroAssemblerPPC::CheckCharacter(uint32_t c, Label* on_equal) {
203 __ CmpU64(current_character(), Operand(c), r0);
204 BranchOrBacktrack(eq, on_equal);
205 }
206
CheckCharacterGT(base::uc16 limit, Label* on_greater)207 void RegExpMacroAssemblerPPC::CheckCharacterGT(base::uc16 limit,
208 Label* on_greater) {
209 __ CmpU64(current_character(), Operand(limit), r0);
210 BranchOrBacktrack(gt, on_greater);
211 }
212
CheckAtStart(int cp_offset, Label* on_at_start)213 void RegExpMacroAssemblerPPC::CheckAtStart(int cp_offset, Label* on_at_start) {
214 __ LoadU64(r4, MemOperand(frame_pointer(), kStringStartMinusOne));
215 __ addi(r3, current_input_offset(),
216 Operand(-char_size() + cp_offset * char_size()));
217 __ CmpS64(r3, r4);
218 BranchOrBacktrack(eq, on_at_start);
219 }
220
CheckNotAtStart(int cp_offset, Label* on_not_at_start)221 void RegExpMacroAssemblerPPC::CheckNotAtStart(int cp_offset,
222 Label* on_not_at_start) {
223 __ LoadU64(r4, MemOperand(frame_pointer(), kStringStartMinusOne));
224 __ addi(r3, current_input_offset(),
225 Operand(-char_size() + cp_offset * char_size()));
226 __ CmpS64(r3, r4);
227 BranchOrBacktrack(ne, on_not_at_start);
228 }
229
CheckCharacterLT(base::uc16 limit, Label* on_less)230 void RegExpMacroAssemblerPPC::CheckCharacterLT(base::uc16 limit,
231 Label* on_less) {
232 __ CmpU64(current_character(), Operand(limit), r0);
233 BranchOrBacktrack(lt, on_less);
234 }
235
CheckGreedyLoop(Label* on_equal)236 void RegExpMacroAssemblerPPC::CheckGreedyLoop(Label* on_equal) {
237 Label backtrack_non_equal;
238 __ LoadU64(r3, MemOperand(backtrack_stackpointer(), 0));
239 __ CmpS64(current_input_offset(), r3);
240 __ bne(&backtrack_non_equal);
241 __ addi(backtrack_stackpointer(), backtrack_stackpointer(),
242 Operand(kSystemPointerSize));
243
244 __ bind(&backtrack_non_equal);
245 BranchOrBacktrack(eq, on_equal);
246 }
247
CheckNotBackReferenceIgnoreCase( int start_reg, bool read_backward, bool unicode, Label* on_no_match)248 void RegExpMacroAssemblerPPC::CheckNotBackReferenceIgnoreCase(
249 int start_reg, bool read_backward, bool unicode, Label* on_no_match) {
250 Label fallthrough;
251 __ LoadU64(r3, register_location(start_reg),
252 r0); // Index of start of capture
253 __ LoadU64(r4, register_location(start_reg + 1), r0); // Index of end
254 __ sub(r4, r4, r3, LeaveOE, SetRC); // Length of capture.
255
256 // At this point, the capture registers are either both set or both cleared.
257 // If the capture length is zero, then the capture is either empty or cleared.
258 // Fall through in both cases.
259 __ beq(&fallthrough, cr0);
260
261 // Check that there are enough characters left in the input.
262 if (read_backward) {
263 __ LoadU64(r6, MemOperand(frame_pointer(), kStringStartMinusOne));
264 __ add(r6, r6, r4);
265 __ CmpS64(current_input_offset(), r6);
266 BranchOrBacktrack(le, on_no_match);
267 } else {
268 __ add(r0, r4, current_input_offset(), LeaveOE, SetRC);
269 BranchOrBacktrack(gt, on_no_match, cr0);
270 }
271
272 if (mode_ == LATIN1) {
273 Label success;
274 Label fail;
275 Label loop_check;
276
277 // r3 - offset of start of capture
278 // r4 - length of capture
279 __ add(r3, r3, end_of_input_address());
280 __ add(r5, end_of_input_address(), current_input_offset());
281 if (read_backward) {
282 __ sub(r5, r5, r4); // Offset by length when matching backwards.
283 }
284 __ add(r4, r3, r4);
285
286 // r3 - Address of start of capture.
287 // r4 - Address of end of capture
288 // r5 - Address of current input position.
289
290 Label loop;
291 __ bind(&loop);
292 __ lbz(r6, MemOperand(r3));
293 __ addi(r3, r3, Operand(char_size()));
294 __ lbz(r25, MemOperand(r5));
295 __ addi(r5, r5, Operand(char_size()));
296 __ CmpS64(r25, r6);
297 __ beq(&loop_check);
298
299 // Mismatch, try case-insensitive match (converting letters to lower-case).
300 __ ori(r6, r6, Operand(0x20)); // Convert capture character to lower-case.
301 __ ori(r25, r25, Operand(0x20)); // Also convert input character.
302 __ CmpS64(r25, r6);
303 __ bne(&fail);
304 __ subi(r6, r6, Operand('a'));
305 __ cmpli(r6, Operand('z' - 'a')); // Is r6 a lowercase letter?
306 __ ble(&loop_check); // In range 'a'-'z'.
307 // Latin-1: Check for values in range [224,254] but not 247.
308 __ subi(r6, r6, Operand(224 - 'a'));
309 __ cmpli(r6, Operand(254 - 224));
310 __ bgt(&fail); // Weren't Latin-1 letters.
311 __ cmpi(r6, Operand(247 - 224)); // Check for 247.
312 __ beq(&fail);
313
314 __ bind(&loop_check);
315 __ CmpS64(r3, r4);
316 __ blt(&loop);
317 __ b(&success);
318
319 __ bind(&fail);
320 BranchOrBacktrack(al, on_no_match);
321
322 __ bind(&success);
323 // Compute new value of character position after the matched part.
324 __ sub(current_input_offset(), r5, end_of_input_address());
325 if (read_backward) {
326 __ LoadU64(r3,
327 register_location(start_reg)); // Index of start of capture
328 __ LoadU64(r4,
329 register_location(start_reg + 1)); // Index of end of capture
330 __ add(current_input_offset(), current_input_offset(), r3);
331 __ sub(current_input_offset(), current_input_offset(), r4);
332 }
333 } else {
334 DCHECK(mode_ == UC16);
335 int argument_count = 4;
336 __ PrepareCallCFunction(argument_count, r5);
337
338 // r3 - offset of start of capture
339 // r4 - length of capture
340
341 // Put arguments into arguments registers.
342 // Parameters are
343 // r3: Address byte_offset1 - Address captured substring's start.
344 // r4: Address byte_offset2 - Address of current character position.
345 // r5: size_t byte_length - length of capture in bytes(!)
346 // r6: Isolate* isolate.
347
348 // Address of start of capture.
349 __ add(r3, r3, end_of_input_address());
350 // Length of capture.
351 __ mr(r5, r4);
352 // Save length in callee-save register for use on return.
353 __ mr(r25, r4);
354 // Address of current input position.
355 __ add(r4, current_input_offset(), end_of_input_address());
356 if (read_backward) {
357 __ sub(r4, r4, r25);
358 }
359 // Isolate.
360 __ mov(r6, Operand(ExternalReference::isolate_address(isolate())));
361
362 {
363 AllowExternalCallThatCantCauseGC scope(masm_.get());
364 ExternalReference function =
365 unicode
366 ? ExternalReference::re_case_insensitive_compare_unicode()
367 : ExternalReference::re_case_insensitive_compare_non_unicode();
368 __ CallCFunction(function, argument_count);
369 }
370
371 // Check if function returned non-zero for success or zero for failure.
372 __ cmpi(r3, Operand::Zero());
373 BranchOrBacktrack(eq, on_no_match);
374
375 // On success, advance position by length of capture.
376 if (read_backward) {
377 __ sub(current_input_offset(), current_input_offset(), r25);
378 } else {
379 __ add(current_input_offset(), current_input_offset(), r25);
380 }
381 }
382
383 __ bind(&fallthrough);
384 }
385
CheckNotBackReference(int start_reg, bool read_backward, Label* on_no_match)386 void RegExpMacroAssemblerPPC::CheckNotBackReference(int start_reg,
387 bool read_backward,
388 Label* on_no_match) {
389 Label fallthrough;
390
391 // Find length of back-referenced capture.
392 __ LoadU64(r3, register_location(start_reg), r0);
393 __ LoadU64(r4, register_location(start_reg + 1), r0);
394 __ sub(r4, r4, r3, LeaveOE, SetRC); // Length to check.
395
396 // At this point, the capture registers are either both set or both cleared.
397 // If the capture length is zero, then the capture is either empty or cleared.
398 // Fall through in both cases.
399 __ beq(&fallthrough, cr0);
400
401 // Check that there are enough characters left in the input.
402 if (read_backward) {
403 __ LoadU64(r6, MemOperand(frame_pointer(), kStringStartMinusOne));
404 __ add(r6, r6, r4);
405 __ CmpS64(current_input_offset(), r6);
406 BranchOrBacktrack(le, on_no_match);
407 } else {
408 __ add(r0, r4, current_input_offset(), LeaveOE, SetRC);
409 BranchOrBacktrack(gt, on_no_match, cr0);
410 }
411
412 // r3 - offset of start of capture
413 // r4 - length of capture
414 __ add(r3, r3, end_of_input_address());
415 __ add(r5, end_of_input_address(), current_input_offset());
416 if (read_backward) {
417 __ sub(r5, r5, r4); // Offset by length when matching backwards.
418 }
419 __ add(r4, r4, r3);
420
421 Label loop;
422 __ bind(&loop);
423 if (mode_ == LATIN1) {
424 __ lbz(r6, MemOperand(r3));
425 __ addi(r3, r3, Operand(char_size()));
426 __ lbz(r25, MemOperand(r5));
427 __ addi(r5, r5, Operand(char_size()));
428 } else {
429 DCHECK(mode_ == UC16);
430 __ lhz(r6, MemOperand(r3));
431 __ addi(r3, r3, Operand(char_size()));
432 __ lhz(r25, MemOperand(r5));
433 __ addi(r5, r5, Operand(char_size()));
434 }
435 __ CmpS64(r6, r25);
436 BranchOrBacktrack(ne, on_no_match);
437 __ CmpS64(r3, r4);
438 __ blt(&loop);
439
440 // Move current character position to position after match.
441 __ sub(current_input_offset(), r5, end_of_input_address());
442 if (read_backward) {
443 __ LoadU64(r3, register_location(start_reg)); // Index of start of capture
444 __ LoadU64(r4,
445 register_location(start_reg + 1)); // Index of end of capture
446 __ add(current_input_offset(), current_input_offset(), r3);
447 __ sub(current_input_offset(), current_input_offset(), r4);
448 }
449
450 __ bind(&fallthrough);
451 }
452
453
CheckNotCharacter(unsigned c, Label* on_not_equal)454 void RegExpMacroAssemblerPPC::CheckNotCharacter(unsigned c,
455 Label* on_not_equal) {
456 __ CmpU64(current_character(), Operand(c), r0);
457 BranchOrBacktrack(ne, on_not_equal);
458 }
459
460
CheckCharacterAfterAnd(uint32_t c, uint32_t mask, Label* on_equal)461 void RegExpMacroAssemblerPPC::CheckCharacterAfterAnd(uint32_t c, uint32_t mask,
462 Label* on_equal) {
463 __ mov(r0, Operand(mask));
464 if (c == 0) {
465 __ and_(r3, current_character(), r0, SetRC);
466 } else {
467 __ and_(r3, current_character(), r0);
468 __ CmpU64(r3, Operand(c), r0, cr0);
469 }
470 BranchOrBacktrack(eq, on_equal, cr0);
471 }
472
473
CheckNotCharacterAfterAnd(unsigned c, unsigned mask, Label* on_not_equal)474 void RegExpMacroAssemblerPPC::CheckNotCharacterAfterAnd(unsigned c,
475 unsigned mask,
476 Label* on_not_equal) {
477 __ mov(r0, Operand(mask));
478 if (c == 0) {
479 __ and_(r3, current_character(), r0, SetRC);
480 } else {
481 __ and_(r3, current_character(), r0);
482 __ CmpU64(r3, Operand(c), r0, cr0);
483 }
484 BranchOrBacktrack(ne, on_not_equal, cr0);
485 }
486
CheckNotCharacterAfterMinusAnd( base::uc16 c, base::uc16 minus, base::uc16 mask, Label* on_not_equal)487 void RegExpMacroAssemblerPPC::CheckNotCharacterAfterMinusAnd(
488 base::uc16 c, base::uc16 minus, base::uc16 mask, Label* on_not_equal) {
489 DCHECK_GT(String::kMaxUtf16CodeUnit, minus);
490 __ subi(r3, current_character(), Operand(minus));
491 __ mov(r0, Operand(mask));
492 __ and_(r3, r3, r0);
493 __ CmpU64(r3, Operand(c), r0);
494 BranchOrBacktrack(ne, on_not_equal);
495 }
496
CheckCharacterInRange(base::uc16 from, base::uc16 to, Label* on_in_range)497 void RegExpMacroAssemblerPPC::CheckCharacterInRange(base::uc16 from,
498 base::uc16 to,
499 Label* on_in_range) {
500 __ mov(r0, Operand(from));
501 __ sub(r3, current_character(), r0);
502 __ CmpU64(r3, Operand(to - from), r0);
503 BranchOrBacktrack(le, on_in_range); // Unsigned lower-or-same condition.
504 }
505
CheckCharacterNotInRange(base::uc16 from, base::uc16 to, Label* on_not_in_range)506 void RegExpMacroAssemblerPPC::CheckCharacterNotInRange(base::uc16 from,
507 base::uc16 to,
508 Label* on_not_in_range) {
509 __ mov(r0, Operand(from));
510 __ sub(r3, current_character(), r0);
511 __ CmpU64(r3, Operand(to - from), r0);
512 BranchOrBacktrack(gt, on_not_in_range); // Unsigned higher condition.
513 }
514
CallIsCharacterInRangeArray( const ZoneList<CharacterRange>* ranges)515 void RegExpMacroAssemblerPPC::CallIsCharacterInRangeArray(
516 const ZoneList<CharacterRange>* ranges) {
517 static const int kNumArguments = 3;
518 __ PrepareCallCFunction(kNumArguments, r0);
519
520 __ mr(r3, current_character());
521 __ mov(r4, Operand(GetOrAddRangeArray(ranges)));
522 __ mov(r5, Operand(ExternalReference::isolate_address(isolate())));
523
524 {
525 // We have a frame (set up in GetCode), but the assembler doesn't know.
526 FrameScope scope(masm_.get(), StackFrame::MANUAL);
527 __ CallCFunction(ExternalReference::re_is_character_in_range_array(),
528 kNumArguments);
529 }
530
531 __ mov(code_pointer(), Operand(masm_->CodeObject()));
532 }
533
CheckCharacterInRangeArray( const ZoneList<CharacterRange>* ranges, Label* on_in_range)534 bool RegExpMacroAssemblerPPC::CheckCharacterInRangeArray(
535 const ZoneList<CharacterRange>* ranges, Label* on_in_range) {
536 CallIsCharacterInRangeArray(ranges);
537 __ cmpi(r3, Operand::Zero());
538 BranchOrBacktrack(ne, on_in_range);
539 return true;
540 }
541
CheckCharacterNotInRangeArray( const ZoneList<CharacterRange>* ranges, Label* on_not_in_range)542 bool RegExpMacroAssemblerPPC::CheckCharacterNotInRangeArray(
543 const ZoneList<CharacterRange>* ranges, Label* on_not_in_range) {
544 CallIsCharacterInRangeArray(ranges);
545 __ cmpi(r3, Operand::Zero());
546 BranchOrBacktrack(eq, on_not_in_range);
547 return true;
548 }
549
CheckBitInTable(Handle<ByteArray> table, Label* on_bit_set)550 void RegExpMacroAssemblerPPC::CheckBitInTable(Handle<ByteArray> table,
551 Label* on_bit_set) {
552 __ mov(r3, Operand(table));
553 if (mode_ != LATIN1 || kTableMask != String::kMaxOneByteCharCode) {
554 __ andi(r4, current_character(), Operand(kTableSize - 1));
555 __ addi(r4, r4, Operand(ByteArray::kHeaderSize - kHeapObjectTag));
556 } else {
557 __ addi(r4, current_character(),
558 Operand(ByteArray::kHeaderSize - kHeapObjectTag));
559 }
560 __ lbzx(r3, MemOperand(r3, r4));
561 __ cmpi(r3, Operand::Zero());
562 BranchOrBacktrack(ne, on_bit_set);
563 }
564
CheckSpecialCharacterClass( StandardCharacterSet type, Label* on_no_match)565 bool RegExpMacroAssemblerPPC::CheckSpecialCharacterClass(
566 StandardCharacterSet type, Label* on_no_match) {
567 // Range checks (c in min..max) are generally implemented by an unsigned
568 // (c - min) <= (max - min) check
569 // TODO(jgruber): No custom implementation (yet): s(UC16), S(UC16).
570 switch (type) {
571 case StandardCharacterSet::kWhitespace:
572 // Match space-characters.
573 if (mode_ == LATIN1) {
574 // One byte space characters are '\t'..'\r', ' ' and \u00a0.
575 Label success;
576 __ cmpi(current_character(), Operand(' '));
577 __ beq(&success);
578 // Check range 0x09..0x0D.
579 __ subi(r3, current_character(), Operand('\t'));
580 __ cmpli(r3, Operand('\r' - '\t'));
581 __ ble(&success);
582 // \u00a0 (NBSP).
583 __ cmpi(r3, Operand(0x00A0 - '\t'));
584 BranchOrBacktrack(ne, on_no_match);
585 __ bind(&success);
586 return true;
587 }
588 return false;
589 case StandardCharacterSet::kNotWhitespace:
590 // The emitted code for generic character classes is good enough.
591 return false;
592 case StandardCharacterSet::kDigit:
593 // Match ASCII digits ('0'..'9')
594 __ subi(r3, current_character(), Operand('0'));
595 __ cmpli(r3, Operand('9' - '0'));
596 BranchOrBacktrack(gt, on_no_match);
597 return true;
598 case StandardCharacterSet::kNotDigit:
599 // Match non ASCII-digits
600 __ subi(r3, current_character(), Operand('0'));
601 __ cmpli(r3, Operand('9' - '0'));
602 BranchOrBacktrack(le, on_no_match);
603 return true;
604 case StandardCharacterSet::kNotLineTerminator: {
605 // Match non-newlines (not 0x0A('\n'), 0x0D('\r'), 0x2028 and 0x2029)
606 __ xori(r3, current_character(), Operand(0x01));
607 // See if current character is '\n'^1 or '\r'^1, i.e., 0x0B or 0x0C
608 __ subi(r3, r3, Operand(0x0B));
609 __ cmpli(r3, Operand(0x0C - 0x0B));
610 BranchOrBacktrack(le, on_no_match);
611 if (mode_ == UC16) {
612 // Compare original value to 0x2028 and 0x2029, using the already
613 // computed (current_char ^ 0x01 - 0x0B). I.e., check for
614 // 0x201D (0x2028 - 0x0B) or 0x201E.
615 __ subi(r3, r3, Operand(0x2028 - 0x0B));
616 __ cmpli(r3, Operand(1));
617 BranchOrBacktrack(le, on_no_match);
618 }
619 return true;
620 }
621 case StandardCharacterSet::kLineTerminator: {
622 // Match newlines (0x0A('\n'), 0x0D('\r'), 0x2028 and 0x2029)
623 __ xori(r3, current_character(), Operand(0x01));
624 // See if current character is '\n'^1 or '\r'^1, i.e., 0x0B or 0x0C
625 __ subi(r3, r3, Operand(0x0B));
626 __ cmpli(r3, Operand(0x0C - 0x0B));
627 if (mode_ == LATIN1) {
628 BranchOrBacktrack(gt, on_no_match);
629 } else {
630 Label done;
631 __ ble(&done);
632 // Compare original value to 0x2028 and 0x2029, using the already
633 // computed (current_char ^ 0x01 - 0x0B). I.e., check for
634 // 0x201D (0x2028 - 0x0B) or 0x201E.
635 __ subi(r3, r3, Operand(0x2028 - 0x0B));
636 __ cmpli(r3, Operand(1));
637 BranchOrBacktrack(gt, on_no_match);
638 __ bind(&done);
639 }
640 return true;
641 }
642 case StandardCharacterSet::kWord: {
643 if (mode_ != LATIN1) {
644 // Table is 256 entries, so all Latin1 characters can be tested.
645 __ cmpi(current_character(), Operand('z'));
646 BranchOrBacktrack(gt, on_no_match);
647 }
648 ExternalReference map = ExternalReference::re_word_character_map();
649 __ mov(r3, Operand(map));
650 __ lbzx(r3, MemOperand(r3, current_character()));
651 __ cmpli(r3, Operand::Zero());
652 BranchOrBacktrack(eq, on_no_match);
653 return true;
654 }
655 case StandardCharacterSet::kNotWord: {
656 Label done;
657 if (mode_ != LATIN1) {
658 // Table is 256 entries, so all Latin1 characters can be tested.
659 __ cmpli(current_character(), Operand('z'));
660 __ bgt(&done);
661 }
662 ExternalReference map = ExternalReference::re_word_character_map();
663 __ mov(r3, Operand(map));
664 __ lbzx(r3, MemOperand(r3, current_character()));
665 __ cmpli(r3, Operand::Zero());
666 BranchOrBacktrack(ne, on_no_match);
667 if (mode_ != LATIN1) {
668 __ bind(&done);
669 }
670 return true;
671 }
672 case StandardCharacterSet::kEverything:
673 // Match any character.
674 return true;
675 }
676 }
677
Fail()678 void RegExpMacroAssemblerPPC::Fail() {
679 __ li(r3, Operand(FAILURE));
680 __ b(&exit_label_);
681 }
682
LoadRegExpStackPointerFromMemory(Register dst)683 void RegExpMacroAssemblerPPC::LoadRegExpStackPointerFromMemory(Register dst) {
684 ExternalReference ref =
685 ExternalReference::address_of_regexp_stack_stack_pointer(isolate());
686 __ mov(dst, Operand(ref));
687 __ LoadU64(dst, MemOperand(dst));
688 }
689
StoreRegExpStackPointerToMemory( Register src, Register scratch)690 void RegExpMacroAssemblerPPC::StoreRegExpStackPointerToMemory(
691 Register src, Register scratch) {
692 ExternalReference ref =
693 ExternalReference::address_of_regexp_stack_stack_pointer(isolate());
694 __ mov(scratch, Operand(ref));
695 __ StoreU64(src, MemOperand(scratch));
696 }
697
PushRegExpBasePointer(Register stack_pointer, Register scratch)698 void RegExpMacroAssemblerPPC::PushRegExpBasePointer(Register stack_pointer,
699 Register scratch) {
700 ExternalReference ref =
701 ExternalReference::address_of_regexp_stack_memory_top_address(isolate());
702 __ mov(scratch, Operand(ref));
703 __ LoadU64(scratch, MemOperand(scratch));
704 __ SubS64(scratch, stack_pointer, scratch);
705 __ StoreU64(scratch, MemOperand(frame_pointer(), kRegExpStackBasePointer));
706 }
707
PopRegExpBasePointer(Register stack_pointer_out, Register scratch)708 void RegExpMacroAssemblerPPC::PopRegExpBasePointer(Register stack_pointer_out,
709 Register scratch) {
710 ExternalReference ref =
711 ExternalReference::address_of_regexp_stack_memory_top_address(isolate());
712 __ LoadU64(stack_pointer_out,
713 MemOperand(frame_pointer(), kRegExpStackBasePointer));
714 __ mov(scratch, Operand(ref));
715 __ LoadU64(scratch, MemOperand(scratch));
716 __ AddS64(stack_pointer_out, stack_pointer_out, scratch);
717 StoreRegExpStackPointerToMemory(stack_pointer_out, scratch);
718 }
719
GetCode(Handle<String> source)720 Handle<HeapObject> RegExpMacroAssemblerPPC::GetCode(Handle<String> source) {
721 Label return_r3;
722
723 if (masm_->has_exception()) {
724 // If the code gets corrupted due to long regular expressions and lack of
725 // space on trampolines, an internal exception flag is set. If this case
726 // is detected, we will jump into exit sequence right away.
727 __ bind_to(&entry_label_, internal_failure_label_.pos());
728 } else {
729 // Finalize code - write the entry point code now we know how many
730 // registers we need.
731
732 // Entry code:
733 __ bind(&entry_label_);
734
735 // Tell the system that we have a stack frame. Because the type
736 // is MANUAL, no is generated.
737 FrameScope scope(masm_.get(), StackFrame::MANUAL);
738
739 // Ensure register assigments are consistent with callee save mask
740 DCHECK(kRegExpCalleeSaved.has(r25));
741 DCHECK(kRegExpCalleeSaved.has(code_pointer()));
742 DCHECK(kRegExpCalleeSaved.has(current_input_offset()));
743 DCHECK(kRegExpCalleeSaved.has(current_character()));
744 DCHECK(kRegExpCalleeSaved.has(backtrack_stackpointer()));
745 DCHECK(kRegExpCalleeSaved.has(end_of_input_address()));
746 DCHECK(kRegExpCalleeSaved.has(frame_pointer()));
747
748 // Actually emit code to start a new stack frame.
749 // Push arguments
750 // Save callee-save registers.
751 // Start new stack frame.
752 // Store link register in existing stack-cell.
753 // Order here should correspond to order of offset constants in header file.
754 RegList registers_to_retain = kRegExpCalleeSaved;
755 RegList argument_registers = {r3, r4, r5, r6, r7, r8, r9, r10};
756 __ mflr(r0);
757 __ push(r0);
758 __ MultiPush(argument_registers | registers_to_retain);
759 // Set frame pointer in space for it if this is not a direct call
760 // from generated code.
761 __ addi(frame_pointer(), sp, Operand(8 * kSystemPointerSize));
762
763 STATIC_ASSERT(kSuccessfulCaptures == kInputString - kSystemPointerSize);
764 __ li(r3, Operand::Zero());
765 __ push(r3); // Make room for success counter and initialize it to 0.
766 STATIC_ASSERT(kStringStartMinusOne ==
767 kSuccessfulCaptures - kSystemPointerSize);
768 __ push(r3); // Make room for "string start - 1" constant.
769 STATIC_ASSERT(kBacktrackCount == kStringStartMinusOne - kSystemPointerSize);
770 __ push(r3); // The backtrack counter.
771 STATIC_ASSERT(kRegExpStackBasePointer ==
772 kBacktrackCount - kSystemPointerSize);
773 __ push(r3); // The regexp stack base ptr.
774
775 // Initialize backtrack stack pointer. It must not be clobbered from here
776 // on. Note the backtrack_stackpointer is callee-saved.
777 STATIC_ASSERT(backtrack_stackpointer() == r29);
778 LoadRegExpStackPointerFromMemory(backtrack_stackpointer());
779
780 // Store the regexp base pointer - we'll later restore it / write it to
781 // memory when returning from this irregexp code object.
782 PushRegExpBasePointer(backtrack_stackpointer(), r4);
783
784 {
785 // Check if we have space on the stack for registers.
786 Label stack_limit_hit, stack_ok;
787
788 ExternalReference stack_limit =
789 ExternalReference::address_of_jslimit(isolate());
790 __ mov(r3, Operand(stack_limit));
791 __ LoadU64(r3, MemOperand(r3));
792 __ sub(r3, sp, r3, LeaveOE, SetRC);
793 // Handle it if the stack pointer is already below the stack limit.
794 __ ble(&stack_limit_hit, cr0);
795 // Check if there is room for the variable number of registers above
796 // the stack limit.
797 __ CmpU64(r3, Operand(num_registers_ * kSystemPointerSize), r0);
798 __ bge(&stack_ok);
799 // Exit with OutOfMemory exception. There is not enough space on the stack
800 // for our working registers.
801 __ li(r3, Operand(EXCEPTION));
802 __ b(&return_r3);
803
804 __ bind(&stack_limit_hit);
805 CallCheckStackGuardState(r3);
806 __ cmpi(r3, Operand::Zero());
807 // If returned value is non-zero, we exit with the returned value as
808 // result.
809 __ bne(&return_r3);
810
811 __ bind(&stack_ok);
812 }
813
814 // Allocate space on stack for registers.
815 __ AddS64(sp, sp, Operand(-num_registers_ * kSystemPointerSize), r0);
816 // Load string end.
817 __ LoadU64(end_of_input_address(), MemOperand(frame_pointer(), kInputEnd));
818 // Load input start.
819 __ LoadU64(r3, MemOperand(frame_pointer(), kInputStart));
820 // Find negative length (offset of start relative to end).
821 __ sub(current_input_offset(), r3, end_of_input_address());
822 // Set r3 to address of char before start of the input string
823 // (effectively string position -1).
824 __ LoadU64(r4, MemOperand(frame_pointer(), kStartIndex));
825 __ subi(r3, current_input_offset(), Operand(char_size()));
826 if (mode_ == UC16) {
827 __ ShiftLeftU64(r0, r4, Operand(1));
828 __ sub(r3, r3, r0);
829 } else {
830 __ sub(r3, r3, r4);
831 }
832 // Store this value in a local variable, for use when clearing
833 // position registers.
834 __ StoreU64(r3, MemOperand(frame_pointer(), kStringStartMinusOne));
835
836 // Initialize code pointer register
837 __ mov(code_pointer(), Operand(masm_->CodeObject()));
838
839 Label load_char_start_regexp;
840 {
841 Label start_regexp;
842 // Load newline if index is at start, previous character otherwise.
843 __ cmpi(r4, Operand::Zero());
844 __ bne(&load_char_start_regexp);
845 __ li(current_character(), Operand('\n'));
846 __ b(&start_regexp);
847
848 // Global regexp restarts matching here.
849 __ bind(&load_char_start_regexp);
850 // Load previous char as initial value of current character register.
851 LoadCurrentCharacterUnchecked(-1, 1);
852 __ bind(&start_regexp);
853 }
854
855 // Initialize on-stack registers.
856 if (num_saved_registers_ > 0) { // Always is, if generated from a regexp.
857 // Fill saved registers with initial value = start offset - 1
858 if (num_saved_registers_ > 8) {
859 // One slot beyond address of register 0.
860 __ addi(r4, frame_pointer(),
861 Operand(kRegisterZero + kSystemPointerSize));
862 __ mov(r5, Operand(num_saved_registers_));
863 __ mtctr(r5);
864 Label init_loop;
865 __ bind(&init_loop);
866 __ StoreU64WithUpdate(r3, MemOperand(r4, -kSystemPointerSize));
867 __ bdnz(&init_loop);
868 } else {
869 for (int i = 0; i < num_saved_registers_; i++) {
870 __ StoreU64(r3, register_location(i), r0);
871 }
872 }
873 }
874
875 __ b(&start_label_);
876
877 // Exit code:
878 if (success_label_.is_linked()) {
879 // Save captures when successful.
880 __ bind(&success_label_);
881 if (num_saved_registers_ > 0) {
882 // copy captures to output
883 __ LoadU64(r4, MemOperand(frame_pointer(), kInputStart));
884 __ LoadU64(r3, MemOperand(frame_pointer(), kRegisterOutput));
885 __ LoadU64(r5, MemOperand(frame_pointer(), kStartIndex));
886 __ sub(r4, end_of_input_address(), r4);
887 // r4 is length of input in bytes.
888 if (mode_ == UC16) {
889 __ ShiftRightU64(r4, r4, Operand(1));
890 }
891 // r4 is length of input in characters.
892 __ add(r4, r4, r5);
893 // r4 is length of string in characters.
894
895 DCHECK_EQ(0, num_saved_registers_ % 2);
896 // Always an even number of capture registers. This allows us to
897 // unroll the loop once to add an operation between a load of a register
898 // and the following use of that register.
899 for (int i = 0; i < num_saved_registers_; i += 2) {
900 __ LoadU64(r5, register_location(i), r0);
901 __ LoadU64(r6, register_location(i + 1), r0);
902 if (i == 0 && global_with_zero_length_check()) {
903 // Keep capture start in r25 for the zero-length check later.
904 __ mr(r25, r5);
905 }
906 if (mode_ == UC16) {
907 __ ShiftRightS64(r5, r5, Operand(1));
908 __ add(r5, r4, r5);
909 __ ShiftRightS64(r6, r6, Operand(1));
910 __ add(r6, r4, r6);
911 } else {
912 __ add(r5, r4, r5);
913 __ add(r6, r4, r6);
914 }
915 __ stw(r5, MemOperand(r3));
916 __ addi(r3, r3, Operand(kIntSize));
917 __ stw(r6, MemOperand(r3));
918 __ addi(r3, r3, Operand(kIntSize));
919 }
920 }
921
922 if (global()) {
923 // Restart matching if the regular expression is flagged as global.
924 __ LoadU64(r3, MemOperand(frame_pointer(), kSuccessfulCaptures));
925 __ LoadU64(r4, MemOperand(frame_pointer(), kNumOutputRegisters));
926 __ LoadU64(r5, MemOperand(frame_pointer(), kRegisterOutput));
927 // Increment success counter.
928 __ addi(r3, r3, Operand(1));
929 __ StoreU64(r3, MemOperand(frame_pointer(), kSuccessfulCaptures));
930 // Capture results have been stored, so the number of remaining global
931 // output registers is reduced by the number of stored captures.
932 __ subi(r4, r4, Operand(num_saved_registers_));
933 // Check whether we have enough room for another set of capture results.
934 __ cmpi(r4, Operand(num_saved_registers_));
935 __ blt(&return_r3);
936
937 __ StoreU64(r4, MemOperand(frame_pointer(), kNumOutputRegisters));
938 // Advance the location for output.
939 __ addi(r5, r5, Operand(num_saved_registers_ * kIntSize));
940 __ StoreU64(r5, MemOperand(frame_pointer(), kRegisterOutput));
941
942 // Prepare r3 to initialize registers with its value in the next run.
943 __ LoadU64(r3, MemOperand(frame_pointer(), kStringStartMinusOne));
944
945 // Restore the original regexp stack pointer value (effectively, pop the
946 // stored base pointer).
947 PopRegExpBasePointer(backtrack_stackpointer(), r5);
948
949 if (global_with_zero_length_check()) {
950 // Special case for zero-length matches.
951 // r25: capture start index
952 __ CmpS64(current_input_offset(), r25);
953 // Not a zero-length match, restart.
954 __ bne(&load_char_start_regexp);
955 // Offset from the end is zero if we already reached the end.
956 __ cmpi(current_input_offset(), Operand::Zero());
957 __ beq(&exit_label_);
958 // Advance current position after a zero-length match.
959 Label advance;
960 __ bind(&advance);
961 __ addi(current_input_offset(), current_input_offset(),
962 Operand((mode_ == UC16) ? 2 : 1));
963 if (global_unicode()) CheckNotInSurrogatePair(0, &advance);
964 }
965
966 __ b(&load_char_start_regexp);
967 } else {
968 __ li(r3, Operand(SUCCESS));
969 }
970 }
971
972 // Exit and return r3
973 __ bind(&exit_label_);
974 if (global()) {
975 __ LoadU64(r3, MemOperand(frame_pointer(), kSuccessfulCaptures));
976 }
977
978 __ bind(&return_r3);
979 // Restore the original regexp stack pointer value (effectively, pop the
980 // stored base pointer).
981 PopRegExpBasePointer(backtrack_stackpointer(), r5);
982
983 // Skip sp past regexp registers and local variables..
984 __ mr(sp, frame_pointer());
985 // Restore registers r25..r31 and return (restoring lr to pc).
986 __ MultiPop(registers_to_retain);
987 __ pop(r0);
988 __ mtlr(r0);
989 __ blr();
990
991 // Backtrack code (branch target for conditional backtracks).
992 if (backtrack_label_.is_linked()) {
993 __ bind(&backtrack_label_);
994 Backtrack();
995 }
996
997 Label exit_with_exception;
998
999 // Preempt-code
1000 if (check_preempt_label_.is_linked()) {
1001 SafeCallTarget(&check_preempt_label_);
1002
1003 StoreRegExpStackPointerToMemory(backtrack_stackpointer(), r4);
1004
1005 CallCheckStackGuardState(r3);
1006 __ cmpi(r3, Operand::Zero());
1007 // If returning non-zero, we should end execution with the given
1008 // result as return value.
1009 __ bne(&return_r3);
1010
1011 LoadRegExpStackPointerFromMemory(backtrack_stackpointer());
1012
1013 // String might have moved: Reload end of string from frame.
1014 __ LoadU64(end_of_input_address(),
1015 MemOperand(frame_pointer(), kInputEnd));
1016 SafeReturn();
1017 }
1018
1019 // Backtrack stack overflow code.
1020 if (stack_overflow_label_.is_linked()) {
1021 SafeCallTarget(&stack_overflow_label_);
1022
1023 // Call GrowStack(isolate).
1024
1025 StoreRegExpStackPointerToMemory(backtrack_stackpointer(), r4);
1026
1027 static constexpr int kNumArguments = 1;
1028 __ PrepareCallCFunction(kNumArguments, r3);
1029 __ mov(r3, Operand(ExternalReference::isolate_address(isolate())));
1030 ExternalReference grow_stack = ExternalReference::re_grow_stack();
1031 __ CallCFunction(grow_stack, kNumArguments);
1032 // If nullptr is returned, we have failed to grow the stack, and must exit
1033 // with a stack-overflow exception.
1034 __ cmpi(r3, Operand::Zero());
1035 __ beq(&exit_with_exception);
1036 // Otherwise use return value as new stack pointer.
1037 __ mr(backtrack_stackpointer(), r3);
1038 // Restore saved registers and continue.
1039 SafeReturn();
1040 }
1041
1042 if (exit_with_exception.is_linked()) {
1043 // If any of the code above needed to exit with an exception.
1044 __ bind(&exit_with_exception);
1045 // Exit with Result EXCEPTION(-1) to signal thrown exception.
1046 __ li(r3, Operand(EXCEPTION));
1047 __ b(&return_r3);
1048 }
1049
1050 if (fallback_label_.is_linked()) {
1051 __ bind(&fallback_label_);
1052 __ li(r3, Operand(FALLBACK_TO_EXPERIMENTAL));
1053 __ b(&return_r3);
1054 }
1055 }
1056
1057 CodeDesc code_desc;
1058 masm_->GetCode(isolate(), &code_desc);
1059 Handle<Code> code =
1060 Factory::CodeBuilder(isolate(), code_desc, CodeKind::REGEXP)
1061 .set_self_reference(masm_->CodeObject())
1062 .Build();
1063 PROFILE(masm_->isolate(),
1064 RegExpCodeCreateEvent(Handle<AbstractCode>::cast(code), source));
1065 return Handle<HeapObject>::cast(code);
1066 }
1067
1068
GoTo(Label* to)1069 void RegExpMacroAssemblerPPC::GoTo(Label* to) { BranchOrBacktrack(al, to); }
1070
1071
IfRegisterGE(int reg, int comparand, Label* if_ge)1072 void RegExpMacroAssemblerPPC::IfRegisterGE(int reg, int comparand,
1073 Label* if_ge) {
1074 __ LoadU64(r3, register_location(reg), r0);
1075 __ CmpS64(r3, Operand(comparand), r0);
1076 BranchOrBacktrack(ge, if_ge);
1077 }
1078
1079
IfRegisterLT(int reg, int comparand, Label* if_lt)1080 void RegExpMacroAssemblerPPC::IfRegisterLT(int reg, int comparand,
1081 Label* if_lt) {
1082 __ LoadU64(r3, register_location(reg), r0);
1083 __ CmpS64(r3, Operand(comparand), r0);
1084 BranchOrBacktrack(lt, if_lt);
1085 }
1086
1087
IfRegisterEqPos(int reg, Label* if_eq)1088 void RegExpMacroAssemblerPPC::IfRegisterEqPos(int reg, Label* if_eq) {
1089 __ LoadU64(r3, register_location(reg), r0);
1090 __ CmpS64(r3, current_input_offset());
1091 BranchOrBacktrack(eq, if_eq);
1092 }
1093
1094
1095 RegExpMacroAssembler::IrregexpImplementation
Implementation()1096 RegExpMacroAssemblerPPC::Implementation() {
1097 return kPPCImplementation;
1098 }
1099
1100
PopCurrentPosition()1101 void RegExpMacroAssemblerPPC::PopCurrentPosition() {
1102 Pop(current_input_offset());
1103 }
1104
1105
PopRegister(int register_index)1106 void RegExpMacroAssemblerPPC::PopRegister(int register_index) {
1107 Pop(r3);
1108 __ StoreU64(r3, register_location(register_index), r0);
1109 }
1110
1111
PushBacktrack(Label* label)1112 void RegExpMacroAssemblerPPC::PushBacktrack(Label* label) {
1113 __ mov_label_offset(r3, label);
1114 Push(r3);
1115 CheckStackLimit();
1116 }
1117
1118
PushCurrentPosition()1119 void RegExpMacroAssemblerPPC::PushCurrentPosition() {
1120 Push(current_input_offset());
1121 }
1122
1123
PushRegister(int register_index, StackCheckFlag check_stack_limit)1124 void RegExpMacroAssemblerPPC::PushRegister(int register_index,
1125 StackCheckFlag check_stack_limit) {
1126 __ LoadU64(r3, register_location(register_index), r0);
1127 Push(r3);
1128 if (check_stack_limit) CheckStackLimit();
1129 }
1130
1131
ReadCurrentPositionFromRegister(int reg)1132 void RegExpMacroAssemblerPPC::ReadCurrentPositionFromRegister(int reg) {
1133 __ LoadU64(current_input_offset(), register_location(reg), r0);
1134 }
1135
WriteStackPointerToRegister(int reg)1136 void RegExpMacroAssemblerPPC::WriteStackPointerToRegister(int reg) {
1137 ExternalReference ref =
1138 ExternalReference::address_of_regexp_stack_memory_top_address(isolate());
1139 __ mov(r4, Operand(ref));
1140 __ LoadU64(r4, MemOperand(r4));
1141 __ SubS64(r3, backtrack_stackpointer(), r4);
1142 __ StoreU64(r3, register_location(reg), r0);
1143 }
1144
ReadStackPointerFromRegister(int reg)1145 void RegExpMacroAssemblerPPC::ReadStackPointerFromRegister(int reg) {
1146 ExternalReference ref =
1147 ExternalReference::address_of_regexp_stack_memory_top_address(isolate());
1148 __ mov(r3, Operand(ref));
1149 __ LoadU64(r3, MemOperand(r3));
1150 __ LoadU64(backtrack_stackpointer(), register_location(reg), r0);
1151 __ AddS64(backtrack_stackpointer(), backtrack_stackpointer(), r3);
1152 }
1153
SetCurrentPositionFromEnd(int by)1154 void RegExpMacroAssemblerPPC::SetCurrentPositionFromEnd(int by) {
1155 Label after_position;
1156 __ CmpS64(current_input_offset(), Operand(-by * char_size()), r0);
1157 __ bge(&after_position);
1158 __ mov(current_input_offset(), Operand(-by * char_size()));
1159 // On RegExp code entry (where this operation is used), the character before
1160 // the current position is expected to be already loaded.
1161 // We have advanced the position, so it's safe to read backwards.
1162 LoadCurrentCharacterUnchecked(-1, 1);
1163 __ bind(&after_position);
1164 }
1165
1166
SetRegister(int register_index, int to)1167 void RegExpMacroAssemblerPPC::SetRegister(int register_index, int to) {
1168 DCHECK(register_index >= num_saved_registers_); // Reserved for positions!
1169 __ mov(r3, Operand(to));
1170 __ StoreU64(r3, register_location(register_index), r0);
1171 }
1172
1173
Succeed()1174 bool RegExpMacroAssemblerPPC::Succeed() {
1175 __ b(&success_label_);
1176 return global();
1177 }
1178
1179
WriteCurrentPositionToRegister(int reg, int cp_offset)1180 void RegExpMacroAssemblerPPC::WriteCurrentPositionToRegister(int reg,
1181 int cp_offset) {
1182 if (cp_offset == 0) {
1183 __ StoreU64(current_input_offset(), register_location(reg), r0);
1184 } else {
1185 __ mov(r0, Operand(cp_offset * char_size()));
1186 __ add(r3, current_input_offset(), r0);
1187 __ StoreU64(r3, register_location(reg), r0);
1188 }
1189 }
1190
1191
ClearRegisters(int reg_from, int reg_to)1192 void RegExpMacroAssemblerPPC::ClearRegisters(int reg_from, int reg_to) {
1193 DCHECK(reg_from <= reg_to);
1194 __ LoadU64(r3, MemOperand(frame_pointer(), kStringStartMinusOne));
1195 for (int reg = reg_from; reg <= reg_to; reg++) {
1196 __ StoreU64(r3, register_location(reg), r0);
1197 }
1198 }
1199
1200 // Private methods:
1201
CallCheckStackGuardState(Register scratch)1202 void RegExpMacroAssemblerPPC::CallCheckStackGuardState(Register scratch) {
1203 DCHECK(!isolate()->IsGeneratingEmbeddedBuiltins());
1204 DCHECK(!masm_->options().isolate_independent_code);
1205
1206 int frame_alignment = masm_->ActivationFrameAlignment();
1207 int stack_space = kNumRequiredStackFrameSlots;
1208 int stack_passed_arguments = 1; // space for return address pointer
1209
1210 // The following stack manipulation logic is similar to
1211 // PrepareCallCFunction. However, we need an extra slot on the
1212 // stack to house the return address parameter.
1213 if (frame_alignment > kSystemPointerSize) {
1214 // Make stack end at alignment and make room for stack arguments
1215 // -- preserving original value of sp.
1216 __ mr(scratch, sp);
1217 __ addi(sp, sp,
1218 Operand(-(stack_passed_arguments + 1) * kSystemPointerSize));
1219 DCHECK(base::bits::IsPowerOfTwo(frame_alignment));
1220 __ ClearRightImm(sp, sp,
1221 Operand(base::bits::WhichPowerOfTwo(frame_alignment)));
1222 __ StoreU64(scratch,
1223 MemOperand(sp, stack_passed_arguments * kSystemPointerSize));
1224 } else {
1225 // Make room for stack arguments
1226 stack_space += stack_passed_arguments;
1227 }
1228
1229 // Allocate frame with required slots to make ABI work.
1230 __ li(r0, Operand::Zero());
1231 __ StoreU64WithUpdate(r0, MemOperand(sp, -stack_space * kSystemPointerSize));
1232
1233 // RegExp code frame pointer.
1234 __ mr(r5, frame_pointer());
1235 // Code of self.
1236 __ mov(r4, Operand(masm_->CodeObject()));
1237 // r3 will point to the return address, placed by DirectCEntry.
1238 __ addi(r3, sp, Operand(kStackFrameExtraParamSlot * kSystemPointerSize));
1239
1240 ExternalReference stack_guard_check =
1241 ExternalReference::re_check_stack_guard_state();
1242 __ mov(ip, Operand(stack_guard_check));
1243
1244 EmbeddedData d = EmbeddedData::FromBlob();
1245 Address entry = d.InstructionStartOfBuiltin(Builtin::kDirectCEntry);
1246 __ mov(r0, Operand(entry, RelocInfo::OFF_HEAP_TARGET));
1247 __ Call(r0);
1248
1249 // Restore the stack pointer
1250 stack_space = kNumRequiredStackFrameSlots + stack_passed_arguments;
1251 if (frame_alignment > kSystemPointerSize) {
1252 __ LoadU64(sp, MemOperand(sp, stack_space * kSystemPointerSize));
1253 } else {
1254 __ addi(sp, sp, Operand(stack_space * kSystemPointerSize));
1255 }
1256
1257 __ mov(code_pointer(), Operand(masm_->CodeObject()));
1258 }
1259
1260
1261 // Helper function for reading a value out of a stack frame.
1262 template <typename T>
frame_entry(Address re_frame, int frame_offset)1263 static T& frame_entry(Address re_frame, int frame_offset) {
1264 return reinterpret_cast<T&>(Memory<int32_t>(re_frame + frame_offset));
1265 }
1266
1267
1268 template <typename T>
frame_entry_address(Address re_frame, int frame_offset)1269 static T* frame_entry_address(Address re_frame, int frame_offset) {
1270 return reinterpret_cast<T*>(re_frame + frame_offset);
1271 }
1272
CheckStackGuardState(Address* return_address, Address raw_code, Address re_frame)1273 int RegExpMacroAssemblerPPC::CheckStackGuardState(Address* return_address,
1274 Address raw_code,
1275 Address re_frame) {
1276 Code re_code = Code::cast(Object(raw_code));
1277 return NativeRegExpMacroAssembler::CheckStackGuardState(
1278 frame_entry<Isolate*>(re_frame, kIsolate),
1279 frame_entry<intptr_t>(re_frame, kStartIndex),
1280 static_cast<RegExp::CallOrigin>(
1281 frame_entry<intptr_t>(re_frame, kDirectCall)),
1282 return_address, re_code,
1283 frame_entry_address<Address>(re_frame, kInputString),
1284 frame_entry_address<const byte*>(re_frame, kInputStart),
1285 frame_entry_address<const byte*>(re_frame, kInputEnd));
1286 }
1287
1288
register_location(int register_index)1289 MemOperand RegExpMacroAssemblerPPC::register_location(int register_index) {
1290 DCHECK(register_index < (1 << 30));
1291 if (num_registers_ <= register_index) {
1292 num_registers_ = register_index + 1;
1293 }
1294 return MemOperand(frame_pointer(),
1295 kRegisterZero - register_index * kSystemPointerSize);
1296 }
1297
1298
1299 void RegExpMacroAssemblerPPC::CheckPosition(int cp_offset,
1300 Label* on_outside_input) {
1301 if (cp_offset >= 0) {
1302 __ CmpS64(current_input_offset(), Operand(-cp_offset * char_size()), r0);
1303 BranchOrBacktrack(ge, on_outside_input);
1304 } else {
1305 __ LoadU64(r4, MemOperand(frame_pointer(), kStringStartMinusOne));
1306 __ addi(r3, current_input_offset(), Operand(cp_offset * char_size()));
1307 __ CmpS64(r3, r4);
1308 BranchOrBacktrack(le, on_outside_input);
1309 }
1310 }
1311
1312
1313 void RegExpMacroAssemblerPPC::BranchOrBacktrack(Condition condition, Label* to,
1314 CRegister cr) {
1315 if (condition == al) { // Unconditional.
1316 if (to == nullptr) {
1317 Backtrack();
1318 return;
1319 }
1320 __ b(to);
1321 return;
1322 }
1323 if (to == nullptr) {
1324 __ b(condition, &backtrack_label_, cr);
1325 return;
1326 }
1327 __ b(condition, to, cr);
1328 }
1329
1330
1331 void RegExpMacroAssemblerPPC::SafeCall(Label* to, Condition cond,
1332 CRegister cr) {
1333 __ b(cond, to, cr, SetLK);
1334 }
1335
1336
1337 void RegExpMacroAssemblerPPC::SafeReturn() {
1338 __ pop(r0);
1339 __ mov(ip, Operand(masm_->CodeObject()));
1340 __ add(r0, r0, ip);
1341 __ mtlr(r0);
1342 __ blr();
1343 }
1344
1345
1346 void RegExpMacroAssemblerPPC::SafeCallTarget(Label* name) {
1347 __ bind(name);
1348 __ mflr(r0);
1349 __ mov(ip, Operand(masm_->CodeObject()));
1350 __ sub(r0, r0, ip);
1351 __ push(r0);
1352 }
1353
1354
1355 void RegExpMacroAssemblerPPC::Push(Register source) {
1356 DCHECK(source != backtrack_stackpointer());
1357 __ StoreU64WithUpdate(
1358 source, MemOperand(backtrack_stackpointer(), -kSystemPointerSize));
1359 }
1360
1361
1362 void RegExpMacroAssemblerPPC::Pop(Register target) {
1363 DCHECK(target != backtrack_stackpointer());
1364 __ LoadU64(target, MemOperand(backtrack_stackpointer()));
1365 __ addi(backtrack_stackpointer(), backtrack_stackpointer(),
1366 Operand(kSystemPointerSize));
1367 }
1368
1369
1370 void RegExpMacroAssemblerPPC::CheckPreemption() {
1371 // Check for preemption.
1372 ExternalReference stack_limit =
1373 ExternalReference::address_of_jslimit(isolate());
1374 __ mov(r3, Operand(stack_limit));
1375 __ LoadU64(r3, MemOperand(r3));
1376 __ CmpU64(sp, r3);
1377 SafeCall(&check_preempt_label_, le);
1378 }
1379
1380
1381 void RegExpMacroAssemblerPPC::CheckStackLimit() {
1382 ExternalReference stack_limit =
1383 ExternalReference::address_of_regexp_stack_limit_address(isolate());
1384 __ mov(r3, Operand(stack_limit));
1385 __ LoadU64(r3, MemOperand(r3));
1386 __ CmpU64(backtrack_stackpointer(), r3);
1387 SafeCall(&stack_overflow_label_, le);
1388 }
1389
1390
1391 void RegExpMacroAssemblerPPC::LoadCurrentCharacterUnchecked(int cp_offset,
1392 int characters) {
1393 Register offset = current_input_offset();
1394 if (cp_offset != 0) {
1395 // r25 is not being used to store the capture start index at this point.
1396 if (is_int16(cp_offset * char_size())) {
1397 __ addi(r25, current_input_offset(), Operand(cp_offset * char_size()));
1398 } else {
1399 __ mov(r25, Operand(cp_offset * char_size()));
1400 __ add(r25, r25, current_input_offset());
1401 }
1402 offset = r25;
1403 }
1404 // The lwz, stw, lhz, sth instructions can do unaligned accesses, if the CPU
1405 // and the operating system running on the target allow it.
1406 // We assume we don't want to do unaligned loads on PPC, so this function
1407 // must only be used to load a single character at a time.
1408
1409 __ add(current_character(), end_of_input_address(), offset);
1410 #if V8_TARGET_LITTLE_ENDIAN
1411 if (mode_ == LATIN1) {
1412 if (characters == 4) {
1413 __ lwz(current_character(), MemOperand(current_character()));
1414 } else if (characters == 2) {
1415 __ lhz(current_character(), MemOperand(current_character()));
1416 } else {
1417 DCHECK_EQ(1, characters);
1418 __ lbz(current_character(), MemOperand(current_character()));
1419 }
1420 } else {
1421 DCHECK(mode_ == UC16);
1422 if (characters == 2) {
1423 __ lwz(current_character(), MemOperand(current_character()));
1424 } else {
1425 DCHECK_EQ(1, characters);
1426 __ lhz(current_character(), MemOperand(current_character()));
1427 }
1428 }
1429 #else
1430 if (mode_ == LATIN1) {
1431 if (characters == 4) {
1432 __ lwbrx(current_character(), MemOperand(r0, current_character()));
1433 } else if (characters == 2) {
1434 __ lhbrx(current_character(), MemOperand(r0, current_character()));
1435 } else {
1436 DCHECK_EQ(1, characters);
1437 __ lbz(current_character(), MemOperand(current_character()));
1438 }
1439 } else {
1440 DCHECK(mode_ == UC16);
1441 if (characters == 2) {
1442 __ lwz(current_character(), MemOperand(current_character()));
1443 __ rlwinm(current_character(), current_character(), 16, 0, 31);
1444 } else {
1445 DCHECK_EQ(1, characters);
1446 __ lhz(current_character(), MemOperand(current_character()));
1447 }
1448 }
1449 #endif
1450 }
1451
1452 #undef __
1453
1454 } // namespace internal
1455 } // namespace v8
1456
1457 #endif // V8_TARGET_ARCH_PPC || V8_TARGET_ARCH_PPC64
1458