Index: src/ia32/code-stubs-ia32.cc |
diff --git a/src/ia32/code-stubs-ia32.cc b/src/ia32/code-stubs-ia32.cc |
index 5affd6eaf0283d429557c5a1b2e665b0376ed4ec..4055e96cc5fc79b82dcf37f6ddd7ee3fe9a919df 100644 |
--- a/src/ia32/code-stubs-ia32.cc |
+++ b/src/ia32/code-stubs-ia32.cc |
@@ -3827,7 +3827,8 @@ void RegExpExecStub::Generate(MacroAssembler* masm) { |
static const int kSubjectOffset = 3 * kPointerSize; |
static const int kJSRegExpOffset = 4 * kPointerSize; |
- Label runtime, invoke_regexp; |
+ Label runtime; |
+ Factory* factory = masm->isolate()->factory(); |
// Ensure that a RegExp stack is allocated. |
ExternalReference address_of_regexp_stack_memory_address = |
@@ -3845,6 +3846,7 @@ void RegExpExecStub::Generate(MacroAssembler* masm) { |
__ JumpIfSmi(eax, &runtime); |
__ CmpObjectType(eax, JS_REGEXP_TYPE, ecx); |
__ j(not_equal, &runtime); |
+ |
// Check that the RegExp has been compiled (data contains a fixed array). |
__ mov(ecx, FieldOperand(eax, JSRegExp::kDataOffset)); |
if (FLAG_debug_code) { |
@@ -3863,156 +3865,124 @@ void RegExpExecStub::Generate(MacroAssembler* masm) { |
// ecx: RegExp data (FixedArray) |
// Check that the number of captures fit in the static offsets vector buffer. |
__ mov(edx, FieldOperand(ecx, JSRegExp::kIrregexpCaptureCountOffset)); |
- // Calculate number of capture registers (number_of_captures + 1) * 2. This |
- // uses the asumption that smis are 2 * their untagged value. |
+ // Check (number_of_captures + 1) * 2 <= offsets vector size |
+ // Or number_of_captures * 2 <= offsets vector size - 2 |
+ // Multiplying by 2 comes for free since edx is smi-tagged. |
STATIC_ASSERT(kSmiTag == 0); |
STATIC_ASSERT(kSmiTagSize + kSmiShiftSize == 1); |
- __ add(edx, Immediate(2)); // edx was a smi. |
- // Check that the static offsets vector buffer is large enough. |
- __ cmp(edx, Isolate::kJSRegexpStaticOffsetsVectorSize); |
+ STATIC_ASSERT(Isolate::kJSRegexpStaticOffsetsVectorSize >= 2); |
+ __ cmp(edx, Isolate::kJSRegexpStaticOffsetsVectorSize - 2); |
__ j(above, &runtime); |
- // ecx: RegExp data (FixedArray) |
- // edx: Number of capture registers |
- // Check that the second argument is a string. |
- __ mov(eax, Operand(esp, kSubjectOffset)); |
- __ JumpIfSmi(eax, &runtime); |
- Condition is_string = masm->IsObjectStringType(eax, ebx, ebx); |
- __ j(NegateCondition(is_string), &runtime); |
- // Get the length of the string to ebx. |
- __ mov(ebx, FieldOperand(eax, String::kLengthOffset)); |
- |
- // ebx: Length of subject string as a smi |
- // ecx: RegExp data (FixedArray) |
- // edx: Number of capture registers |
- // Check that the third argument is a positive smi less than the subject |
- // string length. A negative value will be greater (unsigned comparison). |
- __ mov(eax, Operand(esp, kPreviousIndexOffset)); |
- __ JumpIfNotSmi(eax, &runtime); |
- __ cmp(eax, ebx); |
- __ j(above_equal, &runtime); |
- |
- // ecx: RegExp data (FixedArray) |
- // edx: Number of capture registers |
- // Check that the fourth object is a JSArray object. |
- __ mov(eax, Operand(esp, kLastMatchInfoOffset)); |
- __ JumpIfSmi(eax, &runtime); |
- __ CmpObjectType(eax, JS_ARRAY_TYPE, ebx); |
- __ j(not_equal, &runtime); |
- // Check that the JSArray is in fast case. |
- __ mov(ebx, FieldOperand(eax, JSArray::kElementsOffset)); |
- __ mov(eax, FieldOperand(ebx, HeapObject::kMapOffset)); |
- Factory* factory = masm->isolate()->factory(); |
- __ cmp(eax, factory->fixed_array_map()); |
- __ j(not_equal, &runtime); |
- // Check that the last match info has space for the capture registers and the |
- // additional information. |
- __ mov(eax, FieldOperand(ebx, FixedArray::kLengthOffset)); |
- __ SmiUntag(eax); |
- __ add(edx, Immediate(RegExpImpl::kLastMatchOverhead)); |
- __ cmp(edx, eax); |
- __ j(greater, &runtime); |
- |
// Reset offset for possibly sliced string. |
__ Set(edi, Immediate(0)); |
- // ecx: RegExp data (FixedArray) |
- // Check the representation and encoding of the subject string. |
- Label seq_ascii_string, seq_two_byte_string, check_code; |
__ mov(eax, Operand(esp, kSubjectOffset)); |
+ __ JumpIfSmi(eax, &runtime); |
+ __ mov(edx, eax); // Make a copy of the original subject string. |
__ mov(ebx, FieldOperand(eax, HeapObject::kMapOffset)); |
__ movzx_b(ebx, FieldOperand(ebx, Map::kInstanceTypeOffset)); |
- // First check for flat two byte string. |
+ |
+ // eax: subject string |
+ // edx: subject string |
+ // ebx: subject string instance type |
+ // ecx: RegExp data (FixedArray) |
+ // Handle subject string according to its encoding and representation: |
+ // (1) Sequential two byte? If yes, go to (9). |
+ // (2) Sequential one byte? If yes, go to (6). |
+ // (3) Anything but sequential or cons? If yes, go to (7). |
+ // (4) Cons string. If the string is flat, replace subject with first string. |
+ // Otherwise bailout. |
+ // (5a) Is subject sequential two byte? If yes, go to (9). |
+ // (5b) Is subject external? If yes, go to (8). |
+ // (6) One byte sequential. Load regexp code for one byte. |
+ // (E) Carry on. |
+ /// [...] |
+ |
+ // Deferred code at the end of the stub: |
+ // (7) Not a long external string? If yes, go to (10). |
+ // (8) External string. Make it, offset-wise, look like a sequential string. |
+ // (8a) Is the external string one byte? If yes, go to (6). |
+ // (9) Two byte sequential. Load regexp code for one byte. Go to (E). |
+ // (10) Short external string or not a string? If yes, bail out to runtime. |
+ // (11) Sliced string. Replace subject with parent. Go to (5a). |
+ |
+ Label seq_one_byte_string /* 6 */, seq_two_byte_string /* 9 */, |
+ external_string /* 8 */, check_underlying /* 5a */, |
+ not_seq_nor_cons /* 7 */, check_code /* E */, |
+ not_long_external /* 10 */; |
+ |
+ // (1) Sequential two byte? If yes, go to (9). |
__ and_(ebx, kIsNotStringMask | |
kStringRepresentationMask | |
kStringEncodingMask | |
kShortExternalStringMask); |
STATIC_ASSERT((kStringTag | kSeqStringTag | kTwoByteStringTag) == 0); |
- __ j(zero, &seq_two_byte_string, Label::kNear); |
- // Any other flat string must be a flat ASCII string. None of the following |
- // string type tests will succeed if subject is not a string or a short |
- // external string. |
+ __ j(zero, &seq_two_byte_string); // Go to (9). |
+ |
+ // (2) Sequential one byte? If yes, go to (6). |
+ // Any other sequential string must be one byte. |
__ and_(ebx, Immediate(kIsNotStringMask | |
kStringRepresentationMask | |
kShortExternalStringMask)); |
- __ j(zero, &seq_ascii_string, Label::kNear); |
- |
- // ebx: whether subject is a string and if yes, its string representation |
- // Check for flat cons string or sliced string. |
- // A flat cons string is a cons string where the second part is the empty |
- // string. In that case the subject string is just the first part of the cons |
- // string. Also in this case the first part of the cons string is known to be |
- // a sequential string or an external string. |
- // In the case of a sliced string its offset has to be taken into account. |
- Label cons_string, external_string, check_encoding; |
+ __ j(zero, &seq_one_byte_string, Label::kNear); // Go to (6). |
+ |
+ // (3) Anything but sequential or cons? If yes, go to (7). |
+ // We check whether the subject string is a cons, since sequential strings |
+ // have already been covered. |
STATIC_ASSERT(kConsStringTag < kExternalStringTag); |
STATIC_ASSERT(kSlicedStringTag > kExternalStringTag); |
STATIC_ASSERT(kIsNotStringMask > kExternalStringTag); |
STATIC_ASSERT(kShortExternalStringTag > kExternalStringTag); |
__ cmp(ebx, Immediate(kExternalStringTag)); |
- __ j(less, &cons_string); |
- __ j(equal, &external_string); |
+ __ j(greater_equal, ¬_seq_nor_cons); // Go to (7). |
- // Catch non-string subject or short external string. |
- STATIC_ASSERT(kNotStringTag != 0 && kShortExternalStringTag !=0); |
- __ test(ebx, Immediate(kIsNotStringMask | kShortExternalStringTag)); |
- __ j(not_zero, &runtime); |
- |
- // String is sliced. |
- __ mov(edi, FieldOperand(eax, SlicedString::kOffsetOffset)); |
- __ mov(eax, FieldOperand(eax, SlicedString::kParentOffset)); |
- // edi: offset of sliced string, smi-tagged. |
- // eax: parent string. |
- __ jmp(&check_encoding, Label::kNear); |
- // String is a cons string, check whether it is flat. |
- __ bind(&cons_string); |
+ // (4) Cons string. Check that it's flat. |
+ // Replace subject with first string and reload instance type. |
__ cmp(FieldOperand(eax, ConsString::kSecondOffset), factory->empty_string()); |
__ j(not_equal, &runtime); |
__ mov(eax, FieldOperand(eax, ConsString::kFirstOffset)); |
- __ bind(&check_encoding); |
+ __ bind(&check_underlying); |
__ mov(ebx, FieldOperand(eax, HeapObject::kMapOffset)); |
- // eax: first part of cons string or parent of sliced string. |
- // ebx: map of first part of cons string or map of parent of sliced string. |
- // Is first part of cons or parent of slice a flat two byte string? |
- __ test_b(FieldOperand(ebx, Map::kInstanceTypeOffset), |
- kStringRepresentationMask | kStringEncodingMask); |
+ __ mov(ebx, FieldOperand(ebx, Map::kInstanceTypeOffset)); |
+ |
+ // (5a) Is subject sequential two byte? If yes, go to (9). |
+ __ test_b(ebx, kStringRepresentationMask | kStringEncodingMask); |
STATIC_ASSERT((kSeqStringTag | kTwoByteStringTag) == 0); |
- __ j(zero, &seq_two_byte_string, Label::kNear); |
- // Any other flat string must be sequential ASCII or external. |
- __ test_b(FieldOperand(ebx, Map::kInstanceTypeOffset), |
- kStringRepresentationMask); |
- __ j(not_zero, &external_string); |
- |
- __ bind(&seq_ascii_string); |
- // eax: subject string (flat ASCII) |
+ __ j(zero, &seq_two_byte_string); // Go to (9). |
+ // (5b) Is subject external? If yes, go to (8). |
+ __ test_b(ebx, kStringRepresentationMask); |
+ // The underlying external string is never a short external string. |
+ STATIC_CHECK(ExternalString::kMaxShortLength < ConsString::kMinLength); |
+ STATIC_CHECK(ExternalString::kMaxShortLength < SlicedString::kMinLength); |
+ __ j(not_zero, &external_string); // Go to (8). |
+ |
+ // eax: sequential subject string (or look-alike, external string) |
+ // edx: original subject string |
// ecx: RegExp data (FixedArray) |
+ // (6) One byte sequential. Load regexp code for one byte. |
+ __ bind(&seq_one_byte_string); |
+ // Load previous index and check range before edx is overwritten. We have |
+ // to use edx instead of eax here because it might have been only made to |
+ // look like a sequential string when it actually is an external string. |
+ __ mov(ebx, Operand(esp, kPreviousIndexOffset)); |
+ __ JumpIfNotSmi(ebx, &runtime); |
+ __ cmp(ebx, FieldOperand(edx, String::kLengthOffset)); |
+ __ j(above_equal, &runtime); |
__ mov(edx, FieldOperand(ecx, JSRegExp::kDataAsciiCodeOffset)); |
- __ Set(ecx, Immediate(1)); // Type is ASCII. |
- __ jmp(&check_code, Label::kNear); |
- |
- __ bind(&seq_two_byte_string); |
- // eax: subject string (flat two byte) |
- // ecx: RegExp data (FixedArray) |
- __ mov(edx, FieldOperand(ecx, JSRegExp::kDataUC16CodeOffset)); |
- __ Set(ecx, Immediate(0)); // Type is two byte. |
+ __ Set(ecx, Immediate(1)); // Type is one byte. |
+ // (E) Carry on. String handling is done. |
__ bind(&check_code); |
+ // edx: irregexp code |
// Check that the irregexp code has been generated for the actual string |
// encoding. If it has, the field contains a code object otherwise it contains |
// a smi (code flushing support). |
__ JumpIfSmi(edx, &runtime); |
// eax: subject string |
+ // ebx: previous index (smi) |
// edx: code |
// ecx: encoding of subject string (1 if ASCII, 0 if two_byte); |
- // Load used arguments before starting to push arguments for call to native |
- // RegExp code to avoid handling changing stack height. |
- __ mov(ebx, Operand(esp, kPreviousIndexOffset)); |
- __ SmiUntag(ebx); // Previous index from smi. |
- |
- // eax: subject string |
- // ebx: previous index |
- // edx: code |
- // ecx: encoding of subject string (1 if ASCII 0 if two_byte); |
// All checks done. Now push arguments for native regexp code. |
Counters* counters = masm->isolate()->counters(); |
__ IncrementCounter(counters->regexp_entry_native(), 1); |
@@ -4043,6 +4013,7 @@ void RegExpExecStub::Generate(MacroAssembler* masm) { |
masm->isolate()))); |
// Argument 2: Previous index. |
+ __ SmiUntag(ebx); |
__ mov(Operand(esp, 1 * kPointerSize), ebx); |
// Argument 1: Original subject string. |
@@ -4152,8 +4123,23 @@ void RegExpExecStub::Generate(MacroAssembler* masm) { |
// edx: Number of capture registers |
// Load last_match_info which is still known to be a fast case JSArray. |
+ // Check that the fourth object is a JSArray object. |
__ mov(eax, Operand(esp, kLastMatchInfoOffset)); |
+ __ JumpIfSmi(eax, &runtime); |
+ __ CmpObjectType(eax, JS_ARRAY_TYPE, ebx); |
+ __ j(not_equal, &runtime); |
+ // Check that the JSArray is in fast case. |
__ mov(ebx, FieldOperand(eax, JSArray::kElementsOffset)); |
+ __ mov(eax, FieldOperand(ebx, HeapObject::kMapOffset)); |
+ __ cmp(eax, factory->fixed_array_map()); |
+ __ j(not_equal, &runtime); |
+ // Check that the last match info has space for the capture registers and the |
+ // additional information. |
+ __ mov(eax, FieldOperand(ebx, FixedArray::kLengthOffset)); |
+ __ SmiUntag(eax); |
+ __ sub(eax, Immediate(RegExpImpl::kLastMatchOverhead)); |
+ __ cmp(edx, eax); |
+ __ j(greater, &runtime); |
// ebx: last_match_info backing store (FixedArray) |
// edx: number of capture registers |
@@ -4163,13 +4149,14 @@ void RegExpExecStub::Generate(MacroAssembler* masm) { |
__ SmiUntag(edx); // Number of capture registers back from smi. |
// Store last subject and last input. |
__ mov(eax, Operand(esp, kSubjectOffset)); |
+ __ mov(ecx, eax); |
__ mov(FieldOperand(ebx, RegExpImpl::kLastSubjectOffset), eax); |
__ RecordWriteField(ebx, |
RegExpImpl::kLastSubjectOffset, |
eax, |
edi, |
kDontSaveFPRegs); |
- __ mov(eax, Operand(esp, kSubjectOffset)); |
+ __ mov(eax, ecx); |
__ mov(FieldOperand(ebx, RegExpImpl::kLastInputOffset), eax); |
__ RecordWriteField(ebx, |
RegExpImpl::kLastInputOffset, |
@@ -4207,10 +4194,19 @@ void RegExpExecStub::Generate(MacroAssembler* masm) { |
__ mov(eax, Operand(esp, kLastMatchInfoOffset)); |
__ ret(4 * kPointerSize); |
- // External string. Short external strings have already been ruled out. |
- // eax: subject string (expected to be external) |
- // ebx: scratch |
+ // Do the runtime call to execute the regexp. |
+ __ bind(&runtime); |
+ __ TailCallRuntime(Runtime::kRegExpExec, 4, 1); |
+ |
+ // Deferred code for string handling. |
+ // (7) Not a long external string? If yes, go to (10). |
+ __ bind(¬_seq_nor_cons); |
+ // Compare flags are still set from (3). |
+ __ j(greater, ¬_long_external, Label::kNear); // Go to (10). |
+ |
+ // (8) External string. Short external strings have been ruled out. |
__ bind(&external_string); |
+ // Reload instance type. |
__ mov(ebx, FieldOperand(eax, HeapObject::kMapOffset)); |
__ movzx_b(ebx, FieldOperand(ebx, Map::kInstanceTypeOffset)); |
if (FLAG_debug_code) { |
@@ -4224,13 +4220,38 @@ void RegExpExecStub::Generate(MacroAssembler* masm) { |
STATIC_ASSERT(SeqTwoByteString::kHeaderSize == SeqOneByteString::kHeaderSize); |
__ sub(eax, Immediate(SeqTwoByteString::kHeaderSize - kHeapObjectTag)); |
STATIC_ASSERT(kTwoByteStringTag == 0); |
+ // (8a) Is the external string one byte? If yes, go to (6). |
__ test_b(ebx, kStringEncodingMask); |
- __ j(not_zero, &seq_ascii_string); |
- __ jmp(&seq_two_byte_string); |
+ __ j(not_zero, &seq_one_byte_string); // Goto (6). |
- // Do the runtime call to execute the regexp. |
- __ bind(&runtime); |
- __ TailCallRuntime(Runtime::kRegExpExec, 4, 1); |
+ // eax: sequential subject string (or look-alike, external string) |
+ // edx: original subject string |
+ // ecx: RegExp data (FixedArray) |
+ // (9) Two byte sequential. Load regexp code for one byte. Go to (E). |
+ __ bind(&seq_two_byte_string); |
+ // Load previous index and check range before edx is overwritten. We have |
+ // to use edx instead of eax here because it might have been only made to |
+ // look like a sequential string when it actually is an external string. |
+ __ mov(ebx, Operand(esp, kPreviousIndexOffset)); |
+ __ JumpIfNotSmi(ebx, &runtime); |
+ __ cmp(ebx, FieldOperand(edx, String::kLengthOffset)); |
+ __ j(above_equal, &runtime); |
+ __ mov(edx, FieldOperand(ecx, JSRegExp::kDataUC16CodeOffset)); |
+ __ Set(ecx, Immediate(0)); // Type is two byte. |
+ __ jmp(&check_code); // Go to (E). |
+ |
+ // (10) Not a string or a short external string? If yes, bail out to runtime. |
+ __ bind(¬_long_external); |
+ // Catch non-string subject or short external string. |
+ STATIC_ASSERT(kNotStringTag != 0 && kShortExternalStringTag !=0); |
+ __ test(ebx, Immediate(kIsNotStringMask | kShortExternalStringTag)); |
+ __ j(not_zero, &runtime); |
+ |
+ // (11) Sliced string. Replace subject with parent. Go to (5a). |
+ // Load offset into edi and replace subject string with parent. |
+ __ mov(edi, FieldOperand(eax, SlicedString::kOffsetOffset)); |
+ __ mov(eax, FieldOperand(eax, SlicedString::kParentOffset)); |
+ __ jmp(&check_underlying); // Go to (5a). |
#endif // V8_INTERPRETED_REGEXP |
} |