[turbofan] Introduce a dedicated StringLength operator.

Strings are immutable in JavaScript land (contrast with the runtime,
where we can truncate strings that haven't escaped to JavaScript yet),
so the length of a String is immutable. Thus loading the length of a
String is a pure operation and should be expressed as such (i.e. doesn't
depend on control or effect). The StringLength operator does exactly
this and is hooked up to the effect chain in the EffectControlLinearizer.

This will eventually allow us to simplify the optimization of string
concatention and other operations that are a bit cumbersome in TurboFan
currently, and it will also allow us to optimize string operations
across effectful operations, for example combining multiple invocations
to String#slice with the same inputs.

Bug: v8:5269, v8:6936, v8:7109, v8:7137
Change-Id: Iffcccbb0c7fc4cfe1281c10e7af24b40eba4c987
Reviewed-on: https://chromium-review.googlesource.com/799690
Reviewed-by: Yang Guo <yangguo@chromium.org>
Reviewed-by: Benedikt Meurer <bmeurer@chromium.org>
Commit-Queue: Benedikt Meurer <bmeurer@chromium.org>
Cr-Commit-Position: refs/heads/master@{#49731}
This commit is contained in:
Benedikt Meurer 2017-11-30 07:10:35 +01:00 committed by Commit Bot
parent b43b11f98d
commit 500d7b9315
15 changed files with 52 additions and 35 deletions

View File

@ -860,6 +860,9 @@ bool EffectControlLinearizer::TryWireInStateEffect(Node* node,
case IrOpcode::kStringIndexOf: case IrOpcode::kStringIndexOf:
result = LowerStringIndexOf(node); result = LowerStringIndexOf(node);
break; break;
case IrOpcode::kStringLength:
result = LowerStringLength(node);
break;
case IrOpcode::kStringToNumber: case IrOpcode::kStringToNumber:
result = LowerStringToNumber(node); result = LowerStringToNumber(node);
break; break;
@ -2843,6 +2846,12 @@ Node* EffectControlLinearizer::LowerStringIndexOf(Node* node) {
position, __ NoContextConstant()); position, __ NoContextConstant());
} }
Node* EffectControlLinearizer::LowerStringLength(Node* node) {
Node* subject = node->InputAt(0);
return __ LoadField(AccessBuilder::ForStringLength(), subject);
}
Node* EffectControlLinearizer::LowerStringComparison(Callable const& callable, Node* EffectControlLinearizer::LowerStringComparison(Callable const& callable,
Node* node) { Node* node) {
Node* lhs = node->InputAt(0); Node* lhs = node->InputAt(0);

View File

@ -117,6 +117,7 @@ class V8_EXPORT_PRIVATE EffectControlLinearizer {
Node* LowerStringFromCharCode(Node* node); Node* LowerStringFromCharCode(Node* node);
Node* LowerStringFromCodePoint(Node* node); Node* LowerStringFromCodePoint(Node* node);
Node* LowerStringIndexOf(Node* node); Node* LowerStringIndexOf(Node* node);
Node* LowerStringLength(Node* node);
Node* LowerStringEqual(Node* node); Node* LowerStringEqual(Node* node);
Node* LowerStringLessThan(Node* node); Node* LowerStringLessThan(Node* node);
Node* LowerStringLessThanOrEqual(Node* node); Node* LowerStringLessThanOrEqual(Node* node);

View File

@ -2391,9 +2391,8 @@ Reduction JSBuiltinReducer::ReduceStringCharAt(Node* node) {
} }
// Determine the {receiver} length. // Determine the {receiver} length.
Node* receiver_length = effect = graph()->NewNode( Node* receiver_length =
simplified()->LoadField(AccessBuilder::ForStringLength()), receiver, graph()->NewNode(simplified()->StringLength(), receiver);
effect, control);
// Check if {index} is less than {receiver} length. // Check if {index} is less than {receiver} length.
Node* check = graph()->NewNode(simplified()->NumberLessThan(), index, Node* check = graph()->NewNode(simplified()->NumberLessThan(), index,
@ -2445,9 +2444,8 @@ Reduction JSBuiltinReducer::ReduceStringCharCodeAt(Node* node) {
} }
// Determine the {receiver} length. // Determine the {receiver} length.
Node* receiver_length = effect = graph()->NewNode( Node* receiver_length =
simplified()->LoadField(AccessBuilder::ForStringLength()), receiver, graph()->NewNode(simplified()->StringLength(), receiver);
effect, control);
// Check if {index} is less than {receiver} length. // Check if {index} is less than {receiver} length.
Node* check = graph()->NewNode(simplified()->NumberLessThan(), index, Node* check = graph()->NewNode(simplified()->NumberLessThan(), index,
@ -2577,9 +2575,7 @@ Reduction JSBuiltinReducer::ReduceStringIteratorNext(Node* node) {
Node* index = effect = graph()->NewNode( Node* index = effect = graph()->NewNode(
simplified()->LoadField(AccessBuilder::ForJSStringIteratorIndex()), simplified()->LoadField(AccessBuilder::ForJSStringIteratorIndex()),
receiver, effect, control); receiver, effect, control);
Node* length = effect = graph()->NewNode( Node* length = graph()->NewNode(simplified()->StringLength(), string);
simplified()->LoadField(AccessBuilder::ForStringLength()), string,
effect, control);
// branch0: if (index < length) // branch0: if (index < length)
Node* check0 = Node* check0 =
@ -2670,9 +2666,8 @@ Reduction JSBuiltinReducer::ReduceStringIteratorNext(Node* node) {
simplified()->StringFromCodePoint(UnicodeEncoding::UTF16), vtrue0); simplified()->StringFromCodePoint(UnicodeEncoding::UTF16), vtrue0);
// Update iterator.[[NextIndex]] // Update iterator.[[NextIndex]]
Node* char_length = etrue0 = graph()->NewNode( Node* char_length =
simplified()->LoadField(AccessBuilder::ForStringLength()), vtrue0, graph()->NewNode(simplified()->StringLength(), vtrue0);
etrue0, if_true0);
index = graph()->NewNode(simplified()->NumberAdd(), index, char_length); index = graph()->NewNode(simplified()->NumberAdd(), index, char_length);
etrue0 = graph()->NewNode( etrue0 = graph()->NewNode(
simplified()->StoreField(AccessBuilder::ForJSStringIteratorIndex()), simplified()->StoreField(AccessBuilder::ForJSStringIteratorIndex()),
@ -2721,9 +2716,8 @@ Reduction JSBuiltinReducer::ReduceStringSlice(Node* node) {
if (start_type->Is(type_cache_.kSingletonMinusOne) && if (start_type->Is(type_cache_.kSingletonMinusOne) &&
end_type->Is(Type::Undefined())) { end_type->Is(Type::Undefined())) {
Node* receiver_length = effect = graph()->NewNode( Node* receiver_length =
simplified()->LoadField(AccessBuilder::ForStringLength()), receiver, graph()->NewNode(simplified()->StringLength(), receiver);
effect, control);
Node* check = Node* check =
graph()->NewNode(simplified()->NumberEqual(), receiver_length, graph()->NewNode(simplified()->NumberEqual(), receiver_length,

View File

@ -1065,9 +1065,7 @@ Reduction JSNativeContextSpecialization::ReduceElementAccess(
effect, control); effect, control);
// Determine the {receiver} length. // Determine the {receiver} length.
Node* length = effect = graph()->NewNode( Node* length = graph()->NewNode(simplified()->StringLength(), receiver);
simplified()->LoadField(AccessBuilder::ForStringLength()), receiver,
effect, control);
// Load the single character string from {receiver} or yield undefined // Load the single character string from {receiver} or yield undefined
// if the {index} is out of bounds (depending on the {load_mode}). // if the {index} is out of bounds (depending on the {load_mode}).

View File

@ -648,8 +648,8 @@ Reduction JSTypedLowering::ReduceCreateConsString(Node* node) {
} }
// Determine the {first} length. // Determine the {first} length.
Node* first_length = BuildGetStringLength(first, &effect, control); Node* first_length = BuildGetStringLength(first);
Node* second_length = BuildGetStringLength(second, &effect, control); Node* second_length = BuildGetStringLength(second);
// Compute the resulting length. // Compute the resulting length.
Node* length = Node* length =
@ -708,15 +708,14 @@ Reduction JSTypedLowering::ReduceCreateConsString(Node* node) {
return Replace(value); return Replace(value);
} }
Node* JSTypedLowering::BuildGetStringLength(Node* value, Node** effect, Node* JSTypedLowering::BuildGetStringLength(Node* value) {
Node* control) { // TODO(bmeurer): Get rid of this hack and instead have a way to
// express the string length in the types.
HeapObjectMatcher m(value); HeapObjectMatcher m(value);
Node* length = Node* length =
(m.HasValue() && m.Value()->IsString()) (m.HasValue() && m.Value()->IsString())
? jsgraph()->Constant(Handle<String>::cast(m.Value())->length()) ? jsgraph()->Constant(Handle<String>::cast(m.Value())->length())
: (*effect) = graph()->NewNode( : graph()->NewNode(simplified()->StringLength(), value);
simplified()->LoadField(AccessBuilder::ForStringLength()),
value, *effect, control);
return length; return length;
} }
@ -1118,16 +1117,12 @@ Reduction JSTypedLowering::ReduceJSLoadNamed(Node* node) {
DCHECK_EQ(IrOpcode::kJSLoadNamed, node->opcode()); DCHECK_EQ(IrOpcode::kJSLoadNamed, node->opcode());
Node* receiver = NodeProperties::GetValueInput(node, 0); Node* receiver = NodeProperties::GetValueInput(node, 0);
Type* receiver_type = NodeProperties::GetType(receiver); Type* receiver_type = NodeProperties::GetType(receiver);
Node* effect = NodeProperties::GetEffectInput(node);
Node* control = NodeProperties::GetControlInput(node);
Handle<Name> name = NamedAccessOf(node->op()).name(); Handle<Name> name = NamedAccessOf(node->op()).name();
// Optimize "length" property of strings. // Optimize "length" property of strings.
if (name.is_identical_to(factory()->length_string()) && if (name.is_identical_to(factory()->length_string()) &&
receiver_type->Is(Type::String())) { receiver_type->Is(Type::String())) {
Node* value = effect = graph()->NewNode( Node* value = graph()->NewNode(simplified()->StringLength(), receiver);
simplified()->LoadField(AccessBuilder::ForStringLength()), receiver, ReplaceWithValue(node, value);
effect, control);
ReplaceWithValue(node, value, effect);
return Replace(value); return Replace(value);
} }
return NoChange(); return NoChange();

View File

@ -85,8 +85,8 @@ class V8_EXPORT_PRIVATE JSTypedLowering final
// Helper for ReduceJSLoadModule and ReduceJSStoreModule. // Helper for ReduceJSLoadModule and ReduceJSStoreModule.
Node* BuildGetModuleCell(Node* node); Node* BuildGetModuleCell(Node* node);
// Helpers for ReduceJSCreateConsString and ReduceJSStringConcat. // Helpers for ReduceJSCreateConsString.
Node* BuildGetStringLength(Node* value, Node** effect, Node* control); Node* BuildGetStringLength(Node* value);
Factory* factory() const; Factory* factory() const;
Graph* graph() const; Graph* graph() const;

View File

@ -335,6 +335,7 @@
V(StringFromCharCode) \ V(StringFromCharCode) \
V(StringFromCodePoint) \ V(StringFromCodePoint) \
V(StringIndexOf) \ V(StringIndexOf) \
V(StringLength) \
V(StringToLowerCaseIntl) \ V(StringToLowerCaseIntl) \
V(StringToUpperCaseIntl) \ V(StringToUpperCaseIntl) \
V(CheckBounds) \ V(CheckBounds) \

View File

@ -2415,6 +2415,14 @@ class RepresentationSelector {
SetOutput(node, MachineRepresentation::kTaggedSigned); SetOutput(node, MachineRepresentation::kTaggedSigned);
return; return;
} }
case IrOpcode::kStringLength: {
// TODO(bmeurer): The input representation should be TaggedPointer.
// Fix this once we have a dedicated StringConcat/JSStringAdd
// operator, which marks it's output as TaggedPointer properly.
VisitUnop(node, UseInfo::AnyTagged(),
MachineRepresentation::kTaggedSigned);
return;
}
case IrOpcode::kStringToLowerCaseIntl: case IrOpcode::kStringToLowerCaseIntl:
case IrOpcode::kStringToUpperCaseIntl: { case IrOpcode::kStringToUpperCaseIntl: {
VisitUnop(node, UseInfo::AnyTagged(), VisitUnop(node, UseInfo::AnyTagged(),

View File

@ -590,6 +590,7 @@ DeoptimizeReason DeoptimizeReasonOf(const Operator* op) {
V(SeqStringCharCodeAt, Operator::kNoProperties, 2, 1) \ V(SeqStringCharCodeAt, Operator::kNoProperties, 2, 1) \
V(StringFromCharCode, Operator::kNoProperties, 1, 0) \ V(StringFromCharCode, Operator::kNoProperties, 1, 0) \
V(StringIndexOf, Operator::kNoProperties, 3, 0) \ V(StringIndexOf, Operator::kNoProperties, 3, 0) \
V(StringLength, Operator::kNoProperties, 1, 0) \
V(StringToLowerCaseIntl, Operator::kNoProperties, 1, 0) \ V(StringToLowerCaseIntl, Operator::kNoProperties, 1, 0) \
V(StringToUpperCaseIntl, Operator::kNoProperties, 1, 0) \ V(StringToUpperCaseIntl, Operator::kNoProperties, 1, 0) \
V(TypeOf, Operator::kNoProperties, 1, 1) \ V(TypeOf, Operator::kNoProperties, 1, 1) \

View File

@ -405,6 +405,7 @@ class V8_EXPORT_PRIVATE SimplifiedOperatorBuilder final
const Operator* StringFromCharCode(); const Operator* StringFromCharCode();
const Operator* StringFromCodePoint(UnicodeEncoding encoding); const Operator* StringFromCodePoint(UnicodeEncoding encoding);
const Operator* StringIndexOf(); const Operator* StringIndexOf();
const Operator* StringLength();
const Operator* StringToLowerCaseIntl(); const Operator* StringToLowerCaseIntl();
const Operator* StringToUpperCaseIntl(); const Operator* StringToUpperCaseIntl();

View File

@ -1978,6 +1978,10 @@ Type* Typer::Visitor::TypeStringFromCodePoint(Node* node) {
Type* Typer::Visitor::TypeStringIndexOf(Node* node) { UNREACHABLE(); } Type* Typer::Visitor::TypeStringIndexOf(Node* node) { UNREACHABLE(); }
Type* Typer::Visitor::TypeStringLength(Node* node) {
return typer_->cache_.kStringLengthType;
}
Type* Typer::Visitor::TypeCheckBounds(Node* node) { Type* Typer::Visitor::TypeCheckBounds(Node* node) {
Type* index = Operand(node, 0); Type* index = Operand(node, 0);
Type* length = Operand(node, 1); Type* length = Operand(node, 1);

View File

@ -1058,6 +1058,10 @@ void Verifier::Visitor::Check(Node* node, const AllNodes& all) {
CheckValueInputIs(node, 2, Type::SignedSmall()); CheckValueInputIs(node, 2, Type::SignedSmall());
CheckTypeIs(node, Type::SignedSmall()); CheckTypeIs(node, Type::SignedSmall());
break; break;
case IrOpcode::kStringLength:
CheckValueInputIs(node, 0, Type::String());
CheckTypeIs(node, TypeCache::Get().kStringLengthType);
break;
case IrOpcode::kStringToLowerCaseIntl: case IrOpcode::kStringToLowerCaseIntl:
case IrOpcode::kStringToUpperCaseIntl: case IrOpcode::kStringToUpperCaseIntl:
CheckValueInputIs(node, 0, Type::String()); CheckValueInputIs(node, 0, Type::String());

View File

@ -382,8 +382,7 @@ TEST_F(JSTypedLoweringTest, JSLoadNamedStringLength) {
Reduce(graph()->NewNode(javascript()->LoadNamed(name, feedback), receiver, Reduce(graph()->NewNode(javascript()->LoadNamed(name, feedback), receiver,
context, EmptyFrameState(), effect, control)); context, EmptyFrameState(), effect, control));
ASSERT_TRUE(r.Changed()); ASSERT_TRUE(r.Changed());
EXPECT_THAT(r.replacement(), IsLoadField(AccessBuilder::ForStringLength(), EXPECT_THAT(r.replacement(), IsStringLength(receiver));
receiver, effect, control));
} }

View File

@ -2182,6 +2182,7 @@ IS_UNOP_MATCHER(ObjectIsReceiver)
IS_UNOP_MATCHER(ObjectIsSmi) IS_UNOP_MATCHER(ObjectIsSmi)
IS_UNOP_MATCHER(ObjectIsUndetectable) IS_UNOP_MATCHER(ObjectIsUndetectable)
IS_UNOP_MATCHER(StringFromCharCode) IS_UNOP_MATCHER(StringFromCharCode)
IS_UNOP_MATCHER(StringLength)
IS_UNOP_MATCHER(Word32Clz) IS_UNOP_MATCHER(Word32Clz)
IS_UNOP_MATCHER(Word32Ctz) IS_UNOP_MATCHER(Word32Ctz)
IS_UNOP_MATCHER(Word32Popcnt) IS_UNOP_MATCHER(Word32Popcnt)

View File

@ -272,6 +272,7 @@ Matcher<Node*> IsNumberTan(const Matcher<Node*>& value_matcher);
Matcher<Node*> IsNumberTanh(const Matcher<Node*>& value_matcher); Matcher<Node*> IsNumberTanh(const Matcher<Node*>& value_matcher);
Matcher<Node*> IsNumberTrunc(const Matcher<Node*>& value_matcher); Matcher<Node*> IsNumberTrunc(const Matcher<Node*>& value_matcher);
Matcher<Node*> IsStringFromCharCode(const Matcher<Node*>& value_matcher); Matcher<Node*> IsStringFromCharCode(const Matcher<Node*>& value_matcher);
Matcher<Node*> IsStringLength(const Matcher<Node*>& value_matcher);
Matcher<Node*> IsAllocate(const Matcher<Node*>& size_matcher, Matcher<Node*> IsAllocate(const Matcher<Node*>& size_matcher,
const Matcher<Node*>& effect_matcher, const Matcher<Node*>& effect_matcher,
const Matcher<Node*>& control_matcher); const Matcher<Node*>& control_matcher);