[regexp] Named capture support for string replacements

This implements support for named captures in
RegExp.prototype[@@replace] for when the replaceValue is not callable.

Named captures can be referenced from replacement strings by using the
"$<name>" syntax. A couple of examples:

let re = /(?<fst>.)(?<snd>.)/u;
"abcd".replace(re, "$<snd>$<fst>")  // "bacd"
"abcd".replace(re, "$2$1")     // "bacd" (numbered refs work as always)
"abcd".replace(re, "$<snd")    // SyntaxError (unterminated named ref)
"abcd".replace(re, "$<42$1>")  // "cd" (invalid name)
"abcd".replace(re, "$<thd>")   // "cd" (non-existent name)
"abcd".replace(/(?<fst>.)|(?<snd>.)/u, "$<snd>")  // "cd" (non-matched capture)

Support is currently behind the --harmony-regexp-named-captures flag.

BUG=v8:5437

Review-Url: https://codereview.chromium.org/2775303002
Cr-Commit-Position: refs/heads/master@{#44171}
This commit is contained in:
jgruber 2017-03-28 01:02:03 -07:00 committed by Commit bot
parent 54a1942a84
commit 17f13863b6
9 changed files with 362 additions and 58 deletions

View File

@ -456,6 +456,7 @@ class ErrorUtils : public AllStatic {
T(ReduceNoInitial, "Reduce of empty array with no initial value") \ T(ReduceNoInitial, "Reduce of empty array with no initial value") \
T(RegExpFlags, \ T(RegExpFlags, \
"Cannot supply flags when constructing one RegExp from another") \ "Cannot supply flags when constructing one RegExp from another") \
T(RegExpInvalidReplaceString, "Invalid replacement string: '%'") \
T(RegExpNonObject, "% getter called on non-object %") \ T(RegExpNonObject, "% getter called on non-object %") \
T(RegExpNonRegExp, "% getter called on non-RegExp object") \ T(RegExpNonRegExp, "% getter called on non-RegExp object") \
T(ReinitializeIntl, "Trying to re-initialize % object.") \ T(ReinitializeIntl, "Trying to re-initialize % object.") \

View File

@ -11403,6 +11403,8 @@ int String::IndexOf(Isolate* isolate, Handle<String> receiver,
MaybeHandle<String> String::GetSubstitution(Isolate* isolate, Match* match, MaybeHandle<String> String::GetSubstitution(Isolate* isolate, Match* match,
Handle<String> replacement) { Handle<String> replacement) {
DCHECK_IMPLIES(match->HasNamedCaptures(), FLAG_harmony_regexp_named_captures);
Factory* factory = isolate->factory(); Factory* factory = isolate->factory();
const int replacement_length = replacement->length(); const int replacement_length = replacement->length();
@ -11489,6 +11491,37 @@ MaybeHandle<String> String::GetSubstitution(Isolate* isolate, Match* match,
continue_from_ix = peek_ix + advance; continue_from_ix = peek_ix + advance;
break; break;
} }
case '<': { // $<name> - named capture
if (!match->HasNamedCaptures()) {
builder.AppendCharacter('$');
continue_from_ix = peek_ix;
break;
}
Handle<String> bracket_string =
factory->LookupSingleCharacterStringFromCode('>');
const int closing_bracket_ix =
String::IndexOf(isolate, replacement, bracket_string, peek_ix + 1);
if (closing_bracket_ix == -1) {
THROW_NEW_ERROR(
isolate,
NewSyntaxError(MessageTemplate::kRegExpInvalidReplaceString,
replacement),
String);
}
Handle<String> capture_name =
factory->NewSubString(replacement, peek_ix + 1, closing_bracket_ix);
bool capture_exists;
Handle<String> capture;
ASSIGN_RETURN_ON_EXCEPTION(
isolate, capture,
match->GetNamedCapture(capture_name, &capture_exists), String);
if (capture_exists) builder.AppendString(capture);
continue_from_ix = closing_bracket_ix + 1;
break;
}
default: default:
builder.AppendCharacter('$'); builder.AppendCharacter('$');
continue_from_ix = peek_ix; continue_from_ix = peek_ix;
@ -11659,6 +11692,15 @@ bool String::IsUtf8EqualTo(Vector<const char> str, bool allow_prefix_match) {
return (allow_prefix_match || i == slen) && remaining_in_str == 0; return (allow_prefix_match || i == slen) && remaining_in_str == 0;
} }
template <>
bool String::IsEqualTo(Vector<const uint8_t> str) {
return IsOneByteEqualTo(str);
}
template <>
bool String::IsEqualTo(Vector<const uc16> str) {
return IsTwoByteEqualTo(str);
}
bool String::IsOneByteEqualTo(Vector<const uint8_t> str) { bool String::IsOneByteEqualTo(Vector<const uint8_t> str) {
int slen = length(); int slen = length();

View File

@ -8269,6 +8269,7 @@ class JSRegExp: public JSObject {
Handle<String> flags_string); Handle<String> flags_string);
inline Type TypeTag(); inline Type TypeTag();
// Number of captures (without the match itself).
inline int CaptureCount(); inline int CaptureCount();
inline Flags GetFlags(); inline Flags GetFlags();
inline String* Pattern(); inline String* Pattern();
@ -8341,7 +8342,7 @@ class JSRegExp: public JSObject {
// Number of captures in the compiled regexp. // Number of captures in the compiled regexp.
static const int kIrregexpCaptureCountIndex = kDataIndex + 5; static const int kIrregexpCaptureCountIndex = kDataIndex + 5;
// Maps names of named capture groups (at indices 2i) to their corresponding // Maps names of named capture groups (at indices 2i) to their corresponding
// capture group indices (at indices 2i + 1). // (1-based) capture group indices (at indices 2i + 1).
static const int kIrregexpCaptureNameMapIndex = kDataIndex + 6; static const int kIrregexpCaptureNameMapIndex = kDataIndex + 6;
static const int kIrregexpDataSize = kIrregexpCaptureNameMapIndex + 1; static const int kIrregexpDataSize = kIrregexpCaptureNameMapIndex + 1;
@ -9196,10 +9197,15 @@ class String: public Name {
class Match { class Match {
public: public:
virtual Handle<String> GetMatch() = 0; virtual Handle<String> GetMatch() = 0;
virtual MaybeHandle<String> GetCapture(int i, bool* capture_exists) = 0;
virtual Handle<String> GetPrefix() = 0; virtual Handle<String> GetPrefix() = 0;
virtual Handle<String> GetSuffix() = 0; virtual Handle<String> GetSuffix() = 0;
virtual int CaptureCount() = 0; virtual int CaptureCount() = 0;
virtual bool HasNamedCaptures() = 0;
virtual MaybeHandle<String> GetCapture(int i, bool* capture_exists) = 0;
virtual MaybeHandle<String> GetNamedCapture(Handle<String> name,
bool* capture_exists) = 0;
virtual ~Match() {} virtual ~Match() {}
}; };
@ -9214,6 +9220,11 @@ class String: public Name {
inline bool Equals(String* other); inline bool Equals(String* other);
inline static bool Equals(Handle<String> one, Handle<String> two); inline static bool Equals(Handle<String> one, Handle<String> two);
bool IsUtf8EqualTo(Vector<const char> str, bool allow_prefix_match = false); bool IsUtf8EqualTo(Vector<const char> str, bool allow_prefix_match = false);
// Dispatches to Is{One,Two}ByteEqualTo.
template <typename Char>
bool IsEqualTo(Vector<const Char> str);
bool IsOneByteEqualTo(Vector<const uint8_t> str); bool IsOneByteEqualTo(Vector<const uint8_t> str);
bool IsTwoByteEqualTo(Vector<const uc16> str); bool IsTwoByteEqualTo(Vector<const uc16> str);

View File

@ -19,14 +19,45 @@
namespace v8 { namespace v8 {
namespace internal { namespace internal {
namespace {
// Looks up the capture of the given name. Returns the (1-based) numbered
// capture index or -1 on failure.
int LookupNamedCapture(std::function<bool(String*)> name_matches,
FixedArray* capture_name_map) {
// TODO(jgruber): Sort capture_name_map and do binary search via
// internalized strings.
int maybe_capture_index = -1;
const int named_capture_count = capture_name_map->length() >> 1;
for (int j = 0; j < named_capture_count; j++) {
// The format of {capture_name_map} is documented at
// JSRegExp::kIrregexpCaptureNameMapIndex.
const int name_ix = j * 2;
const int index_ix = j * 2 + 1;
String* capture_name = String::cast(capture_name_map->get(name_ix));
if (!name_matches(capture_name)) continue;
maybe_capture_index = Smi::cast(capture_name_map->get(index_ix))->value();
break;
}
return maybe_capture_index;
}
} // namespace
class CompiledReplacement { class CompiledReplacement {
public: public:
explicit CompiledReplacement(Zone* zone) explicit CompiledReplacement(Zone* zone)
: parts_(1, zone), replacement_substrings_(0, zone), zone_(zone) {} : parts_(1, zone), replacement_substrings_(0, zone), zone_(zone) {}
// Return whether the replacement is simple. // Return whether the replacement is simple. Can also fail and return Nothing
bool Compile(Handle<String> replacement, int capture_count, // if the given replacement string is invalid (and requires throwing a
int subject_length); // SyntaxError).
Maybe<bool> Compile(Handle<JSRegExp> regexp, Handle<String> replacement,
int capture_count, int subject_length);
// Use Apply only if Compile returned false. // Use Apply only if Compile returned false.
void Apply(ReplacementStringBuilder* builder, int match_from, int match_to, void Apply(ReplacementStringBuilder* builder, int match_from, int match_to,
@ -44,6 +75,7 @@ class CompiledReplacement {
SUBJECT_CAPTURE, SUBJECT_CAPTURE,
REPLACEMENT_SUBSTRING, REPLACEMENT_SUBSTRING,
REPLACEMENT_STRING, REPLACEMENT_STRING,
EMPTY,
NUMBER_OF_PART_TYPES NUMBER_OF_PART_TYPES
}; };
@ -68,6 +100,7 @@ class CompiledReplacement {
DCHECK(to > from); DCHECK(to > from);
return ReplacementPart(-from, to); return ReplacementPart(-from, to);
} }
static inline ReplacementPart Empty() { return ReplacementPart(EMPTY, 0); }
// If tag <= 0 then it is the negation of a start index of a substring of // If tag <= 0 then it is the negation of a start index of a substring of
// the replacement pattern, otherwise it's a value from PartType. // the replacement pattern, otherwise it's a value from PartType.
@ -80,7 +113,8 @@ class CompiledReplacement {
int tag; int tag;
// The data value's interpretation depends on the value of tag: // The data value's interpretation depends on the value of tag:
// tag == SUBJECT_PREFIX || // tag == SUBJECT_PREFIX ||
// tag == SUBJECT_SUFFIX: data is unused. // tag == SUBJECT_SUFFIX ||
// tag == EMPTY: data is unused.
// tag == SUBJECT_CAPTURE: data is the number of the capture. // tag == SUBJECT_CAPTURE: data is the number of the capture.
// tag == REPLACEMENT_SUBSTRING || // tag == REPLACEMENT_SUBSTRING ||
// tag == REPLACEMENT_STRING: data is index into array of substrings // tag == REPLACEMENT_STRING: data is index into array of substrings
@ -93,9 +127,17 @@ class CompiledReplacement {
}; };
template <typename Char> template <typename Char>
bool ParseReplacementPattern(ZoneList<ReplacementPart>* parts, Maybe<bool> ParseReplacementPattern(ZoneList<ReplacementPart>* parts,
Vector<Char> characters, int capture_count, Vector<Char> characters,
int subject_length, Zone* zone) { FixedArray* capture_name_map,
int capture_count, int subject_length,
Zone* zone) {
// Equivalent to String::GetSubstitution, except that this method converts
// the replacement string into an internal representation that avoids
// repeated parsing when used repeatedly.
DCHECK_IMPLIES(capture_name_map != nullptr,
FLAG_harmony_regexp_named_captures);
int length = characters.length(); int length = characters.length();
int last = 0; int last = 0;
for (int i = 0; i < length; i++) { for (int i = 0; i < length; i++) {
@ -183,6 +225,60 @@ class CompiledReplacement {
i = next_index; i = next_index;
break; break;
} }
case '<': {
if (capture_name_map == nullptr) {
i = next_index;
break;
}
// Scan until the next '>', throwing a SyntaxError exception if one
// is not found, and let the enclosed substring be groupName.
const int name_start_index = next_index + 1;
int closing_bracket_index = -1;
for (int j = name_start_index; j < length; j++) {
if (characters[j] == '>') {
closing_bracket_index = j;
break;
}
}
// Throw a SyntaxError for invalid replacement strings.
if (closing_bracket_index == -1) return Nothing<bool>();
Vector<Char> requested_name =
characters.SubVector(name_start_index, closing_bracket_index);
// Let capture be ? Get(namedCaptures, groupName).
int capture_index = LookupNamedCapture(
[=](String* capture_name) {
return capture_name->IsEqualTo(requested_name);
},
capture_name_map);
// If capture is undefined, replace the text through the following
// '>' with the empty string.
// Otherwise, replace the text through the following '>' with
// ? ToString(capture).
DCHECK_IMPLIES(
capture_index != -1,
1 <= capture_index && capture_index <= capture_count);
ReplacementPart replacement =
(capture_index == -1)
? ReplacementPart::Empty()
: ReplacementPart::SubjectCapture(capture_index);
if (i > last) {
parts->Add(ReplacementPart::ReplacementSubString(last, i), zone);
}
parts->Add(replacement, zone);
last = closing_bracket_index + 1;
i = closing_bracket_index;
break;
}
default: default:
i = next_index; i = next_index;
break; break;
@ -192,12 +288,12 @@ class CompiledReplacement {
if (length > last) { if (length > last) {
if (last == 0) { if (last == 0) {
// Replacement is simple. Do not use Apply to do the replacement. // Replacement is simple. Do not use Apply to do the replacement.
return true; return Just(true);
} else { } else {
parts->Add(ReplacementPart::ReplacementSubString(last, length), zone); parts->Add(ReplacementPart::ReplacementSubString(last, length), zone);
} }
} }
return false; return Just(false);
} }
ZoneList<ReplacementPart> parts_; ZoneList<ReplacementPart> parts_;
@ -205,23 +301,37 @@ class CompiledReplacement {
Zone* zone_; Zone* zone_;
}; };
Maybe<bool> CompiledReplacement::Compile(Handle<JSRegExp> regexp,
bool CompiledReplacement::Compile(Handle<String> replacement, int capture_count, Handle<String> replacement,
int capture_count,
int subject_length) { int subject_length) {
{ {
DisallowHeapAllocation no_gc; DisallowHeapAllocation no_gc;
String::FlatContent content = replacement->GetFlatContent(); String::FlatContent content = replacement->GetFlatContent();
DCHECK(content.IsFlat()); DCHECK(content.IsFlat());
bool simple = false;
FixedArray* capture_name_map = nullptr;
if (capture_count > 0) {
DCHECK_EQ(regexp->TypeTag(), JSRegExp::IRREGEXP);
Object* maybe_capture_name_map = regexp->CaptureNameMap();
if (maybe_capture_name_map->IsFixedArray()) {
DCHECK(FLAG_harmony_regexp_named_captures);
capture_name_map = FixedArray::cast(maybe_capture_name_map);
}
}
Maybe<bool> simple = Nothing<bool>();
if (content.IsOneByte()) { if (content.IsOneByte()) {
simple = ParseReplacementPattern(&parts_, content.ToOneByteVector(), simple = ParseReplacementPattern(&parts_, content.ToOneByteVector(),
capture_count, subject_length, zone()); capture_name_map, capture_count,
subject_length, zone());
} else { } else {
DCHECK(content.IsTwoByte()); DCHECK(content.IsTwoByte());
simple = ParseReplacementPattern(&parts_, content.ToUC16Vector(), simple = ParseReplacementPattern(&parts_, content.ToUC16Vector(),
capture_count, subject_length, zone()); capture_name_map, capture_count,
subject_length, zone());
} }
if (simple) return true; if (simple.IsNothing() || simple.FromJust()) return simple;
} }
Isolate* isolate = replacement->GetIsolate(); Isolate* isolate = replacement->GetIsolate();
@ -243,7 +353,7 @@ bool CompiledReplacement::Compile(Handle<String> replacement, int capture_count,
substring_index++; substring_index++;
} }
} }
return false; return Just(false);
} }
@ -276,6 +386,8 @@ void CompiledReplacement::Apply(ReplacementStringBuilder* builder,
case REPLACEMENT_STRING: case REPLACEMENT_STRING:
builder->AddString(replacement_substrings_[part.data]); builder->AddString(replacement_substrings_[part.data]);
break; break;
case EMPTY:
break;
default: default:
UNREACHABLE(); UNREACHABLE();
} }
@ -491,14 +603,27 @@ MUST_USE_RESULT static Object* StringReplaceGlobalRegExpWithString(
int capture_count = regexp->CaptureCount(); int capture_count = regexp->CaptureCount();
int subject_length = subject->length(); int subject_length = subject->length();
JSRegExp::Type typeTag = regexp->TypeTag();
if (typeTag == JSRegExp::IRREGEXP) {
// Ensure the RegExp is compiled so we can access the capture-name map.
RegExpImpl::IrregexpPrepare(regexp, subject);
}
// CompiledReplacement uses zone allocation. // CompiledReplacement uses zone allocation.
Zone zone(isolate->allocator(), ZONE_NAME); Zone zone(isolate->allocator(), ZONE_NAME);
CompiledReplacement compiled_replacement(&zone); CompiledReplacement compiled_replacement(&zone);
bool simple_replace = Maybe<bool> maybe_simple_replace = compiled_replacement.Compile(
compiled_replacement.Compile(replacement, capture_count, subject_length); regexp, replacement, capture_count, subject_length);
if (maybe_simple_replace.IsNothing()) {
THROW_NEW_ERROR_RETURN_FAILURE(
isolate, NewSyntaxError(MessageTemplate::kRegExpInvalidReplaceString,
replacement));
}
const bool simple_replace = maybe_simple_replace.FromJust();
// Shortcut for simple non-regexp global replacements // Shortcut for simple non-regexp global replacements
if (regexp->TypeTag() == JSRegExp::ATOM && simple_replace) { if (typeTag == JSRegExp::ATOM && simple_replace) {
if (subject->HasOnlyOneByteChars() && replacement->HasOnlyOneByteChars()) { if (subject->HasOnlyOneByteChars() && replacement->HasOnlyOneByteChars()) {
return StringReplaceGlobalAtomRegExpWithString<SeqOneByteString>( return StringReplaceGlobalAtomRegExpWithString<SeqOneByteString>(
isolate, subject, regexp, replacement, last_match_info); isolate, subject, regexp, replacement, last_match_info);
@ -649,7 +774,7 @@ MUST_USE_RESULT static Object* StringReplaceGlobalRegExpWithEmptyString(
Heap* heap = isolate->heap(); Heap* heap = isolate->heap();
// The trimming is performed on a newly allocated object, which is on a // The trimming is performed on a newly allocated object, which is on a
// fresly allocated page or on an already swept page. Hence, the sweeper // freshly allocated page or on an already swept page. Hence, the sweeper
// thread can not get confused with the filler creation. No synchronization // thread can not get confused with the filler creation. No synchronization
// needed. // needed.
// TODO(hpayer): We should shrink the large object page if the size // TODO(hpayer): We should shrink the large object page if the size
@ -843,23 +968,28 @@ namespace {
class MatchInfoBackedMatch : public String::Match { class MatchInfoBackedMatch : public String::Match {
public: public:
MatchInfoBackedMatch(Isolate* isolate, Handle<String> subject, MatchInfoBackedMatch(Isolate* isolate, Handle<JSRegExp> regexp,
Handle<String> subject,
Handle<RegExpMatchInfo> match_info) Handle<RegExpMatchInfo> match_info)
: isolate_(isolate), match_info_(match_info) { : isolate_(isolate), match_info_(match_info) {
subject_ = String::Flatten(subject); subject_ = String::Flatten(subject);
if (regexp->TypeTag() == JSRegExp::IRREGEXP) {
Object* o = regexp->CaptureNameMap();
has_named_captures_ = o->IsFixedArray();
if (has_named_captures_) {
DCHECK(FLAG_harmony_regexp_named_captures);
capture_name_map_ = handle(FixedArray::cast(o));
}
} else {
has_named_captures_ = false;
}
} }
Handle<String> GetMatch() override { Handle<String> GetMatch() override {
return RegExpUtils::GenericCaptureGetter(isolate_, match_info_, 0, nullptr); return RegExpUtils::GenericCaptureGetter(isolate_, match_info_, 0, nullptr);
} }
MaybeHandle<String> GetCapture(int i, bool* capture_exists) override {
Handle<Object> capture_obj = RegExpUtils::GenericCaptureGetter(
isolate_, match_info_, i, capture_exists);
return (*capture_exists) ? Object::ToString(isolate_, capture_obj)
: isolate_->factory()->empty_string();
}
Handle<String> GetPrefix() override { Handle<String> GetPrefix() override {
const int match_start = match_info_->Capture(0); const int match_start = match_info_->Capture(0);
return isolate_->factory()->NewSubString(subject_, 0, match_start); return isolate_->factory()->NewSubString(subject_, 0, match_start);
@ -871,42 +1001,63 @@ class MatchInfoBackedMatch : public String::Match {
subject_->length()); subject_->length());
} }
bool HasNamedCaptures() override { return has_named_captures_; }
int CaptureCount() override { int CaptureCount() override {
return match_info_->NumberOfCaptureRegisters() / 2; return match_info_->NumberOfCaptureRegisters() / 2;
} }
virtual ~MatchInfoBackedMatch() {} MaybeHandle<String> GetCapture(int i, bool* capture_exists) override {
Handle<Object> capture_obj = RegExpUtils::GenericCaptureGetter(
isolate_, match_info_, i, capture_exists);
return (*capture_exists) ? Object::ToString(isolate_, capture_obj)
: isolate_->factory()->empty_string();
}
MaybeHandle<String> GetNamedCapture(Handle<String> name,
bool* capture_exists) override {
DCHECK(has_named_captures_);
const int capture_index = LookupNamedCapture(
[=](String* capture_name) { return capture_name->Equals(*name); },
*capture_name_map_);
if (capture_index == -1) {
*capture_exists = false;
return name; // Arbitrary string handle.
}
DCHECK(1 <= capture_index && capture_index <= CaptureCount());
return GetCapture(capture_index, capture_exists);
}
private: private:
Isolate* isolate_; Isolate* isolate_;
Handle<String> subject_; Handle<String> subject_;
Handle<RegExpMatchInfo> match_info_; Handle<RegExpMatchInfo> match_info_;
bool has_named_captures_;
Handle<FixedArray> capture_name_map_;
}; };
class VectorBackedMatch : public String::Match { class VectorBackedMatch : public String::Match {
public: public:
VectorBackedMatch(Isolate* isolate, Handle<String> subject, VectorBackedMatch(Isolate* isolate, Handle<String> subject,
Handle<String> match, int match_position, Handle<String> match, int match_position,
std::vector<Handle<Object>>* captures) std::vector<Handle<Object>>* captures,
Handle<Object> groups_obj)
: isolate_(isolate), : isolate_(isolate),
match_(match), match_(match),
match_position_(match_position), match_position_(match_position),
captures_(captures) { captures_(captures) {
subject_ = String::Flatten(subject); subject_ = String::Flatten(subject);
DCHECK(groups_obj->IsUndefined(isolate) || groups_obj->IsJSReceiver());
has_named_captures_ = !groups_obj->IsUndefined(isolate);
if (has_named_captures_) groups_obj_ = Handle<JSReceiver>::cast(groups_obj);
} }
Handle<String> GetMatch() override { return match_; } Handle<String> GetMatch() override { return match_; }
MaybeHandle<String> GetCapture(int i, bool* capture_exists) override {
Handle<Object> capture_obj = captures_->at(i);
if (capture_obj->IsUndefined(isolate_)) {
*capture_exists = false;
return isolate_->factory()->empty_string();
}
*capture_exists = true;
return Object::ToString(isolate_, capture_obj);
}
Handle<String> GetPrefix() override { Handle<String> GetPrefix() override {
return isolate_->factory()->NewSubString(subject_, 0, match_position_); return isolate_->factory()->NewSubString(subject_, 0, match_position_);
} }
@ -917,9 +1068,34 @@ class VectorBackedMatch : public String::Match {
subject_->length()); subject_->length());
} }
bool HasNamedCaptures() override { return has_named_captures_; }
int CaptureCount() override { return static_cast<int>(captures_->size()); } int CaptureCount() override { return static_cast<int>(captures_->size()); }
virtual ~VectorBackedMatch() {} MaybeHandle<String> GetCapture(int i, bool* capture_exists) override {
Handle<Object> capture_obj = captures_->at(i);
if (capture_obj->IsUndefined(isolate_)) {
*capture_exists = false;
return isolate_->factory()->empty_string();
}
*capture_exists = true;
return Object::ToString(isolate_, capture_obj);
}
MaybeHandle<String> GetNamedCapture(Handle<String> name,
bool* capture_exists) override {
DCHECK(has_named_captures_);
Handle<Object> capture_obj;
ASSIGN_RETURN_ON_EXCEPTION(isolate_, capture_obj,
Object::GetProperty(groups_obj_, name), String);
if (capture_obj->IsUndefined(isolate_)) {
*capture_exists = false;
return name;
} else {
*capture_exists = true;
return Object::ToString(isolate_, capture_obj);
}
}
private: private:
Isolate* isolate_; Isolate* isolate_;
@ -927,6 +1103,9 @@ class VectorBackedMatch : public String::Match {
Handle<String> match_; Handle<String> match_;
const int match_position_; const int match_position_;
std::vector<Handle<Object>>* captures_; std::vector<Handle<Object>>* captures_;
bool has_named_captures_;
Handle<JSReceiver> groups_obj_;
}; };
// Create the groups object (see also the RegExp result creation in // Create the groups object (see also the RegExp result creation in
@ -1072,6 +1251,7 @@ static Object* SearchRegExpMultiple(Isolate* isolate, Handle<String> subject,
elements->set(cursor++, *subject); elements->set(cursor++, *subject);
if (has_named_captures) { if (has_named_captures) {
DCHECK(FLAG_harmony_regexp_named_captures);
Handle<FixedArray> capture_map = Handle<FixedArray> capture_map =
Handle<FixedArray>::cast(maybe_capture_map); Handle<FixedArray>::cast(maybe_capture_map);
Handle<JSObject> groups = ConstructNamedCaptureGroupsObject( Handle<JSObject> groups = ConstructNamedCaptureGroupsObject(
@ -1183,7 +1363,7 @@ MUST_USE_RESULT MaybeHandle<String> RegExpReplace(Isolate* isolate,
builder.AppendString(factory->NewSubString(string, 0, start_index)); builder.AppendString(factory->NewSubString(string, 0, start_index));
if (replace->length() > 0) { if (replace->length() > 0) {
MatchInfoBackedMatch m(isolate, string, match_indices); MatchInfoBackedMatch m(isolate, regexp, string, match_indices);
Handle<String> replacement; Handle<String> replacement;
ASSIGN_RETURN_ON_EXCEPTION(isolate, replacement, ASSIGN_RETURN_ON_EXCEPTION(isolate, replacement,
String::GetSubstitution(isolate, &m, replace), String::GetSubstitution(isolate, &m, replace),
@ -1316,6 +1496,7 @@ RUNTIME_FUNCTION(Runtime_StringReplaceNonGlobalRegExpWithFunction) {
Object* maybe_capture_map = regexp->CaptureNameMap(); Object* maybe_capture_map = regexp->CaptureNameMap();
if (maybe_capture_map->IsFixedArray()) { if (maybe_capture_map->IsFixedArray()) {
DCHECK(FLAG_harmony_regexp_named_captures);
has_named_captures = true; has_named_captures = true;
capture_map = handle(FixedArray::cast(maybe_capture_map)); capture_map = handle(FixedArray::cast(maybe_capture_map));
} }
@ -1703,7 +1884,13 @@ RUNTIME_FUNCTION(Runtime_RegExpReplace) {
isolate, replacement, Object::ToString(isolate, replacement_obj)); isolate, replacement, Object::ToString(isolate, replacement_obj));
} else { } else {
DCHECK(!functional_replace); DCHECK(!functional_replace);
VectorBackedMatch m(isolate, string, match, position, &captures); if (!groups_obj->IsUndefined(isolate)) {
// TODO(jgruber): Behavior in this case is not yet specced.
ASSIGN_RETURN_FAILURE_ON_EXCEPTION(
isolate, groups_obj, JSReceiver::ToObject(isolate, groups_obj));
}
VectorBackedMatch m(isolate, string, match, position, &captures,
groups_obj);
ASSIGN_RETURN_FAILURE_ON_EXCEPTION( ASSIGN_RETURN_FAILURE_ON_EXCEPTION(
isolate, replacement, String::GetSubstitution(isolate, &m, replace)); isolate, replacement, String::GetSubstitution(isolate, &m, replace));
} }

View File

@ -31,13 +31,20 @@ RUNTIME_FUNCTION(Runtime_GetSubstitution) {
: match_(match), prefix_(prefix), suffix_(suffix) {} : match_(match), prefix_(prefix), suffix_(suffix) {}
Handle<String> GetMatch() override { return match_; } Handle<String> GetMatch() override { return match_; }
Handle<String> GetPrefix() override { return prefix_; }
Handle<String> GetSuffix() override { return suffix_; }
int CaptureCount() override { return 0; }
bool HasNamedCaptures() override { return false; }
MaybeHandle<String> GetCapture(int i, bool* capture_exists) override { MaybeHandle<String> GetCapture(int i, bool* capture_exists) override {
*capture_exists = false; *capture_exists = false;
return match_; // Return arbitrary string handle. return match_; // Return arbitrary string handle.
} }
Handle<String> GetPrefix() override { return prefix_; } MaybeHandle<String> GetNamedCapture(Handle<String> name,
Handle<String> GetSuffix() override { return suffix_; } bool* capture_exists) override {
int CaptureCount() override { return 0; } UNREACHABLE();
return MaybeHandle<String>();
}
private: private:
Handle<String> match_, prefix_, suffix_; Handle<String> match_, prefix_, suffix_;

View File

@ -217,7 +217,7 @@ bytecodes: [
B(TestTypeOf), U8(5), B(TestTypeOf), U8(5),
B(JumpIfFalse), U8(4), B(JumpIfFalse), U8(4),
B(Jump), U8(18), B(Jump), U8(18),
B(Wide), B(LdaSmi), I16(129), B(Wide), B(LdaSmi), I16(130),
B(Star), R(12), B(Star), R(12),
B(LdaConstant), U8(11), B(LdaConstant), U8(11),
B(Star), R(13), B(Star), R(13),
@ -701,7 +701,7 @@ bytecodes: [
B(TestTypeOf), U8(5), B(TestTypeOf), U8(5),
B(JumpIfFalse), U8(4), B(JumpIfFalse), U8(4),
B(Jump), U8(18), B(Jump), U8(18),
B(Wide), B(LdaSmi), I16(129), B(Wide), B(LdaSmi), I16(130),
B(Star), R(12), B(Star), R(12),
B(LdaConstant), U8(11), B(LdaConstant), U8(11),
B(Star), R(13), B(Star), R(13),
@ -1219,7 +1219,7 @@ bytecodes: [
B(TestTypeOf), U8(5), B(TestTypeOf), U8(5),
B(JumpIfFalse), U8(4), B(JumpIfFalse), U8(4),
B(Jump), U8(18), B(Jump), U8(18),
B(Wide), B(LdaSmi), I16(129), B(Wide), B(LdaSmi), I16(130),
B(Star), R(12), B(Star), R(12),
B(LdaConstant), U8(11), B(LdaConstant), U8(11),
B(Star), R(13), B(Star), R(13),
@ -1627,7 +1627,7 @@ bytecodes: [
B(TestTypeOf), U8(5), B(TestTypeOf), U8(5),
B(JumpIfFalse), U8(4), B(JumpIfFalse), U8(4),
B(Jump), U8(18), B(Jump), U8(18),
B(Wide), B(LdaSmi), I16(129), B(Wide), B(LdaSmi), I16(130),
B(Star), R(11), B(Star), R(11),
B(LdaConstant), U8(10), B(LdaConstant), U8(10),
B(Star), R(12), B(Star), R(12),

View File

@ -85,7 +85,7 @@ bytecodes: [
B(TestTypeOf), U8(5), B(TestTypeOf), U8(5),
B(JumpIfFalse), U8(4), B(JumpIfFalse), U8(4),
B(Jump), U8(18), B(Jump), U8(18),
B(Wide), B(LdaSmi), I16(129), B(Wide), B(LdaSmi), I16(130),
B(Star), R(12), B(Star), R(12),
B(LdaConstant), U8(8), B(LdaConstant), U8(8),
B(Star), R(13), B(Star), R(13),
@ -226,7 +226,7 @@ bytecodes: [
B(TestTypeOf), U8(5), B(TestTypeOf), U8(5),
B(JumpIfFalse), U8(4), B(JumpIfFalse), U8(4),
B(Jump), U8(18), B(Jump), U8(18),
B(Wide), B(LdaSmi), I16(129), B(Wide), B(LdaSmi), I16(130),
B(Star), R(13), B(Star), R(13),
B(LdaConstant), U8(8), B(LdaConstant), U8(8),
B(Star), R(14), B(Star), R(14),
@ -380,7 +380,7 @@ bytecodes: [
B(TestTypeOf), U8(5), B(TestTypeOf), U8(5),
B(JumpIfFalse), U8(4), B(JumpIfFalse), U8(4),
B(Jump), U8(18), B(Jump), U8(18),
B(Wide), B(LdaSmi), I16(129), B(Wide), B(LdaSmi), I16(130),
B(Star), R(12), B(Star), R(12),
B(LdaConstant), U8(8), B(LdaConstant), U8(8),
B(Star), R(13), B(Star), R(13),
@ -524,7 +524,7 @@ bytecodes: [
B(TestTypeOf), U8(5), B(TestTypeOf), U8(5),
B(JumpIfFalse), U8(4), B(JumpIfFalse), U8(4),
B(Jump), U8(18), B(Jump), U8(18),
B(Wide), B(LdaSmi), I16(129), B(Wide), B(LdaSmi), I16(130),
B(Star), R(11), B(Star), R(11),
B(LdaConstant), U8(10), B(LdaConstant), U8(10),
B(Star), R(12), B(Star), R(12),

View File

@ -493,7 +493,7 @@ bytecodes: [
B(TestTypeOf), U8(5), B(TestTypeOf), U8(5),
B(JumpIfFalse), U8(4), B(JumpIfFalse), U8(4),
B(Jump), U8(18), B(Jump), U8(18),
B(Wide), B(LdaSmi), I16(129), B(Wide), B(LdaSmi), I16(130),
B(Star), R(11), B(Star), R(11),
B(LdaConstant), U8(10), B(LdaConstant), U8(10),
B(Star), R(12), B(Star), R(12),

View File

@ -208,3 +208,59 @@ function toSlowMode(re) {
}); });
assertEquals("bacd", result); assertEquals("bacd", result);
} }
// @@replace with a string replacement argument (no named captures).
{
let re = /(.)(.)/u;
assertEquals("$<snd>$<fst>cd", "abcd".replace(re, "$<snd>$<fst>"));
assertEquals("bacd", "abcd".replace(re, "$2$1"));
assertEquals("$<sndcd", "abcd".replace(re, "$<snd"));
assertEquals("$<42a>cd", "abcd".replace(re, "$<42$1>"));
assertEquals("$<thd>cd", "abcd".replace(re, "$<thd>"));
assertEquals("$<a>cd", "abcd".replace(re, "$<$1>"));
}
// @@replace with a string replacement argument (global, named captures).
{
let re = /(?<fst>.)(?<snd>.)/gu;
assertEquals("badc", "abcd".replace(re, "$<snd>$<fst>"));
assertEquals("badc", "abcd".replace(re, "$2$1"));
assertThrows(() => "abcd".replace(re, "$<snd"), SyntaxError);
assertEquals("", "abcd".replace(re, "$<42$1>"));
assertEquals("", "abcd".replace(re, "$<thd>"));
assertEquals("", "abcd".replace(re, "$<$1>"));
}
// @@replace with a string replacement argument (non-global, named captures).
{
let re = /(?<fst>.)(?<snd>.)/u;
assertEquals("bacd", "abcd".replace(re, "$<snd>$<fst>"));
assertEquals("bacd", "abcd".replace(re, "$2$1"));
assertThrows(() => "abcd".replace(re, "$<snd"), SyntaxError);
assertEquals("cd", "abcd".replace(re, "$<42$1>"));
assertEquals("cd", "abcd".replace(re, "$<thd>"));
assertEquals("cd", "abcd".replace(re, "$<$1>"));
}
// @@replace with a string replacement argument (slow, global, named captures).
{
let re = toSlowMode(/(?<fst>.)(?<snd>.)/gu);
assertEquals("badc", "abcd".replace(re, "$<snd>$<fst>"));
assertEquals("badc", "abcd".replace(re, "$2$1"));
assertThrows(() => "abcd".replace(re, "$<snd"), SyntaxError);
assertEquals("", "abcd".replace(re, "$<42$1>"));
assertEquals("", "abcd".replace(re, "$<thd>"));
assertEquals("", "abcd".replace(re, "$<$1>"));
}
// @@replace with a string replacement argument (slow, non-global,
// named captures).
{
let re = toSlowMode(/(?<fst>.)(?<snd>.)/u);
assertEquals("bacd", "abcd".replace(re, "$<snd>$<fst>"));
assertEquals("bacd", "abcd".replace(re, "$2$1"));
assertThrows(() => "abcd".replace(re, "$<snd"), SyntaxError);
assertEquals("cd", "abcd".replace(re, "$<42$1>"));
assertEquals("cd", "abcd".replace(re, "$<thd>"));
assertEquals("cd", "abcd".replace(re, "$<$1>"));
}