[scanner] Replace PushBack2 with Peek() after PushBack

Change-Id: Ic70a83335c60ba2f1f656398fc6b19db7af99348
Reviewed-on: https://chromium-review.googlesource.com/1175915
Commit-Queue: Toon Verwaest <verwaest@chromium.org>
Reviewed-by: Leszek Swirski <leszeks@chromium.org>
Cr-Commit-Position: refs/heads/master@{#55157}
This commit is contained in:
Toon Verwaest 2018-08-16 11:47:23 +02:00 committed by Commit Bot
parent 84894ce6d2
commit 4aa3ad271b
3 changed files with 15 additions and 44 deletions

View File

@ -53,16 +53,17 @@ class CharacterStream : public ScannerStream {
// Returns and advances past the next UTF-16 code unit in the input
// stream. If there are no more code units it returns kEndOfInput.
inline uc32 Advance() final {
if (V8_LIKELY(buffer_cursor_ < buffer_end_)) {
return static_cast<uc32>(*(buffer_cursor_++));
} else if (ReadBlockChecked()) {
return static_cast<uc32>(*(buffer_cursor_++));
} else {
// Note: currently the following increment is necessary to avoid a
// parser problem! The scanner treats the final kEndOfInput as
// a code unit with a position, and does math relative to that
// position.
uc32 result = Peek();
buffer_cursor_++;
return result;
}
inline uc32 Peek() {
if (V8_LIKELY(buffer_cursor_ < buffer_end_)) {
return static_cast<uc32>(*buffer_cursor_);
} else if (ReadBlockChecked()) {
return static_cast<uc32>(*buffer_cursor_);
} else {
return kEndOfInput;
}
}
@ -105,17 +106,6 @@ class CharacterStream : public ScannerStream {
}
}
// Go back one by two characters in the input stream. (This is the same as
// calling Back() twice. But Back() may - in some instances - do substantial
// work. Back2() guarantees this work will be done only once.)
inline void Back2() {
if (V8_LIKELY(buffer_cursor_ - 2 >= buffer_start_)) {
buffer_cursor_ -= 2;
} else {
ReadBlockAt(pos() - 2);
}
}
inline size_t pos() const final {
return buffer_pos_ + (buffer_cursor_ - buffer_start_);
}
@ -157,7 +147,7 @@ class CharacterStream : public ScannerStream {
}
void ReadBlockAt(size_t new_pos) {
// The callers of this method (Back/Back2/Seek) should handle the easy
// The callers of this method (Back/Seek) should handle the easy
// case (seeking within the current buffer), and we should only get here
// if we actually require new data.
// (This is really an efficiency check, not a correctness invariant.)

View File

@ -415,21 +415,17 @@ Token::Value Scanner::PeekAhead() {
Token::Value Scanner::TryToSkipHTMLCommentAndWhiteSpaces(int start_position) {
while (true) {
DCHECK_EQ('-', c0_);
Advance();
// If there is an HTML comment end '-->' at the beginning of a
// line, we treat the rest of the line as a comment. This is in line with
// the way SpiderMonkey handles it.
if (c0_ != '-') {
if (c0_ != '-' || Peek() != '>') {
PushBack('-'); // undo Advance()
break;
}
Advance();
if (c0_ != '>') {
PushBack2('-', '-'); // undo 2x Advance();
break;
}
// Treat the rest of the line as a comment.
Token::Value token = SkipSingleHTMLComment();
@ -566,16 +562,11 @@ Token::Value Scanner::ScanHtmlComment() {
// Check for <!-- comments.
DCHECK_EQ(c0_, '!');
Advance();
if (c0_ != '-') {
if (c0_ != '-' || Peek() != '-') {
PushBack('!'); // undo Advance()
return Token::LT;
}
Advance();
if (c0_ != '-') {
PushBack2('-', '!'); // undo 2x Advance()
return Token::LT;
}
found_html_comment_ = true;
return SkipSingleHTMLComment();

View File

@ -500,22 +500,12 @@ class Scanner {
}
void PushBack(uc32 ch) {
if (c0_ > static_cast<uc32>(unibrow::Utf16::kMaxNonSurrogateCharCode)) {
source_->Back2();
} else {
DCHECK_LE(c0_, static_cast<uc32>(unibrow::Utf16::kMaxNonSurrogateCharCode));
source_->Back();
}
c0_ = ch;
}
// Same as PushBack(ch1); PushBack(ch2).
// - Potentially more efficient as it uses Back2() on the stream.
// - Uses char as parameters, since we're only calling it with ASCII chars in
// practice. This way, we can avoid a few edge cases.
void PushBack2(char ch1, char ch2) {
source_->Back2();
c0_ = ch2;
}
uc32 Peek() const { return source_->Peek(); }
inline Token::Value Select(Token::Value tok) {
Advance();