be014256ad
Bug: v8:9247 Change-Id: I9bcf2694b449f79cdbe03f5fde59cb21b8cad418 Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/1619758 Commit-Queue: Yang Guo <yangguo@chromium.org> Reviewed-by: Michael Lippautz <mlippautz@chromium.org> Reviewed-by: Andreas Haas <ahaas@chromium.org> Reviewed-by: Georg Neis <neis@chromium.org> Cr-Commit-Position: refs/heads/master@{#61676}
32 lines
970 B
C++
32 lines
970 B
C++
// Copyright 2018 the V8 project authors. All rights reserved.
|
|
// Use of this source code is governed by a BSD-style license that can be
|
|
// found in the LICENSE file.
|
|
|
|
#include "test/cctest/unicode-helpers.h"
|
|
#include "src/strings/unicode-inl.h"
|
|
|
|
int Ucs2CharLength(unibrow::uchar c) {
|
|
if (c == unibrow::Utf8::kIncomplete || c == unibrow::Utf8::kBufferEmpty) {
|
|
return 0;
|
|
} else if (c < 0xFFFF) {
|
|
return 1;
|
|
} else {
|
|
return 2;
|
|
}
|
|
}
|
|
|
|
int Utf8LengthHelper(const char* s) {
|
|
unibrow::Utf8::Utf8IncrementalBuffer buffer(unibrow::Utf8::kBufferEmpty);
|
|
unibrow::Utf8::State state = unibrow::Utf8::State::kAccept;
|
|
|
|
int length = 0;
|
|
const uint8_t* c = reinterpret_cast<const uint8_t*>(s);
|
|
while (*c != '\0') {
|
|
unibrow::uchar tmp = unibrow::Utf8::ValueOfIncremental(&c, &state, &buffer);
|
|
length += Ucs2CharLength(tmp);
|
|
}
|
|
unibrow::uchar tmp = unibrow::Utf8::ValueOfIncrementalFinish(&state);
|
|
length += Ucs2CharLength(tmp);
|
|
return length;
|
|
}
|