2018-09-07 09:17:06 +00:00
|
|
|
// Copyright 2018 the V8 project authors. All rights reserved.
|
|
|
|
// Use of this source code is governed by a BSD-style license that can be
|
|
|
|
// found in the LICENSE file.
|
|
|
|
|
|
|
|
#include "test/cctest/unicode-helpers.h"
|
2019-05-21 06:38:38 +00:00
|
|
|
#include "src/strings/unicode-inl.h"
|
2018-09-07 09:17:06 +00:00
|
|
|
|
|
|
|
int Ucs2CharLength(unibrow::uchar c) {
|
|
|
|
if (c == unibrow::Utf8::kIncomplete || c == unibrow::Utf8::kBufferEmpty) {
|
|
|
|
return 0;
|
|
|
|
} else if (c < 0xFFFF) {
|
|
|
|
return 1;
|
|
|
|
} else {
|
|
|
|
return 2;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
int Utf8LengthHelper(const char* s) {
|
|
|
|
unibrow::Utf8::Utf8IncrementalBuffer buffer(unibrow::Utf8::kBufferEmpty);
|
|
|
|
unibrow::Utf8::State state = unibrow::Utf8::State::kAccept;
|
|
|
|
|
|
|
|
int length = 0;
|
2019-02-06 12:26:06 +00:00
|
|
|
const uint8_t* c = reinterpret_cast<const uint8_t*>(s);
|
|
|
|
while (*c != '\0') {
|
|
|
|
unibrow::uchar tmp = unibrow::Utf8::ValueOfIncremental(&c, &state, &buffer);
|
2018-09-07 09:17:06 +00:00
|
|
|
length += Ucs2CharLength(tmp);
|
|
|
|
}
|
|
|
|
unibrow::uchar tmp = unibrow::Utf8::ValueOfIncrementalFinish(&state);
|
|
|
|
length += Ucs2CharLength(tmp);
|
|
|
|
return length;
|
|
|
|
}
|