skia2/experimental/editor/word_boundaries.cpp
Hal Canary ded867f126 experimental/editor: shape.h to unify all shaping code
also simplify handling of implicit position at end of line.

also simplfy move() operation.

Change-Id: Ic242b5413c65295b1ac1bf7aa3a4948c3ed1c742
Reviewed-on: https://skia-review.googlesource.com/c/skia/+/233303
Commit-Queue: Hal Canary <halcanary@google.com>
Reviewed-by: Ben Wagner <bungeman@google.com>
2019-08-09 14:20:10 +00:00

51 lines
1.5 KiB
C++

// Copyright 2019 Google LLC.
// Use of this source code is governed by a BSD-style license that can be found in the LICENSE file.
#include "experimental/editor/word_boundaries.h"
#include <unicode/brkiter.h>
#include <unicode/unistr.h>
#include <memory>
std::vector<bool> GetUtf8WordBoundaries(const char* begin, size_t byteCount, const char* locale) {
static constexpr UBreakIteratorType kIteratorType = UBRK_WORD;
struct UTextCloser {
void operator()(UText* p) { (void)utext_close(p); }
};
struct UBreakCloser {
void operator()(UBreakIterator* p) { (void)ubrk_close(p); }
};
std::vector<bool> result;
if (0 == byteCount) {
return result;
}
result.resize(byteCount);
UText utf8UText = UTEXT_INITIALIZER;
UErrorCode errorCode = U_ZERO_ERROR;
(void)utext_openUTF8(&utf8UText, begin, byteCount, &errorCode);
std::unique_ptr<UText, UTextCloser> autoclose1(&utf8UText);
if (U_FAILURE(errorCode)) {
return result;
}
UBreakIterator* iter = ubrk_open(kIteratorType, locale, nullptr, 0, &errorCode);
std::unique_ptr<UBreakIterator, UBreakCloser> autoclose2(iter);
if (U_FAILURE(errorCode)) {
return result;
}
ubrk_setUText(iter, &utf8UText, &errorCode);
if (U_FAILURE(errorCode)) {
return result;
}
int pos = ubrk_first(iter);
while (pos != icu::BreakIterator::DONE) {
if ((unsigned)pos < (unsigned)byteCount) {
result[pos] = true;
}
pos = ubrk_next(iter);
}
return result;
}