v8/src/unicode-inl.h

// Copyright 2007-2010 the V8 project authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#ifndef V8_UNICODE_INL_H_
#define V8_UNICODE_INL_H_

#include "src/unicode.h"
#include "src/base/logging.h"
#include "src/utils.h"

namespace unibrow {

// Answers whether |code_point| satisfies predicate T. The cache slot chosen
// by (code_point & kMask) is consulted first; if it was filled for a
// different code point the answer is recomputed via CalculateValue.
template <class T, int s>
bool Predicate<T, s>::get(uchar code_point) {
  const CacheEntry cached = entries_[code_point & kMask];
  if (cached.code_point_ != code_point) {
    // Slot belongs to some other code point: take the miss path.
    return CalculateValue(code_point);
  }
  return cached.value_;
}

// Miss path for get(): evaluates T::Is(code_point), overwrites the cache slot
// selected by (code_point & kMask) with the fresh answer, and returns it.
template <class T, int s>
bool Predicate<T, s>::CalculateValue(uchar code_point) {
  const bool is_member = T::Is(code_point);
  entries_[code_point & kMask] = CacheEntry(code_point, is_member);
  return is_member;
}

// Maps |c| through T, using the cache slot selected by (c & kMask).
//
// On a cache hit:
//   - a stored offset of 0 means "nothing to write"; returns 0 and leaves
//     |result| untouched;
//   - otherwise writes c + offset into result[0] and returns 1.
// On a miss the work (and any caching) is delegated to CalculateValue, which
// also receives |n| and |result|.
template <class T, int s>
int Mapping<T, s>::get(uchar c, uchar n, uchar* result) {
  const CacheEntry cached = entries_[c & kMask];
  if (cached.code_point_ != c) return CalculateValue(c, n, result);
  if (cached.offset_ == 0) return 0;
  result[0] = c + cached.offset_;
  return 1;
}

// Miss path for get(): runs T::Convert(c, n, result, &flag) and, if the
// converter leaves the caching flag set, records the outcome in the slot
// selected by (c & kMask).
//
// When caching is allowed only a one-element result is remembered, stored as
// the offset result[0] - c; every other length is cached as offset 0 and
// reported to the caller as 0. When caching is not allowed the converter's
// length is returned unchanged and the cache is left alone.
template <class T, int s>
int Mapping<T, s>::CalculateValue(uchar c, uchar n, uchar* result) {
  bool cacheable = true;
  const int converted = T::Convert(c, n, result, &cacheable);
  if (!cacheable) return converted;
  if (converted == 1) {
    entries_[c & kMask] = CacheEntry(c, result[0] - c);
    return 1;
  }
  entries_[c & kMask] = CacheEntry(c, 0);
  return 0;
}


// Maps a code unit above Latin1::kMaxChar to a Latin-1 counterpart, or
// returns 0 when this function knows of none. Callers must pass a value
// greater than Latin1::kMaxChar (checked by the ASSERT).
uint16_t Latin1::ConvertNonLatin1ToLatin1(uint16_t c) {
  ASSERT(c > Latin1::kMaxChar);
  // 0x39c and 0x3bc are treated as equivalent to the Latin-1 character 0xb5.
  if (c == 0x39c || c == 0x3bc) return 0xb5;
  // 0x178 lies outside Latin-1 but is the uppercase form of the Latin-1
  // character 0xff.
  if (c == 0x178) return 0xff;
  return 0;
}


// Encodes the single-byte character |c| as UTF-8 into |str| and returns the
// number of bytes written: 1 when c <= kMaxOneByteChar, otherwise 2.
unsigned Utf8::EncodeOneByte(char* str, uint8_t c) {
  // Clears bit 6 only. Bit 7 is forced on by the 0x80 OR below, so the
  // continuation byte ends up carrying just the low six bits of |c|.
  static const int kMask = ~(1 << 6);
  if (c > kMaxOneByteChar) {
    str[0] = 0xC0 | (c >> 6);
    str[1] = 0x80 | (c & kMask);
    return 2;
  }
  str[0] = c;
  return 1;
}

// Writes the UTF-8 form of |c| starting at |str| and returns the byte count
// relative to |str|. |previous| is the preceding UTF-16 code unit (or
// Utf16::kNoPreviousCharacter).
//
// If |previous| and |c| form a surrogate pair, the pair is combined and
// re-encoded starting kSizeOfUnmatchedSurrogate bytes *before* |str|; the
// value returned is that encoding's length minus kSizeOfUnmatchedSurrogate.
// NOTE(review): this presumes the caller already emitted the lead surrogate
// on its own into those preceding bytes -- confirm against callers.
//
// If |replace_invalid| is true, a lead or trail surrogate that does not
// complete a pair is replaced with kBadChar before being written.
unsigned Utf8::Encode(char* str,
                      uchar c,
                      int previous,
                      bool replace_invalid) {
  // Clears bit 6 only. Bit 7 is set by the 0x80 OR anyway, and any bits
  // above bit 7 are expected to be dropped when the value is narrowed to
  // char, leaving the usual six payload bits in each continuation byte.
  static const int kMask = ~(1 << 6);

  if (c <= kMaxOneByteChar) {
    str[0] = c;
    return 1;
  }

  if (c <= kMaxTwoByteChar) {
    str[0] = 0xC0 | (c >> 6);
    str[1] = 0x80 | (c & kMask);
    return 2;
  }

  if (c > kMaxThreeByteChar) {
    str[0] = 0xF0 | (c >> 18);
    str[1] = 0x80 | ((c >> 12) & kMask);
    str[2] = 0x80 | ((c >> 6) & kMask);
    str[3] = 0x80 | (c & kMask);
    return 4;
  }

  // Three-byte range from here on; this is where surrogates live.
  if (Utf16::IsSurrogatePair(previous, c)) {
    const int kUnmatchedSize = kSizeOfUnmatchedSurrogate;
    // Back up over the lead surrogate's bytes and encode the combined
    // code point in their place.
    return Encode(str - kUnmatchedSize,
                  Utf16::CombineSurrogatePair(previous, c),
                  Utf16::kNoPreviousCharacter,
                  replace_invalid) - kUnmatchedSize;
  }

  const bool is_surrogate =
      Utf16::IsLeadSurrogate(c) || Utf16::IsTrailSurrogate(c);
  if (replace_invalid && is_surrogate) {
    c = kBadChar;
  }

  str[0] = 0xE0 | (c >> 12);
  str[1] = 0x80 | ((c >> 6) & kMask);
  str[2] = 0x80 | (c & kMask);
  return 3;
}


// Decodes the character that starts at bytes[0].
//
// Empty input (length == 0) yields kBadChar and leaves |*cursor| untouched.
// A first byte no greater than kMaxOneByteChar is a complete character on
// its own: |*cursor| is advanced by one and the byte is returned. Anything
// else is handed to CalculateValue together with |length| and |cursor|.
uchar Utf8::ValueOf(const byte* bytes, unsigned length, unsigned* cursor) {
  if (length == 0) return kBadChar;
  const byte lead = bytes[0];
  if (lead > kMaxOneByteChar) {
    return CalculateValue(bytes, length, cursor);
  }
  *cursor += 1;
  return lead;
}

// Returns the number of UTF-8 bytes that |c| contributes, given the preceding
// UTF-16 code unit |previous|.
//
// The result is 1, 2, 3 or 4 according to which of kMaxOneByteChar,
// kMaxTwoByteChar and kMaxThreeByteChar bounds |c|, with one exception: a
// trail surrogate that follows a lead surrogate contributes
// kSizeOfUnmatchedSurrogate - kBytesSavedByCombiningSurrogates instead of 3.
unsigned Utf8::Length(uchar c, int previous) {
  if (c <= kMaxOneByteChar) return 1;
  if (c <= kMaxTwoByteChar) return 2;
  if (c > kMaxThreeByteChar) return 4;

  const bool completes_pair =
      Utf16::IsTrailSurrogate(c) && Utf16::IsLeadSurrogate(previous);
  if (completes_pair) {
    return kSizeOfUnmatchedSurrogate - kBytesSavedByCombiningSurrogates;
  }
  return 3;
}

// Default-constructs a decoder with no unbuffered input pointer, a UTF-16
// length of zero, and the "last byte of buffer unused" flag cleared.
Utf8DecoderBase::Utf8DecoderBase()
    : unbuffered_start_(NULL),
      utf16_length_(0),
      last_byte_of_buffer_unused_(false) {
}

// Constructs a decoder over |stream| (|stream_length| bytes) using |buffer|
// (|buffer_length| elements) as its UTF-16 buffer. There are no member
// initializers here; all four arguments are forwarded to Reset.
Utf8DecoderBase::Utf8DecoderBase(uint16_t* buffer, unsigned buffer_length,
                                 const uint8_t* stream,
                                 unsigned stream_length) {
  Reset(buffer, buffer_length, stream, stream_length);
}

// Constructs a decoder over the |length| bytes at |stream|, handing the base
// class this object's own buffer_ (kBufferSize elements) as its buffer. The
// char stream is reinterpreted as uint8_t for the base class.
template <unsigned kBufferSize>
Utf8Decoder<kBufferSize>::Utf8Decoder(const char* stream, unsigned length)
    : Utf8DecoderBase(buffer_, kBufferSize,
                      reinterpret_cast<const uint8_t*>(stream), length) {}

// Re-targets this decoder at the |length| bytes starting at |stream| by
// forwarding to Utf8DecoderBase::Reset with this object's buffer_ and
// kBufferSize.
template <unsigned kBufferSize>
void Utf8Decoder<kBufferSize>::Reset(const char* stream, unsigned length) {
  const uint8_t* const utf8_bytes = reinterpret_cast<const uint8_t*>(stream);
  Utf8DecoderBase::Reset(buffer_, kBufferSize, utf8_bytes, length);
}

// Copies up to |length| UTF-16 code units into |data| and returns how many
// were written. |length| must be non-zero (ASSERTed) and is clamped to
// utf16_length_.
//
// Units held in buffer_ are copied with MemCopy. The usable part of buffer_
// is kBufferSize units, or kBufferSize - 1 when last_byte_of_buffer_unused_
// is set. Anything requested beyond that is produced by WriteUtf16Slow,
// starting from unbuffered_start_.
template <unsigned kBufferSize>
unsigned Utf8Decoder<kBufferSize>::WriteUtf16(uint16_t* data,
                                              unsigned length) const {
  ASSERT(length > 0);
  if (utf16_length_ < length) length = utf16_length_;

  // Number of valid units available directly from buffer_.
  unsigned buffered = kBufferSize;
  if (last_byte_of_buffer_unused_) buffered = kBufferSize - 1;

  // Fast path: bulk-copy whatever part of the request the buffer covers.
  const bool fits_in_buffer = length <= buffered;
  const unsigned fast_count = fits_in_buffer ? length : buffered;
  v8::internal::MemCopy(data, buffer_, fast_count * sizeof(uint16_t));
  if (fits_in_buffer) return length;

  // Slow path: the remainder is written by WriteUtf16Slow.
  ASSERT(unbuffered_start_ != NULL);
  WriteUtf16Slow(unbuffered_start_, data + buffered, length - buffered);
  return length;
}

}  // namespace unibrow

#endif  // V8_UNICODE_INL_H_
Updated unicode library. Added Nl category to letters predicate (as required for JS identifiers). Changed/simplified representation of canonicalization ranges. Truncated tables to code points in the BMP (all that is used by JS). Reformatted tables to avoid excessively long lines. Removed duplicate entries from multi-character mapping result tables. Review URL: http://codereview.chromium.org/3030026 git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@5155 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2010-07-30 07:10:22 +00:00			`// Copyright 2007-2010 the V8 project authors. All rights reserved.`
Bulk update of Google copyright headers in source files. R=svenpanne@chromium.org Review URL: https://codereview.chromium.org/259183002 git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@21035 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2014-04-29 06:42:26 +00:00			`// Use of this source code is governed by a BSD-style license that can be`
			`// found in the LICENSE file.`
Initial export. git-svn-id: http://v8.googlecode.com/svn/trunk@2 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2008-07-03 15:10:15 +00:00
Cleanup include guards: - Fix some typos / guards that didn't match the filename. - Fix some style inconsistencies. - Add guards to files that were missing them. - Add the directory name to the guard. Review URL: http://codereview.chromium.org/99343 git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@1845 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2009-05-04 13:36:43 +00:00			`#ifndef V8_UNICODE_INL_H_`
			`#define V8_UNICODE_INL_H_`
Initial export. git-svn-id: http://v8.googlecode.com/svn/trunk@2 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2008-07-03 15:10:15 +00:00
Use full include paths everywhere - this avoids using relative include paths which are forbidden by the style guide - makes the code more readable since it's clear which header is meant - allows for starting to use checkdeps BUG=none R=jkummerow@chromium.org, danno@chromium.org LOG=n Review URL: https://codereview.chromium.org/304153016 git-svn-id: https://v8.googlecode.com/svn/branches/bleeding_edge@21625 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2014-06-03 08:12:43 +00:00			`#include "src/unicode.h"`
Move platform abstraction to base library Also split v8-core independent methods from checks.h to base/logging.h and merge v8checks with the rest of checks. The CPU::FlushICache method is moved to CpuFeatures::FlushICache RoundUp and related methods are moved to base/macros.h Remove all layering violations from src/libplatform BUG=none R=jkummerow@chromium.org LOG=n Review URL: https://codereview.chromium.org/358363002 git-svn-id: https://v8.googlecode.com/svn/branches/bleeding_edge@22092 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2014-06-30 13:25:46 +00:00			`#include "src/base/logging.h"`
Use full include paths everywhere - this avoids using relative include paths which are forbidden by the style guide - makes the code more readable since it's clear which header is meant - allows for starting to use checkdeps BUG=none R=jkummerow@chromium.org, danno@chromium.org LOG=n Review URL: https://codereview.chromium.org/304153016 git-svn-id: https://v8.googlecode.com/svn/branches/bleeding_edge@21625 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2014-06-03 08:12:43 +00:00			`#include "src/utils.h"`
Initial export. git-svn-id: http://v8.googlecode.com/svn/trunk@2 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2008-07-03 15:10:15 +00:00
			`namespace unibrow {`

			`template <class T, int s> bool Predicate<T, s>::get(uchar code_point) {`
			`CacheEntry entry = entries_[code_point & kMask];`
			`if (entry.code_point_ == code_point) return entry.value_;`
			`return CalculateValue(code_point);`
			`}`

			`template <class T, int s> bool Predicate<T, s>::CalculateValue(`
			`uchar code_point) {`
			`bool result = T::Is(code_point);`
			`entries_[code_point & kMask] = CacheEntry(code_point, result);`
			`return result;`
			`}`

			`template <class T, int s> int Mapping<T, s>::get(uchar c, uchar n,`
			`uchar* result) {`
			`CacheEntry entry = entries_[c & kMask];`
			`if (entry.code_point_ == c) {`
			`if (entry.offset_ == 0) {`
			`return 0;`
			`} else {`
			`result[0] = c + entry.offset_;`
			`return 1;`
			`}`
			`} else {`
			`return CalculateValue(c, n, result);`
			`}`
			`}`

			`template <class T, int s> int Mapping<T, s>::CalculateValue(uchar c, uchar n,`
			`uchar* result) {`
			`bool allow_caching = true;`
			`int length = T::Convert(c, n, result, &allow_caching);`
			`if (allow_caching) {`
			`if (length == 1) {`
			`entries_[c & kMask] = CacheEntry(c, result[0] - c);`
			`return 1;`
			`} else {`
			`entries_[c & kMask] = CacheEntry(c, 0);`
			`return 0;`
			`}`
			`} else {`
			`return length;`
			`}`
			`}`


Fix some latin-1 webkit units tests R=yangguo@chromium.org BUG= Review URL: https://chromiumcodereview.appspot.com/11962035 Patch from Dan Carney <dcarney@google.com>. git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@13455 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2013-01-21 16:11:31 +00:00			`uint16_t Latin1::ConvertNonLatin1ToLatin1(uint16_t c) {`
Cleanup latin-1 conversion check in regexp engine R=yangguo@chromium.org BUG= Review URL: https://chromiumcodereview.appspot.com/11880045 Patch from Dan Carney <dcarney@google.com>. git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@13400 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2013-01-16 13:04:07 +00:00			`ASSERT(c > Latin1::kMaxChar);`
			`switch (c) {`
Fix some latin-1 webkit units tests R=yangguo@chromium.org BUG= Review URL: https://chromiumcodereview.appspot.com/11962035 Patch from Dan Carney <dcarney@google.com>. git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@13455 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2013-01-21 16:11:31 +00:00			`// This are equivalent characters in unicode.`
			`case 0x39c:`
			`case 0x3bc:`
			`return 0xb5;`
			`// This is an uppercase of a Latin-1 character`
			`// outside of Latin-1.`
Cleanup latin-1 conversion check in regexp engine R=yangguo@chromium.org BUG= Review URL: https://chromiumcodereview.appspot.com/11880045 Patch from Dan Carney <dcarney@google.com>. git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@13400 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2013-01-16 13:04:07 +00:00			`case 0x178:`
Fix some latin-1 webkit units tests R=yangguo@chromium.org BUG= Review URL: https://chromiumcodereview.appspot.com/11962035 Patch from Dan Carney <dcarney@google.com>. git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@13455 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2013-01-21 16:11:31 +00:00			`return 0xff;`
Cleanup latin-1 conversion check in regexp engine R=yangguo@chromium.org BUG= Review URL: https://chromiumcodereview.appspot.com/11880045 Patch from Dan Carney <dcarney@google.com>. git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@13400 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2013-01-16 13:04:07 +00:00			`}`
Fix some latin-1 webkit units tests R=yangguo@chromium.org BUG= Review URL: https://chromiumcodereview.appspot.com/11962035 Patch from Dan Carney <dcarney@google.com>. git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@13455 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2013-01-21 16:11:31 +00:00			`return 0;`
Cleanup latin-1 conversion check in regexp engine R=yangguo@chromium.org BUG= Review URL: https://chromiumcodereview.appspot.com/11880045 Patch from Dan Carney <dcarney@google.com>. git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@13400 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2013-01-16 13:04:07 +00:00			`}`


Some Utf8Length microoptimizations R=yangguo@chromium.org BUG= Review URL: https://codereview.chromium.org/12783002 git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@13938 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2013-03-13 19:43:45 +00:00			`unsigned Utf8::EncodeOneByte(char* str, uint8_t c) {`
			`static const int kMask = ~(1 << 6);`
			`if (c <= kMaxOneByteChar) {`
			`str[0] = c;`
			`return 1;`
			`}`
			`str[0] = 0xC0 \| (c >> 6);`
			`str[1] = 0x80 \| (c & kMask);`
			`return 2;`
			`}`

String:WriteUtf8: Add REPLACE_INVALID_UTF8 option This patch makes String::WriteUtf8 replace invalid code points (i.e. unmatched surrogates) with the unicode replacement character when REPLACE_INVALID_UTF8 is set. This is done to avoid creating invalid UTF-8 output which can lead to compatibility issues with software requiring valid UTF-8 inputs (e.g. the WebSocket protocol requires valid UTF-8 and terminates connections when invalid UTF-8 is encountered). R=dcarney@chromium.org BUG= Review URL: https://codereview.chromium.org/121173009 Patch from Felix Geisendörfer <haimuiba@gmail.com>. git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@18683 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2014-01-20 09:52:54 +00:00			`// Encode encodes the UTF-16 code units c and previous into the given str`
			`// buffer, and combines surrogate code units into single code points. If`
			`// replace_invalid is set to true, orphan surrogate code units will be replaced`
			`// with kBadChar.`
			`unsigned Utf8::Encode(char* str,`
			`uchar c,`
			`int previous,`
			`bool replace_invalid) {`
Initial export. git-svn-id: http://v8.googlecode.com/svn/trunk@2 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2008-07-03 15:10:15 +00:00			`static const int kMask = ~(1 << 6);`
			`if (c <= kMaxOneByteChar) {`
			`str[0] = c;`
			`return 1;`
			`} else if (c <= kMaxTwoByteChar) {`
			`str[0] = 0xC0 \| (c >> 6);`
			`str[1] = 0x80 \| (c & kMask);`
			`return 2;`
			`} else if (c <= kMaxThreeByteChar) {`
String:WriteUtf8: Add REPLACE_INVALID_UTF8 option This patch makes String::WriteUtf8 replace invalid code points (i.e. unmatched surrogates) with the unicode replacement character when REPLACE_INVALID_UTF8 is set. This is done to avoid creating invalid UTF-8 output which can lead to compatibility issues with software requiring valid UTF-8 inputs (e.g. the WebSocket protocol requires valid UTF-8 and terminates connections when invalid UTF-8 is encountered). R=dcarney@chromium.org BUG= Review URL: https://codereview.chromium.org/121173009 Patch from Felix Geisendörfer <haimuiba@gmail.com>. git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@18683 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2014-01-20 09:52:54 +00:00			`if (Utf16::IsSurrogatePair(previous, c)) {`
Fix input and output to handle UTF16 surrogate pairs. Review URL: https://chromiumcodereview.appspot.com/9600009 git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@11007 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2012-03-12 12:35:28 +00:00			`const int kUnmatchedSize = kSizeOfUnmatchedSurrogate;`
			`return Encode(str - kUnmatchedSize,`
			`Utf16::CombineSurrogatePair(previous, c),`
String:WriteUtf8: Add REPLACE_INVALID_UTF8 option This patch makes String::WriteUtf8 replace invalid code points (i.e. unmatched surrogates) with the unicode replacement character when REPLACE_INVALID_UTF8 is set. This is done to avoid creating invalid UTF-8 output which can lead to compatibility issues with software requiring valid UTF-8 inputs (e.g. the WebSocket protocol requires valid UTF-8 and terminates connections when invalid UTF-8 is encountered). R=dcarney@chromium.org BUG= Review URL: https://codereview.chromium.org/121173009 Patch from Felix Geisendörfer <haimuiba@gmail.com>. git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@18683 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2014-01-20 09:52:54 +00:00			`Utf16::kNoPreviousCharacter,`
			`replace_invalid) - kUnmatchedSize;`
			`} else if (replace_invalid &&`
			`(Utf16::IsLeadSurrogate(c) \|\|`
			`Utf16::IsTrailSurrogate(c))) {`
			`c = kBadChar;`
Fix input and output to handle UTF16 surrogate pairs. Review URL: https://chromiumcodereview.appspot.com/9600009 git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@11007 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2012-03-12 12:35:28 +00:00			`}`
Initial export. git-svn-id: http://v8.googlecode.com/svn/trunk@2 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2008-07-03 15:10:15 +00:00			`str[0] = 0xE0 \| (c >> 12);`
			`str[1] = 0x80 \| ((c >> 6) & kMask);`
			`str[2] = 0x80 \| (c & kMask);`
			`return 3;`
			`} else {`
			`str[0] = 0xF0 \| (c >> 18);`
			`str[1] = 0x80 \| ((c >> 12) & kMask);`
			`str[2] = 0x80 \| ((c >> 6) & kMask);`
			`str[3] = 0x80 \| (c & kMask);`
			`return 4;`
			`}`
			`}`


			`uchar Utf8::ValueOf(const byte* bytes, unsigned length, unsigned* cursor) {`
			`if (length <= 0) return kBadChar;`
			`byte first = bytes[0];`
			`// Characters between 0000 and 0007F are encoded as a single character`
			`if (first <= kMaxOneByteChar) {`
			`*cursor += 1;`
			`return first;`
			`}`
			`return CalculateValue(bytes, length, cursor);`
			`}`

Fix input and output to handle UTF16 surrogate pairs. Review URL: https://chromiumcodereview.appspot.com/9600009 git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@11007 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2012-03-12 12:35:28 +00:00			`unsigned Utf8::Length(uchar c, int previous) {`
Initial export. git-svn-id: http://v8.googlecode.com/svn/trunk@2 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2008-07-03 15:10:15 +00:00			`if (c <= kMaxOneByteChar) {`
			`return 1;`
			`} else if (c <= kMaxTwoByteChar) {`
			`return 2;`
			`} else if (c <= kMaxThreeByteChar) {`
Fix input and output to handle UTF16 surrogate pairs. Review URL: https://chromiumcodereview.appspot.com/9600009 git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@11007 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2012-03-12 12:35:28 +00:00			`if (Utf16::IsTrailSurrogate(c) &&`
			`Utf16::IsLeadSurrogate(previous)) {`
			`return kSizeOfUnmatchedSurrogate - kBytesSavedByCombiningSurrogates;`
			`}`
Initial export. git-svn-id: http://v8.googlecode.com/svn/trunk@2 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2008-07-03 15:10:15 +00:00			`return 3;`
			`} else {`
			`return 4;`
			`}`
			`}`

Remove Utf8InputBuffer R=yangguo@chromium.org BUG= Review URL: https://chromiumcodereview.appspot.com/11649018 Patch from Dan Carney <dcarney@google.com>. git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@13248 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2012-12-20 09:20:37 +00:00			`Utf8DecoderBase::Utf8DecoderBase()`
			`: unbuffered_start_(NULL),`
			`utf16_length_(0),`
			`last_byte_of_buffer_unused_(false) {}`

			`Utf8DecoderBase::Utf8DecoderBase(uint16_t* buffer,`
			`unsigned buffer_length,`
			`const uint8_t* stream,`
			`unsigned stream_length) {`
			`Reset(buffer, buffer_length, stream, stream_length);`
			`}`

			`template<unsigned kBufferSize>`
			`Utf8Decoder<kBufferSize>::Utf8Decoder(const char* stream, unsigned length)`
			`: Utf8DecoderBase(buffer_,`
			`kBufferSize,`
			`reinterpret_cast<const uint8_t*>(stream),`
			`length) {`
			`}`

			`template<unsigned kBufferSize>`
			`void Utf8Decoder<kBufferSize>::Reset(const char* stream, unsigned length) {`
			`Utf8DecoderBase::Reset(buffer_,`
			`kBufferSize,`
			`reinterpret_cast<const uint8_t*>(stream),`
			`length);`
			`}`

			`template <unsigned kBufferSize>`
			`unsigned Utf8Decoder<kBufferSize>::WriteUtf16(uint16_t* data,`
			`unsigned length) const {`
			`ASSERT(length > 0);`
			`if (length > utf16_length_) length = utf16_length_;`
			`// memcpy everything in buffer.`
			`unsigned buffer_length =`
			`last_byte_of_buffer_unused_ ? kBufferSize - 1 : kBufferSize;`
Reland 21502 - "Move OS::MemCopy and OS::MemMove out of platform to utils" Verified that arm builds locally. BUG=none TBR=jkummerow@chromium.org LOG=n Review URL: https://codereview.chromium.org/306473004 git-svn-id: https://v8.googlecode.com/svn/branches/bleeding_edge@21512 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2014-05-27 07:57:22 +00:00			`unsigned memcpy_length = length <= buffer_length ? length : buffer_length;`
			`v8::internal::MemCopy(data, buffer_, memcpy_length * sizeof(uint16_t));`
Remove Utf8InputBuffer R=yangguo@chromium.org BUG= Review URL: https://chromiumcodereview.appspot.com/11649018 Patch from Dan Carney <dcarney@google.com>. git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@13248 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2012-12-20 09:20:37 +00:00			`if (length <= buffer_length) return length;`
			`ASSERT(unbuffered_start_ != NULL);`
			`// Copy the rest the slow way.`
			`WriteUtf16Slow(unbuffered_start_,`
			`data + buffer_length,`
			`length - buffer_length);`
			`return length;`
Initial export. git-svn-id: http://v8.googlecode.com/svn/trunk@2 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2008-07-03 15:10:15 +00:00			`}`

			`} // namespace unibrow`

Cleanup include guards: - Fix some typos / guards that didn't match the filename. - Fix some style inconsistencies. - Add guards to files that were missing them. - Add the directory name to the guard. Review URL: http://codereview.chromium.org/99343 git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@1845 ce2b1a6d-e550-0410-aec6-3dcde31c8c00 2009-05-04 13:36:43 +00:00			`#endif // V8_UNICODE_INL_H_`