scuffed-code/icu4c/source/i18n/tzfmt.cpp

2877 lines
94 KiB
C++
Raw Normal View History

// Copyright (C) 2016 and later: Unicode, Inc. and others.
// License & terms of use: http://www.unicode.org/copyright.html
/*
*******************************************************************************
* Copyright (C) 2011-2015, International Business Machines Corporation and
* others. All Rights Reserved.
*******************************************************************************
*/
#include "unicode/utypes.h"
#if !UCONFIG_NO_FORMATTING
#include "unicode/calendar.h"
#include "unicode/tzfmt.h"
#include "unicode/numsys.h"
#include "unicode/uchar.h"
#include "unicode/udat.h"
#include "tzgnames.h"
#include "cmemory.h"
#include "cstring.h"
#include "putilimp.h"
#include "uassert.h"
#include "ucln_in.h"
#include "umutex.h"
#include "uresimp.h"
#include "ureslocs.h"
#include "uvector.h"
#include "zonemeta.h"
#include "tznames_impl.h" // TextTrieMap
U_NAMESPACE_BEGIN
// Bit flags used by the parse method.
// The order must match UTimeZoneFormatStyle enum.
#define ISO_Z_STYLE_FLAG 0x0080
#define ISO_LOCAL_STYLE_FLAG 0x0100
static const int16_t STYLE_PARSE_FLAGS[] = {
0x0001, // UTZFMT_STYLE_GENERIC_LOCATION,
0x0002, // UTZFMT_STYLE_GENERIC_LONG,
0x0004, // UTZFMT_STYLE_GENERIC_SHORT,
0x0008, // UTZFMT_STYLE_SPECIFIC_LONG,
0x0010, // UTZFMT_STYLE_SPECIFIC_SHORT,
0x0020, // UTZFMT_STYLE_LOCALIZED_GMT,
0x0040, // UTZFMT_STYLE_LOCALIZED_GMT_SHORT,
ISO_Z_STYLE_FLAG, // UTZFMT_STYLE_ISO_BASIC_SHORT,
ISO_LOCAL_STYLE_FLAG, // UTZFMT_STYLE_ISO_BASIC_LOCAL_SHORT,
ISO_Z_STYLE_FLAG, // UTZFMT_STYLE_ISO_BASIC_FIXED,
ISO_LOCAL_STYLE_FLAG, // UTZFMT_STYLE_ISO_BASIC_LOCAL_FIXED,
ISO_Z_STYLE_FLAG, // UTZFMT_STYLE_ISO_BASIC_FULL,
ISO_LOCAL_STYLE_FLAG, // UTZFMT_STYLE_ISO_BASIC_LOCAL_FULL,
ISO_Z_STYLE_FLAG, // UTZFMT_STYLE_ISO_EXTENDED_FIXED,
ISO_LOCAL_STYLE_FLAG, // UTZFMT_STYLE_ISO_EXTENDED_LOCAL_FIXED,
ISO_Z_STYLE_FLAG, // UTZFMT_STYLE_ISO_EXTENDED_FULL,
ISO_LOCAL_STYLE_FLAG, // UTZFMT_STYLE_ISO_EXTENDED_LOCAL_FULL,
0x0200, // UTZFMT_STYLE_ZONE_ID,
0x0400, // UTZFMT_STYLE_ZONE_ID_SHORT,
0x0800 // UTZFMT_STYLE_EXEMPLAR_LOCATION
};
static const char gZoneStringsTag[] = "zoneStrings";
static const char gGmtFormatTag[]= "gmtFormat";
static const char gGmtZeroFormatTag[] = "gmtZeroFormat";
static const char gHourFormatTag[]= "hourFormat";
static const UChar TZID_GMT[] = {0x0045, 0x0074, 0x0063, 0x002F, 0x0047, 0x004D, 0x0054, 0}; // Etc/GMT
static const UChar UNKNOWN_ZONE_ID[] = {
0x0045, 0x0074, 0x0063, 0x002F, 0x0055, 0x006E, 0x006B, 0x006E, 0x006F, 0x0077, 0x006E, 0}; // Etc/Unknown
static const UChar UNKNOWN_SHORT_ZONE_ID[] = {0x0075, 0x006E, 0x006B, 0}; // unk
static const UChar UNKNOWN_LOCATION[] = {0x0055, 0x006E, 0x006B, 0x006E, 0x006F, 0x0077, 0x006E, 0}; // Unknown
static const UChar DEFAULT_GMT_PATTERN[] = {0x0047, 0x004D, 0x0054, 0x007B, 0x0030, 0x007D, 0}; // GMT{0}
//static const UChar DEFAULT_GMT_ZERO[] = {0x0047, 0x004D, 0x0054, 0}; // GMT
static const UChar DEFAULT_GMT_POSITIVE_HM[] = {0x002B, 0x0048, 0x003A, 0x006D, 0x006D, 0}; // +H:mm
static const UChar DEFAULT_GMT_POSITIVE_HMS[] = {0x002B, 0x0048, 0x003A, 0x006D, 0x006D, 0x003A, 0x0073, 0x0073, 0}; // +H:mm:ss
static const UChar DEFAULT_GMT_NEGATIVE_HM[] = {0x002D, 0x0048, 0x003A, 0x006D, 0x006D, 0}; // -H:mm
static const UChar DEFAULT_GMT_NEGATIVE_HMS[] = {0x002D, 0x0048, 0x003A, 0x006D, 0x006D, 0x003A, 0x0073, 0x0073, 0}; // -H:mm:ss
static const UChar DEFAULT_GMT_POSITIVE_H[] = {0x002B, 0x0048, 0}; // +H
static const UChar DEFAULT_GMT_NEGATIVE_H[] = {0x002D, 0x0048, 0}; // -H
static const UChar32 DEFAULT_GMT_DIGITS[] = {
0x0030, 0x0031, 0x0032, 0x0033, 0x0034,
0x0035, 0x0036, 0x0037, 0x0038, 0x0039
};
static const UChar DEFAULT_GMT_OFFSET_SEP = 0x003A; // ':'
static const UChar ARG0[] = {0x007B, 0x0030, 0x007D}; // "{0}"
static const int32_t ARG0_LEN = 3;
static const UChar DEFAULT_GMT_OFFSET_MINUTE_PATTERN[] = {0x006D, 0x006D, 0}; // "mm"
static const UChar DEFAULT_GMT_OFFSET_SECOND_PATTERN[] = {0x0073, 0x0073, 0}; // "ss"
static const UChar ALT_GMT_STRINGS[][4] = {
{0x0047, 0x004D, 0x0054, 0}, // GMT
{0x0055, 0x0054, 0x0043, 0}, // UTC
{0x0055, 0x0054, 0, 0}, // UT
{0, 0, 0, 0}
};
// Order of GMT offset pattern parsing, *_HMS must be evaluated first
// because *_HM is most likely a substring of *_HMS
static const int32_t PARSE_GMT_OFFSET_TYPES[] = {
UTZFMT_PAT_POSITIVE_HMS,
UTZFMT_PAT_NEGATIVE_HMS,
UTZFMT_PAT_POSITIVE_HM,
UTZFMT_PAT_NEGATIVE_HM,
UTZFMT_PAT_POSITIVE_H,
UTZFMT_PAT_NEGATIVE_H,
-1
};
static const UChar SINGLEQUOTE = 0x0027;
static const UChar PLUS = 0x002B;
static const UChar MINUS = 0x002D;
static const UChar ISO8601_UTC = 0x005A; // 'Z'
static const UChar ISO8601_SEP = 0x003A; // ':'
static const int32_t MILLIS_PER_HOUR = 60 * 60 * 1000;
static const int32_t MILLIS_PER_MINUTE = 60 * 1000;
static const int32_t MILLIS_PER_SECOND = 1000;
// Maximum offset (exclusive) in millisecond supported by offset formats
static int32_t MAX_OFFSET = 24 * MILLIS_PER_HOUR;
// Maximum values for GMT offset fields
static const int32_t MAX_OFFSET_HOUR = 23;
static const int32_t MAX_OFFSET_MINUTE = 59;
static const int32_t MAX_OFFSET_SECOND = 59;
static const int32_t UNKNOWN_OFFSET = 0x7FFFFFFF;
static const int32_t ALL_SIMPLE_NAME_TYPES = UTZNM_LONG_STANDARD | UTZNM_LONG_DAYLIGHT | UTZNM_SHORT_STANDARD | UTZNM_SHORT_DAYLIGHT | UTZNM_EXEMPLAR_LOCATION;
static const int32_t ALL_GENERIC_NAME_TYPES = UTZGNM_LOCATION | UTZGNM_LONG | UTZGNM_SHORT;
#define DIGIT_VAL(c) (0x0030 <= (c) && (c) <= 0x0039 ? (c) - 0x0030 : -1)
#define MAX_OFFSET_DIGITS 6
// Time Zone ID/Short ID trie
static TextTrieMap *gZoneIdTrie = NULL;
static icu::UInitOnce gZoneIdTrieInitOnce = U_INITONCE_INITIALIZER;
static TextTrieMap *gShortZoneIdTrie = NULL;
static icu::UInitOnce gShortZoneIdTrieInitOnce = U_INITONCE_INITIALIZER;
static UMutex gLock = U_MUTEX_INITIALIZER;
U_CDECL_BEGIN
/**
* Cleanup callback func
*/
static UBool U_CALLCONV tzfmt_cleanup(void)
{
if (gZoneIdTrie != NULL) {
delete gZoneIdTrie;
}
gZoneIdTrie = NULL;
gZoneIdTrieInitOnce.reset();
if (gShortZoneIdTrie != NULL) {
delete gShortZoneIdTrie;
}
gShortZoneIdTrie = NULL;
gShortZoneIdTrieInitOnce.reset();
return TRUE;
}
U_CDECL_END
// ------------------------------------------------------------------
// GMTOffsetField
//
// This class represents a localized GMT offset pattern
// item and used by TimeZoneFormat
// ------------------------------------------------------------------
class GMTOffsetField : public UMemory {
public:
enum FieldType {
TEXT = 0,
HOUR = 1,
MINUTE = 2,
SECOND = 4
};
virtual ~GMTOffsetField();
static GMTOffsetField* createText(const UnicodeString& text, UErrorCode& status);
static GMTOffsetField* createTimeField(FieldType type, uint8_t width, UErrorCode& status);
static UBool isValid(FieldType type, int32_t width);
static FieldType getTypeByLetter(UChar ch);
FieldType getType() const;
uint8_t getWidth() const;
const UChar* getPatternText(void) const;
private:
UChar* fText;
FieldType fType;
uint8_t fWidth;
GMTOffsetField();
};
GMTOffsetField::GMTOffsetField()
: fText(NULL), fType(TEXT), fWidth(0) {
}
GMTOffsetField::~GMTOffsetField() {
if (fText) {
uprv_free(fText);
}
}
GMTOffsetField*
GMTOffsetField::createText(const UnicodeString& text, UErrorCode& status) {
if (U_FAILURE(status)) {
return NULL;
}
GMTOffsetField* result = new GMTOffsetField();
if (result == NULL) {
status = U_MEMORY_ALLOCATION_ERROR;
return NULL;
}
int32_t len = text.length();
result->fText = (UChar*)uprv_malloc((len + 1) * sizeof(UChar));
if (result->fText == NULL) {
status = U_MEMORY_ALLOCATION_ERROR;
delete result;
return NULL;
}
u_strncpy(result->fText, text.getBuffer(), len);
result->fText[len] = 0;
result->fType = TEXT;
return result;
}
GMTOffsetField*
GMTOffsetField::createTimeField(FieldType type, uint8_t width, UErrorCode& status) {
U_ASSERT(type != TEXT);
if (U_FAILURE(status)) {
return NULL;
}
GMTOffsetField* result = new GMTOffsetField();
if (result == NULL) {
status = U_MEMORY_ALLOCATION_ERROR;
return NULL;
}
result->fType = type;
result->fWidth = width;
return result;
}
UBool
GMTOffsetField::isValid(FieldType type, int32_t width) {
switch (type) {
case HOUR:
return (width == 1 || width == 2);
case MINUTE:
case SECOND:
return (width == 2);
default:
U_ASSERT(FALSE);
}
return (width > 0);
}
GMTOffsetField::FieldType
GMTOffsetField::getTypeByLetter(UChar ch) {
if (ch == 0x0048 /* H */) {
return HOUR;
} else if (ch == 0x006D /* m */) {
return MINUTE;
} else if (ch == 0x0073 /* s */) {
return SECOND;
}
return TEXT;
}
inline GMTOffsetField::FieldType
GMTOffsetField::getType() const {
return fType;
}
inline uint8_t
GMTOffsetField::getWidth() const {
return fWidth;
}
inline const UChar*
GMTOffsetField::getPatternText(void) const {
return fText;
}
U_CDECL_BEGIN
static void U_CALLCONV
deleteGMTOffsetField(void *obj) {
delete static_cast<GMTOffsetField *>(obj);
}
U_CDECL_END
// ------------------------------------------------------------------
// TimeZoneFormat
// ------------------------------------------------------------------
UOBJECT_DEFINE_RTTI_IMPLEMENTATION(TimeZoneFormat)
TimeZoneFormat::TimeZoneFormat(const Locale& locale, UErrorCode& status)
: fLocale(locale), fTimeZoneNames(NULL), fTimeZoneGenericNames(NULL),
fDefParseOptionFlags(0), fTZDBTimeZoneNames(NULL) {
for (int32_t i = 0; i < UTZFMT_PAT_COUNT; i++) {
fGMTOffsetPatternItems[i] = NULL;
}
const char* region = fLocale.getCountry();
int32_t regionLen = uprv_strlen(region);
if (regionLen == 0) {
char loc[ULOC_FULLNAME_CAPACITY];
uloc_addLikelySubtags(fLocale.getName(), loc, sizeof(loc), &status);
regionLen = uloc_getCountry(loc, fTargetRegion, sizeof(fTargetRegion), &status);
if (U_SUCCESS(status)) {
fTargetRegion[regionLen] = 0;
} else {
return;
}
} else if (regionLen < (int32_t)sizeof(fTargetRegion)) {
uprv_strcpy(fTargetRegion, region);
} else {
fTargetRegion[0] = 0;
}
fTimeZoneNames = TimeZoneNames::createInstance(locale, status);
// fTimeZoneGenericNames is lazily instantiated
if (U_FAILURE(status)) {
return;
}
const UChar* gmtPattern = NULL;
const UChar* hourFormats = NULL;
UResourceBundle *zoneBundle = ures_open(U_ICUDATA_ZONE, locale.getName(), &status);
UResourceBundle *zoneStringsArray = ures_getByKeyWithFallback(zoneBundle, gZoneStringsTag, NULL, &status);
if (U_SUCCESS(status)) {
const UChar* resStr;
int32_t len;
resStr = ures_getStringByKeyWithFallback(zoneStringsArray, gGmtFormatTag, &len, &status);
if (len > 0) {
gmtPattern = resStr;
}
resStr = ures_getStringByKeyWithFallback(zoneStringsArray, gGmtZeroFormatTag, &len, &status);
if (len > 0) {
fGMTZeroFormat.setTo(TRUE, resStr, len);
}
resStr = ures_getStringByKeyWithFallback(zoneStringsArray, gHourFormatTag, &len, &status);
if (len > 0) {
hourFormats = resStr;
}
ures_close(zoneStringsArray);
ures_close(zoneBundle);
}
if (gmtPattern == NULL) {
gmtPattern = DEFAULT_GMT_PATTERN;
}
initGMTPattern(UnicodeString(TRUE, gmtPattern, -1), status);
UBool useDefaultOffsetPatterns = TRUE;
if (hourFormats) {
UChar *sep = u_strchr(hourFormats, (UChar)0x003B /* ';' */);
if (sep != NULL) {
UErrorCode tmpStatus = U_ZERO_ERROR;
fGMTOffsetPatterns[UTZFMT_PAT_POSITIVE_HM].setTo(FALSE, hourFormats, (int32_t)(sep - hourFormats));
fGMTOffsetPatterns[UTZFMT_PAT_NEGATIVE_HM].setTo(TRUE, sep + 1, -1);
expandOffsetPattern(fGMTOffsetPatterns[UTZFMT_PAT_POSITIVE_HM], fGMTOffsetPatterns[UTZFMT_PAT_POSITIVE_HMS], tmpStatus);
expandOffsetPattern(fGMTOffsetPatterns[UTZFMT_PAT_NEGATIVE_HM], fGMTOffsetPatterns[UTZFMT_PAT_NEGATIVE_HMS], tmpStatus);
truncateOffsetPattern(fGMTOffsetPatterns[UTZFMT_PAT_POSITIVE_HM], fGMTOffsetPatterns[UTZFMT_PAT_POSITIVE_H], tmpStatus);
truncateOffsetPattern(fGMTOffsetPatterns[UTZFMT_PAT_NEGATIVE_HM], fGMTOffsetPatterns[UTZFMT_PAT_NEGATIVE_H], tmpStatus);
if (U_SUCCESS(tmpStatus)) {
useDefaultOffsetPatterns = FALSE;
}
}
}
if (useDefaultOffsetPatterns) {
fGMTOffsetPatterns[UTZFMT_PAT_POSITIVE_H].setTo(TRUE, DEFAULT_GMT_POSITIVE_H, -1);
fGMTOffsetPatterns[UTZFMT_PAT_POSITIVE_HM].setTo(TRUE, DEFAULT_GMT_POSITIVE_HM, -1);
fGMTOffsetPatterns[UTZFMT_PAT_POSITIVE_HMS].setTo(TRUE, DEFAULT_GMT_POSITIVE_HMS, -1);
fGMTOffsetPatterns[UTZFMT_PAT_NEGATIVE_H].setTo(TRUE, DEFAULT_GMT_NEGATIVE_H, -1);
fGMTOffsetPatterns[UTZFMT_PAT_NEGATIVE_HM].setTo(TRUE, DEFAULT_GMT_NEGATIVE_HM, -1);
fGMTOffsetPatterns[UTZFMT_PAT_NEGATIVE_HMS].setTo(TRUE, DEFAULT_GMT_NEGATIVE_HMS, -1);
}
initGMTOffsetPatterns(status);
NumberingSystem* ns = NumberingSystem::createInstance(locale, status);
UBool useDefDigits = TRUE;
if (ns && !ns->isAlgorithmic()) {
UnicodeString digits = ns->getDescription();
useDefDigits = !toCodePoints(digits, fGMTOffsetDigits, 10);
}
if (useDefDigits) {
uprv_memcpy(fGMTOffsetDigits, DEFAULT_GMT_DIGITS, sizeof(UChar32) * 10);
}
delete ns;
}
TimeZoneFormat::TimeZoneFormat(const TimeZoneFormat& other)
: Format(other), fTimeZoneNames(NULL), fTimeZoneGenericNames(NULL),
fTZDBTimeZoneNames(NULL) {
for (int32_t i = 0; i < UTZFMT_PAT_COUNT; i++) {
fGMTOffsetPatternItems[i] = NULL;
}
*this = other;
}
TimeZoneFormat::~TimeZoneFormat() {
delete fTimeZoneNames;
delete fTimeZoneGenericNames;
delete fTZDBTimeZoneNames;
for (int32_t i = 0; i < UTZFMT_PAT_COUNT; i++) {
delete fGMTOffsetPatternItems[i];
}
}
TimeZoneFormat&
TimeZoneFormat::operator=(const TimeZoneFormat& other) {
if (this == &other) {
return *this;
}
delete fTimeZoneNames;
delete fTimeZoneGenericNames;
fTimeZoneGenericNames = NULL;
delete fTZDBTimeZoneNames;
fTZDBTimeZoneNames = NULL;
fLocale = other.fLocale;
uprv_memcpy(fTargetRegion, other.fTargetRegion, sizeof(fTargetRegion));
fTimeZoneNames = other.fTimeZoneNames->clone();
if (other.fTimeZoneGenericNames) {
// TODO: this test has dubious thread safety.
fTimeZoneGenericNames = other.fTimeZoneGenericNames->clone();
}
fGMTPattern = other.fGMTPattern;
fGMTPatternPrefix = other.fGMTPatternPrefix;
fGMTPatternSuffix = other.fGMTPatternSuffix;
UErrorCode status = U_ZERO_ERROR;
for (int32_t i = 0; i < UTZFMT_PAT_COUNT; i++) {
fGMTOffsetPatterns[i] = other.fGMTOffsetPatterns[i];
delete fGMTOffsetPatternItems[i];
fGMTOffsetPatternItems[i] = NULL;
}
initGMTOffsetPatterns(status);
U_ASSERT(U_SUCCESS(status));
fGMTZeroFormat = other.fGMTZeroFormat;
uprv_memcpy(fGMTOffsetDigits, other.fGMTOffsetDigits, sizeof(fGMTOffsetDigits));
fDefParseOptionFlags = other.fDefParseOptionFlags;
return *this;
}
UBool
TimeZoneFormat::operator==(const Format& other) const {
TimeZoneFormat* tzfmt = (TimeZoneFormat*)&other;
UBool isEqual =
fLocale == tzfmt->fLocale
&& fGMTPattern == tzfmt->fGMTPattern
&& fGMTZeroFormat == tzfmt->fGMTZeroFormat
&& *fTimeZoneNames == *tzfmt->fTimeZoneNames;
for (int32_t i = 0; i < UTZFMT_PAT_COUNT && isEqual; i++) {
isEqual = fGMTOffsetPatterns[i] == tzfmt->fGMTOffsetPatterns[i];
}
for (int32_t i = 0; i < 10 && isEqual; i++) {
isEqual = fGMTOffsetDigits[i] == tzfmt->fGMTOffsetDigits[i];
}
// TODO
// Check fTimeZoneGenericNames. For now,
// if fTimeZoneNames is same, fTimeZoneGenericNames should
// be also equivalent.
return isEqual;
}
Format*
TimeZoneFormat::clone() const {
return new TimeZoneFormat(*this);
}
TimeZoneFormat* U_EXPORT2
TimeZoneFormat::createInstance(const Locale& locale, UErrorCode& status) {
TimeZoneFormat* tzfmt = new TimeZoneFormat(locale, status);
if (U_SUCCESS(status)) {
return tzfmt;
}
delete tzfmt;
return NULL;
}
// ------------------------------------------------------------------
// Setter and Getter
const TimeZoneNames*
TimeZoneFormat::getTimeZoneNames() const {
return (const TimeZoneNames*)fTimeZoneNames;
}
void
TimeZoneFormat::adoptTimeZoneNames(TimeZoneNames *tznames) {
delete fTimeZoneNames;
fTimeZoneNames = tznames;
// TODO - We should also update fTimeZoneGenericNames
}
void
TimeZoneFormat::setTimeZoneNames(const TimeZoneNames &tznames) {
delete fTimeZoneNames;
fTimeZoneNames = tznames.clone();
// TODO - We should also update fTimeZoneGenericNames
}
void
TimeZoneFormat::setDefaultParseOptions(uint32_t flags) {
fDefParseOptionFlags = flags;
}
uint32_t
TimeZoneFormat::getDefaultParseOptions(void) const {
return fDefParseOptionFlags;
}
UnicodeString&
TimeZoneFormat::getGMTPattern(UnicodeString& pattern) const {
return pattern.setTo(fGMTPattern);
}
void
TimeZoneFormat::setGMTPattern(const UnicodeString& pattern, UErrorCode& status) {
initGMTPattern(pattern, status);
}
UnicodeString&
TimeZoneFormat::getGMTOffsetPattern(UTimeZoneFormatGMTOffsetPatternType type, UnicodeString& pattern) const {
return pattern.setTo(fGMTOffsetPatterns[type]);
}
void
TimeZoneFormat::setGMTOffsetPattern(UTimeZoneFormatGMTOffsetPatternType type, const UnicodeString& pattern, UErrorCode& status) {
if (U_FAILURE(status)) {
return;
}
if (pattern == fGMTOffsetPatterns[type]) {
// No need to reset
return;
}
OffsetFields required = FIELDS_HM;
switch (type) {
case UTZFMT_PAT_POSITIVE_H:
case UTZFMT_PAT_NEGATIVE_H:
required = FIELDS_H;
break;
case UTZFMT_PAT_POSITIVE_HM:
case UTZFMT_PAT_NEGATIVE_HM:
required = FIELDS_HM;
break;
case UTZFMT_PAT_POSITIVE_HMS:
case UTZFMT_PAT_NEGATIVE_HMS:
required = FIELDS_HMS;
break;
default:
U_ASSERT(FALSE);
break;
}
UVector* patternItems = parseOffsetPattern(pattern, required, status);
if (patternItems == NULL) {
return;
}
fGMTOffsetPatterns[type].setTo(pattern);
delete fGMTOffsetPatternItems[type];
fGMTOffsetPatternItems[type] = patternItems;
checkAbuttingHoursAndMinutes();
}
UnicodeString&
TimeZoneFormat::getGMTOffsetDigits(UnicodeString& digits) const {
digits.remove();
for (int32_t i = 0; i < 10; i++) {
digits.append(fGMTOffsetDigits[i]);
}
return digits;
}
void
TimeZoneFormat::setGMTOffsetDigits(const UnicodeString& digits, UErrorCode& status) {
if (U_FAILURE(status)) {
return;
}
UChar32 digitArray[10];
if (!toCodePoints(digits, digitArray, 10)) {
status = U_ILLEGAL_ARGUMENT_ERROR;
return;
}
uprv_memcpy(fGMTOffsetDigits, digitArray, sizeof(UChar32)*10);
}
UnicodeString&
TimeZoneFormat::getGMTZeroFormat(UnicodeString& gmtZeroFormat) const {
return gmtZeroFormat.setTo(fGMTZeroFormat);
}
void
TimeZoneFormat::setGMTZeroFormat(const UnicodeString& gmtZeroFormat, UErrorCode& status) {
if (U_SUCCESS(status)) {
if (gmtZeroFormat.isEmpty()) {
status = U_ILLEGAL_ARGUMENT_ERROR;
} else if (gmtZeroFormat != fGMTZeroFormat) {
fGMTZeroFormat.setTo(gmtZeroFormat);
}
}
}
// ------------------------------------------------------------------
// Format and Parse
UnicodeString&
TimeZoneFormat::format(UTimeZoneFormatStyle style, const TimeZone& tz, UDate date,
UnicodeString& name, UTimeZoneFormatTimeType* timeType /* = NULL */) const {
if (timeType) {
*timeType = UTZFMT_TIME_TYPE_UNKNOWN;
}
UBool noOffsetFormatFallback = FALSE;
switch (style) {
case UTZFMT_STYLE_GENERIC_LOCATION:
formatGeneric(tz, UTZGNM_LOCATION, date, name);
break;
case UTZFMT_STYLE_GENERIC_LONG:
formatGeneric(tz, UTZGNM_LONG, date, name);
break;
case UTZFMT_STYLE_GENERIC_SHORT:
formatGeneric(tz, UTZGNM_SHORT, date, name);
break;
case UTZFMT_STYLE_SPECIFIC_LONG:
formatSpecific(tz, UTZNM_LONG_STANDARD, UTZNM_LONG_DAYLIGHT, date, name, timeType);
break;
case UTZFMT_STYLE_SPECIFIC_SHORT:
formatSpecific(tz, UTZNM_SHORT_STANDARD, UTZNM_SHORT_DAYLIGHT, date, name, timeType);
break;
case UTZFMT_STYLE_ZONE_ID:
tz.getID(name);
noOffsetFormatFallback = TRUE;
break;
case UTZFMT_STYLE_ZONE_ID_SHORT:
{
const UChar* shortID = ZoneMeta::getShortID(tz);
if (shortID == NULL) {
shortID = UNKNOWN_SHORT_ZONE_ID;
}
name.setTo(shortID, -1);
}
noOffsetFormatFallback = TRUE;
break;
case UTZFMT_STYLE_EXEMPLAR_LOCATION:
formatExemplarLocation(tz, name);
noOffsetFormatFallback = TRUE;
break;
default:
// will be handled below
break;
}
if (name.isEmpty() && !noOffsetFormatFallback) {
UErrorCode status = U_ZERO_ERROR;
int32_t rawOffset, dstOffset;
tz.getOffset(date, FALSE, rawOffset, dstOffset, status);
int32_t offset = rawOffset + dstOffset;
if (U_SUCCESS(status)) {
switch (style) {
case UTZFMT_STYLE_GENERIC_LOCATION:
case UTZFMT_STYLE_GENERIC_LONG:
case UTZFMT_STYLE_SPECIFIC_LONG:
case UTZFMT_STYLE_LOCALIZED_GMT:
formatOffsetLocalizedGMT(offset, name, status);
break;
case UTZFMT_STYLE_GENERIC_SHORT:
case UTZFMT_STYLE_SPECIFIC_SHORT:
case UTZFMT_STYLE_LOCALIZED_GMT_SHORT:
formatOffsetShortLocalizedGMT(offset, name, status);
break;
case UTZFMT_STYLE_ISO_BASIC_SHORT:
formatOffsetISO8601Basic(offset, TRUE, TRUE, TRUE, name, status);
break;
case UTZFMT_STYLE_ISO_BASIC_LOCAL_SHORT:
formatOffsetISO8601Basic(offset, FALSE, TRUE, TRUE, name, status);
break;
case UTZFMT_STYLE_ISO_BASIC_FIXED:
formatOffsetISO8601Basic(offset, TRUE, FALSE, TRUE, name, status);
break;
case UTZFMT_STYLE_ISO_BASIC_LOCAL_FIXED:
formatOffsetISO8601Basic(offset, FALSE, FALSE, TRUE, name, status);
break;
case UTZFMT_STYLE_ISO_EXTENDED_FIXED:
formatOffsetISO8601Extended(offset, TRUE, FALSE, TRUE, name, status);
break;
case UTZFMT_STYLE_ISO_EXTENDED_LOCAL_FIXED:
formatOffsetISO8601Extended(offset, FALSE, FALSE, TRUE, name, status);
break;
case UTZFMT_STYLE_ISO_BASIC_FULL:
formatOffsetISO8601Basic(offset, TRUE, FALSE, FALSE, name, status);
break;
case UTZFMT_STYLE_ISO_BASIC_LOCAL_FULL:
formatOffsetISO8601Basic(offset, FALSE, FALSE, FALSE, name, status);
break;
case UTZFMT_STYLE_ISO_EXTENDED_FULL:
formatOffsetISO8601Extended(offset, TRUE, FALSE, FALSE, name, status);
break;
case UTZFMT_STYLE_ISO_EXTENDED_LOCAL_FULL:
formatOffsetISO8601Extended(offset, FALSE, FALSE, FALSE, name, status);
break;
default:
// UTZFMT_STYLE_ZONE_ID, UTZFMT_STYLE_ZONE_ID_SHORT, UTZFMT_STYLE_EXEMPLAR_LOCATION
break;
}
if (timeType) {
*timeType = (dstOffset != 0) ? UTZFMT_TIME_TYPE_DAYLIGHT : UTZFMT_TIME_TYPE_STANDARD;
}
}
}
return name;
}
UnicodeString&
TimeZoneFormat::format(const Formattable& obj, UnicodeString& appendTo,
FieldPosition& pos, UErrorCode& status) const {
if (U_FAILURE(status)) {
return appendTo;
}
UDate date = Calendar::getNow();
if (obj.getType() == Formattable::kObject) {
const UObject* formatObj = obj.getObject();
const TimeZone* tz = dynamic_cast<const TimeZone*>(formatObj);
if (tz == NULL) {
const Calendar* cal = dynamic_cast<const Calendar*>(formatObj);
if (cal != NULL) {
tz = &cal->getTimeZone();
date = cal->getTime(status);
}
}
if (tz != NULL) {
int32_t rawOffset, dstOffset;
tz->getOffset(date, FALSE, rawOffset, dstOffset, status);
UChar buf[32];
UnicodeString result(buf, 0, UPRV_LENGTHOF(buf));
formatOffsetLocalizedGMT(rawOffset + dstOffset, result, status);
if (U_SUCCESS(status)) {
appendTo.append(result);
if (pos.getField() == UDAT_TIMEZONE_FIELD) {
pos.setBeginIndex(0);
pos.setEndIndex(result.length());
}
}
}
}
return appendTo;
}
TimeZone*
TimeZoneFormat::parse(UTimeZoneFormatStyle style, const UnicodeString& text, ParsePosition& pos,
UTimeZoneFormatTimeType* timeType /*= NULL*/) const {
return parse(style, text, pos, getDefaultParseOptions(), timeType);
}
TimeZone*
TimeZoneFormat::parse(UTimeZoneFormatStyle style, const UnicodeString& text, ParsePosition& pos,
int32_t parseOptions, UTimeZoneFormatTimeType* timeType /* = NULL */) const {
if (timeType) {
*timeType = UTZFMT_TIME_TYPE_UNKNOWN;
}
int32_t startIdx = pos.getIndex();
int32_t maxPos = text.length();
int32_t offset;
// Styles using localized GMT format as fallback
UBool fallbackLocalizedGMT =
(style == UTZFMT_STYLE_SPECIFIC_LONG || style == UTZFMT_STYLE_GENERIC_LONG || style == UTZFMT_STYLE_GENERIC_LOCATION);
UBool fallbackShortLocalizedGMT =
(style == UTZFMT_STYLE_SPECIFIC_SHORT || style == UTZFMT_STYLE_GENERIC_SHORT);
int32_t evaluated = 0; // bit flags representing already evaluated styles
ParsePosition tmpPos(startIdx);
int32_t parsedOffset = UNKNOWN_OFFSET; // stores successfully parsed offset for later use
int32_t parsedPos = -1; // stores successfully parsed offset position for later use
// Try localized GMT format first if necessary
if (fallbackLocalizedGMT || fallbackShortLocalizedGMT) {
UBool hasDigitOffset = FALSE;
offset = parseOffsetLocalizedGMT(text, tmpPos, fallbackShortLocalizedGMT, &hasDigitOffset);
if (tmpPos.getErrorIndex() == -1) {
// Even when the input text was successfully parsed as a localized GMT format text,
// we may still need to evaluate the specified style if -
// 1) GMT zero format was used, and
// 2) The input text was not completely processed
if (tmpPos.getIndex() == maxPos || hasDigitOffset) {
pos.setIndex(tmpPos.getIndex());
return createTimeZoneForOffset(offset);
}
parsedOffset = offset;
parsedPos = tmpPos.getIndex();
}
// Note: For now, no distinction between long/short localized GMT format in the parser.
// This might be changed in future.
// evaluated |= (fallbackLocalizedGMT ? STYLE_PARSE_FLAGS[UTZFMT_STYLE_LOCALIZED_GMT] : STYLE_PARSE_FLAGS[UTZFMT_STYLE_LOCALIZED_GMT_SHORT]);
evaluated |= STYLE_PARSE_FLAGS[UTZFMT_STYLE_LOCALIZED_GMT] | STYLE_PARSE_FLAGS[UTZFMT_STYLE_LOCALIZED_GMT_SHORT];
}
UErrorCode status = U_ZERO_ERROR;
UChar tzIDBuf[32];
UnicodeString tzID(tzIDBuf, 0, UPRV_LENGTHOF(tzIDBuf));
UBool parseTZDBAbbrev = ((parseOptions & UTZFMT_PARSE_OPTION_TZ_DATABASE_ABBREVIATIONS) != 0);
// Try the specified style
switch (style) {
case UTZFMT_STYLE_LOCALIZED_GMT:
{
tmpPos.setIndex(startIdx);
tmpPos.setErrorIndex(-1);
offset = parseOffsetLocalizedGMT(text, tmpPos);
if (tmpPos.getErrorIndex() == -1) {
pos.setIndex(tmpPos.getIndex());
return createTimeZoneForOffset(offset);
}
// Note: For now, no distinction between long/short localized GMT format in the parser.
// This might be changed in future.
evaluated |= STYLE_PARSE_FLAGS[UTZFMT_STYLE_LOCALIZED_GMT_SHORT];
break;
}
case UTZFMT_STYLE_LOCALIZED_GMT_SHORT:
{
tmpPos.setIndex(startIdx);
tmpPos.setErrorIndex(-1);
offset = parseOffsetShortLocalizedGMT(text, tmpPos);
if (tmpPos.getErrorIndex() == -1) {
pos.setIndex(tmpPos.getIndex());
return createTimeZoneForOffset(offset);
}
// Note: For now, no distinction between long/short localized GMT format in the parser.
// This might be changed in future.
evaluated |= STYLE_PARSE_FLAGS[UTZFMT_STYLE_LOCALIZED_GMT];
break;
}
case UTZFMT_STYLE_ISO_BASIC_SHORT:
case UTZFMT_STYLE_ISO_BASIC_FIXED:
case UTZFMT_STYLE_ISO_BASIC_FULL:
case UTZFMT_STYLE_ISO_EXTENDED_FIXED:
case UTZFMT_STYLE_ISO_EXTENDED_FULL:
{
tmpPos.setIndex(startIdx);
tmpPos.setErrorIndex(-1);
offset = parseOffsetISO8601(text, tmpPos);
if (tmpPos.getErrorIndex() == -1) {
pos.setIndex(tmpPos.getIndex());
return createTimeZoneForOffset(offset);
}
break;
}
case UTZFMT_STYLE_ISO_BASIC_LOCAL_SHORT:
case UTZFMT_STYLE_ISO_BASIC_LOCAL_FIXED:
case UTZFMT_STYLE_ISO_BASIC_LOCAL_FULL:
case UTZFMT_STYLE_ISO_EXTENDED_LOCAL_FIXED:
case UTZFMT_STYLE_ISO_EXTENDED_LOCAL_FULL:
{
tmpPos.setIndex(startIdx);
tmpPos.setErrorIndex(-1);
// Exclude the case of UTC Indicator "Z" here
UBool hasDigitOffset = FALSE;
offset = parseOffsetISO8601(text, tmpPos, FALSE, &hasDigitOffset);
if (tmpPos.getErrorIndex() == -1 && hasDigitOffset) {
pos.setIndex(tmpPos.getIndex());
return createTimeZoneForOffset(offset);
}
break;
}
case UTZFMT_STYLE_SPECIFIC_LONG:
case UTZFMT_STYLE_SPECIFIC_SHORT:
{
// Specific styles
int32_t nameTypes = 0;
if (style == UTZFMT_STYLE_SPECIFIC_LONG) {
nameTypes = (UTZNM_LONG_STANDARD | UTZNM_LONG_DAYLIGHT);
} else {
U_ASSERT(style == UTZFMT_STYLE_SPECIFIC_SHORT);
nameTypes = (UTZNM_SHORT_STANDARD | UTZNM_SHORT_DAYLIGHT);
}
LocalPointer<TimeZoneNames::MatchInfoCollection> specificMatches(fTimeZoneNames->find(text, startIdx, nameTypes, status));
if (U_FAILURE(status)) {
pos.setErrorIndex(startIdx);
return NULL;
}
if (!specificMatches.isNull()) {
int32_t matchIdx = -1;
int32_t matchPos = -1;
for (int32_t i = 0; i < specificMatches->size(); i++) {
matchPos = startIdx + specificMatches->getMatchLengthAt(i);
if (matchPos > parsedPos) {
matchIdx = i;
parsedPos = matchPos;
}
}
if (matchIdx >= 0) {
if (timeType) {
*timeType = getTimeType(specificMatches->getNameTypeAt(matchIdx));
}
pos.setIndex(matchPos);
getTimeZoneID(specificMatches.getAlias(), matchIdx, tzID);
U_ASSERT(!tzID.isEmpty());
return TimeZone::createTimeZone(tzID);
}
}
if (parseTZDBAbbrev && style == UTZFMT_STYLE_SPECIFIC_SHORT) {
U_ASSERT((nameTypes & UTZNM_SHORT_STANDARD) != 0);
U_ASSERT((nameTypes & UTZNM_SHORT_DAYLIGHT) != 0);
const TZDBTimeZoneNames *tzdbTimeZoneNames = getTZDBTimeZoneNames(status);
if (U_SUCCESS(status)) {
LocalPointer<TimeZoneNames::MatchInfoCollection> tzdbNameMatches(
tzdbTimeZoneNames->find(text, startIdx, nameTypes, status));
if (U_FAILURE(status)) {
pos.setErrorIndex(startIdx);
return NULL;
}
if (!tzdbNameMatches.isNull()) {
int32_t matchIdx = -1;
int32_t matchPos = -1;
for (int32_t i = 0; i < tzdbNameMatches->size(); i++) {
matchPos = startIdx + tzdbNameMatches->getMatchLengthAt(i);
if (matchPos > parsedPos) {
matchIdx = i;
parsedPos = matchPos;
}
}
if (matchIdx >= 0) {
if (timeType) {
*timeType = getTimeType(tzdbNameMatches->getNameTypeAt(matchIdx));
}
pos.setIndex(matchPos);
getTimeZoneID(tzdbNameMatches.getAlias(), matchIdx, tzID);
U_ASSERT(!tzID.isEmpty());
return TimeZone::createTimeZone(tzID);
}
}
}
}
break;
}
case UTZFMT_STYLE_GENERIC_LONG:
case UTZFMT_STYLE_GENERIC_SHORT:
case UTZFMT_STYLE_GENERIC_LOCATION:
{
int32_t genericNameTypes = 0;
switch (style) {
case UTZFMT_STYLE_GENERIC_LOCATION:
genericNameTypes = UTZGNM_LOCATION;
break;
case UTZFMT_STYLE_GENERIC_LONG:
genericNameTypes = UTZGNM_LONG | UTZGNM_LOCATION;
break;
case UTZFMT_STYLE_GENERIC_SHORT:
genericNameTypes = UTZGNM_SHORT | UTZGNM_LOCATION;
break;
default:
U_ASSERT(FALSE);
}
int32_t len = 0;
UTimeZoneFormatTimeType tt = UTZFMT_TIME_TYPE_UNKNOWN;
const TimeZoneGenericNames *gnames = getTimeZoneGenericNames(status);
if (U_SUCCESS(status)) {
len = gnames->findBestMatch(text, startIdx, genericNameTypes, tzID, tt, status);
}
if (U_FAILURE(status)) {
pos.setErrorIndex(startIdx);
return NULL;
}
if (len > 0) {
// Found a match
if (timeType) {
*timeType = tt;
}
pos.setIndex(startIdx + len);
U_ASSERT(!tzID.isEmpty());
return TimeZone::createTimeZone(tzID);
}
break;
}
case UTZFMT_STYLE_ZONE_ID:
{
tmpPos.setIndex(startIdx);
tmpPos.setErrorIndex(-1);
parseZoneID(text, tmpPos, tzID);
if (tmpPos.getErrorIndex() == -1) {
pos.setIndex(tmpPos.getIndex());
return TimeZone::createTimeZone(tzID);
}
break;
}
case UTZFMT_STYLE_ZONE_ID_SHORT:
{
tmpPos.setIndex(startIdx);
tmpPos.setErrorIndex(-1);
parseShortZoneID(text, tmpPos, tzID);
if (tmpPos.getErrorIndex() == -1) {
pos.setIndex(tmpPos.getIndex());
return TimeZone::createTimeZone(tzID);
}
break;
}
case UTZFMT_STYLE_EXEMPLAR_LOCATION:
{
tmpPos.setIndex(startIdx);
tmpPos.setErrorIndex(-1);
parseExemplarLocation(text, tmpPos, tzID);
if (tmpPos.getErrorIndex() == -1) {
pos.setIndex(tmpPos.getIndex());
return TimeZone::createTimeZone(tzID);
}
break;
}
}
evaluated |= STYLE_PARSE_FLAGS[style];
if (parsedPos > startIdx) {
// When the specified style is one of SPECIFIC_XXX or GENERIC_XXX, we tried to parse the input
// as localized GMT format earlier. If parsedOffset is positive, it means it was successfully
// parsed as localized GMT format, but offset digits were not detected (more specifically, GMT
// zero format). Then, it tried to find a match within the set of display names, but could not
// find a match. At this point, we can safely assume the input text contains the localized
// GMT format.
U_ASSERT(parsedOffset != UNKNOWN_OFFSET);
pos.setIndex(parsedPos);
return createTimeZoneForOffset(parsedOffset);
}
// Failed to parse the input text as the time zone format in the specified style.
// Check the longest match among other styles below.
UChar parsedIDBuf[32];
UnicodeString parsedID(parsedIDBuf, 0, UPRV_LENGTHOF(parsedIDBuf));
UTimeZoneFormatTimeType parsedTimeType = UTZFMT_TIME_TYPE_UNKNOWN;
U_ASSERT(parsedPos < 0);
U_ASSERT(parsedOffset == UNKNOWN_OFFSET);
// ISO 8601
if (parsedPos < maxPos &&
((evaluated & ISO_Z_STYLE_FLAG) == 0 || (evaluated & ISO_LOCAL_STYLE_FLAG) == 0)) {
tmpPos.setIndex(startIdx);
tmpPos.setErrorIndex(-1);
UBool hasDigitOffset = FALSE;
offset = parseOffsetISO8601(text, tmpPos, FALSE, &hasDigitOffset);
if (tmpPos.getErrorIndex() == -1) {
if (tmpPos.getIndex() == maxPos || hasDigitOffset) {
pos.setIndex(tmpPos.getIndex());
return createTimeZoneForOffset(offset);
}
// Note: When ISO 8601 format contains offset digits, it should not
// collide with other formats. However, ISO 8601 UTC format "Z" (single letter)
// may collide with other names. In this case, we need to evaluate other names.
if (parsedPos < tmpPos.getIndex()) {
parsedOffset = offset;
parsedID.setToBogus();
parsedTimeType = UTZFMT_TIME_TYPE_UNKNOWN;
parsedPos = tmpPos.getIndex();
U_ASSERT(parsedPos == startIdx + 1); // only when "Z" is used
}
}
}
// Localized GMT format
if (parsedPos < maxPos &&
(evaluated & STYLE_PARSE_FLAGS[UTZFMT_STYLE_LOCALIZED_GMT]) == 0) {
tmpPos.setIndex(startIdx);
tmpPos.setErrorIndex(-1);
UBool hasDigitOffset = FALSE;
offset = parseOffsetLocalizedGMT(text, tmpPos, FALSE, &hasDigitOffset);
if (tmpPos.getErrorIndex() == -1) {
if (tmpPos.getIndex() == maxPos || hasDigitOffset) {
pos.setIndex(tmpPos.getIndex());
return createTimeZoneForOffset(offset);
}
// Evaluate other names - see the comment earlier in this method.
if (parsedPos < tmpPos.getIndex()) {
parsedOffset = offset;
parsedID.setToBogus();
parsedTimeType = UTZFMT_TIME_TYPE_UNKNOWN;
parsedPos = tmpPos.getIndex();
}
}
}
if (parsedPos < maxPos &&
(evaluated & STYLE_PARSE_FLAGS[UTZFMT_STYLE_LOCALIZED_GMT_SHORT]) == 0) {
tmpPos.setIndex(startIdx);
tmpPos.setErrorIndex(-1);
UBool hasDigitOffset = FALSE;
offset = parseOffsetLocalizedGMT(text, tmpPos, TRUE, &hasDigitOffset);
if (tmpPos.getErrorIndex() == -1) {
if (tmpPos.getIndex() == maxPos || hasDigitOffset) {
pos.setIndex(tmpPos.getIndex());
return createTimeZoneForOffset(offset);
}
// Evaluate other names - see the comment earlier in this method.
if (parsedPos < tmpPos.getIndex()) {
parsedOffset = offset;
parsedID.setToBogus();
parsedTimeType = UTZFMT_TIME_TYPE_UNKNOWN;
parsedPos = tmpPos.getIndex();
}
}
}
// When ParseOption.ALL_STYLES is available, we also try to look all possible display names and IDs.
// For example, when style is GENERIC_LONG, "EST" (SPECIFIC_SHORT) is never
// used for America/New_York. With parseAllStyles true, this code parses "EST"
// as America/New_York.
// Note: Adding all possible names into the trie used by the implementation is quite heavy operation,
// which we want to avoid normally (note that we cache the trie, so this is applicable to the
// first time only as long as the cache does not expire).
if (parseOptions & UTZFMT_PARSE_OPTION_ALL_STYLES) {
// Try all specific names and exemplar location names
if (parsedPos < maxPos) {
LocalPointer<TimeZoneNames::MatchInfoCollection> specificMatches(fTimeZoneNames->find(text, startIdx, ALL_SIMPLE_NAME_TYPES, status));
if (U_FAILURE(status)) {
pos.setErrorIndex(startIdx);
return NULL;
}
int32_t specificMatchIdx = -1;
int32_t matchPos = -1;
if (!specificMatches.isNull()) {
for (int32_t i = 0; i < specificMatches->size(); i++) {
if (startIdx + specificMatches->getMatchLengthAt(i) > matchPos) {
specificMatchIdx = i;
matchPos = startIdx + specificMatches->getMatchLengthAt(i);
}
}
}
if (parsedPos < matchPos) {
U_ASSERT(specificMatchIdx >= 0);
parsedPos = matchPos;
getTimeZoneID(specificMatches.getAlias(), specificMatchIdx, parsedID);
parsedTimeType = getTimeType(specificMatches->getNameTypeAt(specificMatchIdx));
parsedOffset = UNKNOWN_OFFSET;
}
}
if (parseTZDBAbbrev && parsedPos < maxPos && (evaluated & STYLE_PARSE_FLAGS[UTZFMT_STYLE_SPECIFIC_SHORT]) == 0) {
const TZDBTimeZoneNames *tzdbTimeZoneNames = getTZDBTimeZoneNames(status);
if (U_SUCCESS(status)) {
LocalPointer<TimeZoneNames::MatchInfoCollection> tzdbNameMatches(
tzdbTimeZoneNames->find(text, startIdx, ALL_SIMPLE_NAME_TYPES, status));
if (U_FAILURE(status)) {
pos.setErrorIndex(startIdx);
return NULL;
}
int32_t tzdbNameMatchIdx = -1;
int32_t matchPos = -1;
if (!tzdbNameMatches.isNull()) {
for (int32_t i = 0; i < tzdbNameMatches->size(); i++) {
if (startIdx + tzdbNameMatches->getMatchLengthAt(i) > matchPos) {
tzdbNameMatchIdx = i;
matchPos = startIdx + tzdbNameMatches->getMatchLengthAt(i);
}
}
}
if (parsedPos < matchPos) {
U_ASSERT(tzdbNameMatchIdx >= 0);
parsedPos = matchPos;
getTimeZoneID(tzdbNameMatches.getAlias(), tzdbNameMatchIdx, parsedID);
parsedTimeType = getTimeType(tzdbNameMatches->getNameTypeAt(tzdbNameMatchIdx));
parsedOffset = UNKNOWN_OFFSET;
}
}
}
// Try generic names
if (parsedPos < maxPos) {
int32_t genMatchLen = -1;
UTimeZoneFormatTimeType tt = UTZFMT_TIME_TYPE_UNKNOWN;
const TimeZoneGenericNames *gnames = getTimeZoneGenericNames(status);
if (U_SUCCESS(status)) {
genMatchLen = gnames->findBestMatch(text, startIdx, ALL_GENERIC_NAME_TYPES, tzID, tt, status);
}
if (U_FAILURE(status)) {
pos.setErrorIndex(startIdx);
return NULL;
}
if (genMatchLen > 0 && parsedPos < startIdx + genMatchLen) {
parsedPos = startIdx + genMatchLen;
parsedID.setTo(tzID);
parsedTimeType = tt;
parsedOffset = UNKNOWN_OFFSET;
}
}
// Try time zone ID
if (parsedPos < maxPos && (evaluated & STYLE_PARSE_FLAGS[UTZFMT_STYLE_ZONE_ID]) == 0) {
tmpPos.setIndex(startIdx);
tmpPos.setErrorIndex(-1);
parseZoneID(text, tmpPos, tzID);
if (tmpPos.getErrorIndex() == -1 && parsedPos < tmpPos.getIndex()) {
parsedPos = tmpPos.getIndex();
parsedID.setTo(tzID);
parsedTimeType = UTZFMT_TIME_TYPE_UNKNOWN;
parsedOffset = UNKNOWN_OFFSET;
}
}
// Try short time zone ID
if (parsedPos < maxPos && (evaluated & STYLE_PARSE_FLAGS[UTZFMT_STYLE_ZONE_ID]) == 0) {
tmpPos.setIndex(startIdx);
tmpPos.setErrorIndex(-1);
parseShortZoneID(text, tmpPos, tzID);
if (tmpPos.getErrorIndex() == -1 && parsedPos < tmpPos.getIndex()) {
parsedPos = tmpPos.getIndex();
parsedID.setTo(tzID);
parsedTimeType = UTZFMT_TIME_TYPE_UNKNOWN;
parsedOffset = UNKNOWN_OFFSET;
}
}
}
if (parsedPos > startIdx) {
// Parsed successfully
TimeZone* parsedTZ;
if (parsedID.length() > 0) {
parsedTZ = TimeZone::createTimeZone(parsedID);
} else {
U_ASSERT(parsedOffset != UNKNOWN_OFFSET);
parsedTZ = createTimeZoneForOffset(parsedOffset);
}
if (timeType) {
*timeType = parsedTimeType;
}
pos.setIndex(parsedPos);
return parsedTZ;
}
pos.setErrorIndex(startIdx);
return NULL;
}
void
TimeZoneFormat::parseObject(const UnicodeString& source, Formattable& result,
ParsePosition& parse_pos) const {
result.adoptObject(parse(UTZFMT_STYLE_GENERIC_LOCATION, source, parse_pos, UTZFMT_PARSE_OPTION_ALL_STYLES));
}
// ------------------------------------------------------------------
// Private zone name format/parse implementation
UnicodeString&
TimeZoneFormat::formatGeneric(const TimeZone& tz, int32_t genType, UDate date, UnicodeString& name) const {
UErrorCode status = U_ZERO_ERROR;
const TimeZoneGenericNames* gnames = getTimeZoneGenericNames(status);
if (U_FAILURE(status)) {
name.setToBogus();
return name;
}
if (genType == UTZGNM_LOCATION) {
const UChar* canonicalID = ZoneMeta::getCanonicalCLDRID(tz);
if (canonicalID == NULL) {
name.setToBogus();
return name;
}
return gnames->getGenericLocationName(UnicodeString(TRUE, canonicalID, -1), name);
}
return gnames->getDisplayName(tz, (UTimeZoneGenericNameType)genType, date, name);
}
UnicodeString&
TimeZoneFormat::formatSpecific(const TimeZone& tz, UTimeZoneNameType stdType, UTimeZoneNameType dstType,
UDate date, UnicodeString& name, UTimeZoneFormatTimeType *timeType) const {
if (fTimeZoneNames == NULL) {
name.setToBogus();
return name;
}
UErrorCode status = U_ZERO_ERROR;
UBool isDaylight = tz.inDaylightTime(date, status);
const UChar* canonicalID = ZoneMeta::getCanonicalCLDRID(tz);
if (U_FAILURE(status) || canonicalID == NULL) {
name.setToBogus();
return name;
}
if (isDaylight) {
fTimeZoneNames->getDisplayName(UnicodeString(TRUE, canonicalID, -1), dstType, date, name);
} else {
fTimeZoneNames->getDisplayName(UnicodeString(TRUE, canonicalID, -1), stdType, date, name);
}
if (timeType && !name.isEmpty()) {
*timeType = isDaylight ? UTZFMT_TIME_TYPE_DAYLIGHT : UTZFMT_TIME_TYPE_STANDARD;
}
return name;
}
const TimeZoneGenericNames*
TimeZoneFormat::getTimeZoneGenericNames(UErrorCode& status) const {
if (U_FAILURE(status)) {
return NULL;
}
umtx_lock(&gLock);
if (fTimeZoneGenericNames == NULL) {
TimeZoneFormat *nonConstThis = const_cast<TimeZoneFormat *>(this);
nonConstThis->fTimeZoneGenericNames = TimeZoneGenericNames::createInstance(fLocale, status);
}
umtx_unlock(&gLock);
return fTimeZoneGenericNames;
}
const TZDBTimeZoneNames*
TimeZoneFormat::getTZDBTimeZoneNames(UErrorCode& status) const {
if (U_FAILURE(status)) {
return NULL;
}
umtx_lock(&gLock);
if (fTZDBTimeZoneNames == NULL) {
TZDBTimeZoneNames *tzdbNames = new TZDBTimeZoneNames(fLocale);
if (tzdbNames == NULL) {
status = U_MEMORY_ALLOCATION_ERROR;
} else {
TimeZoneFormat *nonConstThis = const_cast<TimeZoneFormat *>(this);
nonConstThis->fTZDBTimeZoneNames = tzdbNames;
}
}
umtx_unlock(&gLock);
return fTZDBTimeZoneNames;
}
UnicodeString&
TimeZoneFormat::formatExemplarLocation(const TimeZone& tz, UnicodeString& name) const {
UChar locationBuf[64];
UnicodeString location(locationBuf, 0, UPRV_LENGTHOF(locationBuf));
const UChar* canonicalID = ZoneMeta::getCanonicalCLDRID(tz);
if (canonicalID) {
fTimeZoneNames->getExemplarLocationName(UnicodeString(TRUE, canonicalID, -1), location);
}
if (location.length() > 0) {
name.setTo(location);
} else {
// Use "unknown" location
fTimeZoneNames->getExemplarLocationName(UnicodeString(TRUE, UNKNOWN_ZONE_ID, -1), location);
if (location.length() > 0) {
name.setTo(location);
} else {
// last resort
name.setTo(UNKNOWN_LOCATION, -1);
}
}
return name;
}
// ------------------------------------------------------------------
// Zone offset format and parse
UnicodeString&
TimeZoneFormat::formatOffsetISO8601Basic(int32_t offset, UBool useUtcIndicator, UBool isShort, UBool ignoreSeconds,
UnicodeString& result, UErrorCode& status) const {
return formatOffsetISO8601(offset, TRUE, useUtcIndicator, isShort, ignoreSeconds, result, status);
}
UnicodeString&
TimeZoneFormat::formatOffsetISO8601Extended(int32_t offset, UBool useUtcIndicator, UBool isShort, UBool ignoreSeconds,
UnicodeString& result, UErrorCode& status) const {
return formatOffsetISO8601(offset, FALSE, useUtcIndicator, isShort, ignoreSeconds, result, status);
}
UnicodeString&
TimeZoneFormat::formatOffsetLocalizedGMT(int32_t offset, UnicodeString& result, UErrorCode& status) const {
return formatOffsetLocalizedGMT(offset, FALSE, result, status);
}
UnicodeString&
TimeZoneFormat::formatOffsetShortLocalizedGMT(int32_t offset, UnicodeString& result, UErrorCode& status) const {
return formatOffsetLocalizedGMT(offset, TRUE, result, status);
}
int32_t
TimeZoneFormat::parseOffsetISO8601(const UnicodeString& text, ParsePosition& pos) const {
return parseOffsetISO8601(text, pos, FALSE);
}
int32_t
TimeZoneFormat::parseOffsetLocalizedGMT(const UnicodeString& text, ParsePosition& pos) const {
return parseOffsetLocalizedGMT(text, pos, FALSE, NULL);
}
int32_t
TimeZoneFormat::parseOffsetShortLocalizedGMT(const UnicodeString& text, ParsePosition& pos) const {
return parseOffsetLocalizedGMT(text, pos, TRUE, NULL);
}
// ------------------------------------------------------------------
// Private zone offset format/parse implementation
UnicodeString&
TimeZoneFormat::formatOffsetISO8601(int32_t offset, UBool isBasic, UBool useUtcIndicator,
UBool isShort, UBool ignoreSeconds, UnicodeString& result, UErrorCode& status) const {
if (U_FAILURE(status)) {
result.setToBogus();
return result;
}
int32_t absOffset = offset < 0 ? -offset : offset;
if (useUtcIndicator && (absOffset < MILLIS_PER_SECOND || (ignoreSeconds && absOffset < MILLIS_PER_MINUTE))) {
result.setTo(ISO8601_UTC);
return result;
}
OffsetFields minFields = isShort ? FIELDS_H : FIELDS_HM;
OffsetFields maxFields = ignoreSeconds ? FIELDS_HM : FIELDS_HMS;
UChar sep = isBasic ? 0 : ISO8601_SEP;
// Note: FIELDS_HMS as maxFields is a CLDR/ICU extension. ISO 8601 specification does
// not support seconds field.
if (absOffset >= MAX_OFFSET) {
result.setToBogus();
status = U_ILLEGAL_ARGUMENT_ERROR;
return result;
}
int fields[3];
fields[0] = absOffset / MILLIS_PER_HOUR;
absOffset = absOffset % MILLIS_PER_HOUR;
fields[1] = absOffset / MILLIS_PER_MINUTE;
absOffset = absOffset % MILLIS_PER_MINUTE;
fields[2] = absOffset / MILLIS_PER_SECOND;
U_ASSERT(fields[0] >= 0 && fields[0] <= MAX_OFFSET_HOUR);
U_ASSERT(fields[1] >= 0 && fields[1] <= MAX_OFFSET_MINUTE);
U_ASSERT(fields[2] >= 0 && fields[2] <= MAX_OFFSET_SECOND);
int32_t lastIdx = maxFields;
while (lastIdx > minFields) {
if (fields[lastIdx] != 0) {
break;
}
lastIdx--;
}
UChar sign = PLUS;
if (offset < 0) {
// if all output fields are 0s, do not use negative sign
for (int32_t idx = 0; idx <= lastIdx; idx++) {
if (fields[idx] != 0) {
sign = MINUS;
break;
}
}
}
result.setTo(sign);
for (int32_t idx = 0; idx <= lastIdx; idx++) {
if (sep && idx != 0) {
result.append(sep);
}
result.append((UChar)(0x0030 + fields[idx]/10));
result.append((UChar)(0x0030 + fields[idx]%10));
}
return result;
}
UnicodeString&
TimeZoneFormat::formatOffsetLocalizedGMT(int32_t offset, UBool isShort, UnicodeString& result, UErrorCode& status) const {
if (U_FAILURE(status)) {
result.setToBogus();
return result;
}
if (offset <= -MAX_OFFSET || offset >= MAX_OFFSET) {
result.setToBogus();
status = U_ILLEGAL_ARGUMENT_ERROR;
return result;
}
if (offset == 0) {
result.setTo(fGMTZeroFormat);
return result;
}
UBool positive = TRUE;
if (offset < 0) {
offset = -offset;
positive = FALSE;
}
int32_t offsetH = offset / MILLIS_PER_HOUR;
offset = offset % MILLIS_PER_HOUR;
int32_t offsetM = offset / MILLIS_PER_MINUTE;
offset = offset % MILLIS_PER_MINUTE;
int32_t offsetS = offset / MILLIS_PER_SECOND;
U_ASSERT(offsetH <= MAX_OFFSET_HOUR && offsetM <= MAX_OFFSET_MINUTE && offsetS <= MAX_OFFSET_SECOND);
const UVector* offsetPatternItems = NULL;
if (positive) {
if (offsetS != 0) {
offsetPatternItems = fGMTOffsetPatternItems[UTZFMT_PAT_POSITIVE_HMS];
} else if (offsetM != 0 || !isShort) {
offsetPatternItems = fGMTOffsetPatternItems[UTZFMT_PAT_POSITIVE_HM];
} else {
offsetPatternItems = fGMTOffsetPatternItems[UTZFMT_PAT_POSITIVE_H];
}
} else {
if (offsetS != 0) {
offsetPatternItems = fGMTOffsetPatternItems[UTZFMT_PAT_NEGATIVE_HMS];
} else if (offsetM != 0 || !isShort) {
offsetPatternItems = fGMTOffsetPatternItems[UTZFMT_PAT_NEGATIVE_HM];
} else {
offsetPatternItems = fGMTOffsetPatternItems[UTZFMT_PAT_NEGATIVE_H];
}
}
U_ASSERT(offsetPatternItems != NULL);
// Building the GMT format string
result.setTo(fGMTPatternPrefix);
for (int32_t i = 0; i < offsetPatternItems->size(); i++) {
const GMTOffsetField* item = (GMTOffsetField*)offsetPatternItems->elementAt(i);
GMTOffsetField::FieldType type = item->getType();
switch (type) {
case GMTOffsetField::TEXT:
result.append(item->getPatternText(), -1);
break;
case GMTOffsetField::HOUR:
appendOffsetDigits(result, offsetH, (isShort ? 1 : 2));
break;
case GMTOffsetField::MINUTE:
appendOffsetDigits(result, offsetM, 2);
break;
case GMTOffsetField::SECOND:
appendOffsetDigits(result, offsetS, 2);
break;
}
}
result.append(fGMTPatternSuffix);
return result;
}
int32_t
TimeZoneFormat::parseOffsetISO8601(const UnicodeString& text, ParsePosition& pos, UBool extendedOnly, UBool* hasDigitOffset /* = NULL */) const {
if (hasDigitOffset) {
*hasDigitOffset = FALSE;
}
int32_t start = pos.getIndex();
if (start >= text.length()) {
pos.setErrorIndex(start);
return 0;
}
UChar firstChar = text.charAt(start);
if (firstChar == ISO8601_UTC || firstChar == (UChar)(ISO8601_UTC + 0x20)) {
// "Z" (or "z") - indicates UTC
pos.setIndex(start + 1);
return 0;
}
int32_t sign = 1;
if (firstChar == PLUS) {
sign = 1;
} else if (firstChar == MINUS) {
sign = -1;
} else {
// Not an ISO 8601 offset string
pos.setErrorIndex(start);
return 0;
}
ParsePosition posOffset(start + 1);
int32_t offset = parseAsciiOffsetFields(text, posOffset, ISO8601_SEP, FIELDS_H, FIELDS_HMS);
if (posOffset.getErrorIndex() == -1 && !extendedOnly && (posOffset.getIndex() - start <= 3)) {
// If the text is successfully parsed as extended format with the options above, it can be also parsed
// as basic format. For example, "0230" can be parsed as offset 2:00 (only first digits are valid for
// extended format), but it can be parsed as offset 2:30 with basic format. We use longer result.
ParsePosition posBasic(start + 1);
int32_t tmpOffset = parseAbuttingAsciiOffsetFields(text, posBasic, FIELDS_H, FIELDS_HMS, FALSE);
if (posBasic.getErrorIndex() == -1 && posBasic.getIndex() > posOffset.getIndex()) {
offset = tmpOffset;
posOffset.setIndex(posBasic.getIndex());
}
}
if (posOffset.getErrorIndex() != -1) {
pos.setErrorIndex(start);
return 0;
}
pos.setIndex(posOffset.getIndex());
if (hasDigitOffset) {
*hasDigitOffset = TRUE;
}
return sign * offset;
}
int32_t
TimeZoneFormat::parseOffsetLocalizedGMT(const UnicodeString& text, ParsePosition& pos, UBool isShort, UBool* hasDigitOffset) const {
int32_t start = pos.getIndex();
int32_t offset = 0;
int32_t parsedLength = 0;
if (hasDigitOffset) {
*hasDigitOffset = FALSE;
}
offset = parseOffsetLocalizedGMTPattern(text, start, isShort, parsedLength);
// For now, parseOffsetLocalizedGMTPattern handles both long and short
// formats, no matter isShort is true or false. This might be changed in future
// when strict parsing is necessary, or different set of patterns are used for
// short/long formats.
#if 0
if (parsedLength == 0) {
offset = parseOffsetLocalizedGMTPattern(text, start, !isShort, parsedLength);
}
#endif
if (parsedLength > 0) {
if (hasDigitOffset) {
*hasDigitOffset = TRUE;
}
pos.setIndex(start + parsedLength);
return offset;
}
// Try the default patterns
offset = parseOffsetDefaultLocalizedGMT(text, start, parsedLength);
if (parsedLength > 0) {
if (hasDigitOffset) {
*hasDigitOffset = TRUE;
}
pos.setIndex(start + parsedLength);
return offset;
}
// Check if this is a GMT zero format
if (text.caseCompare(start, fGMTZeroFormat.length(), fGMTZeroFormat, 0) == 0) {
pos.setIndex(start + fGMTZeroFormat.length());
return 0;
}
// Check if this is a default GMT zero format
for (int32_t i = 0; ALT_GMT_STRINGS[i][0] != 0; i++) {
const UChar* defGMTZero = ALT_GMT_STRINGS[i];
int32_t defGMTZeroLen = u_strlen(defGMTZero);
if (text.caseCompare(start, defGMTZeroLen, defGMTZero, 0) == 0) {
pos.setIndex(start + defGMTZeroLen);
return 0;
}
}
// Nothing matched
pos.setErrorIndex(start);
return 0;
}
int32_t
TimeZoneFormat::parseOffsetLocalizedGMTPattern(const UnicodeString& text, int32_t start, UBool /*isShort*/, int32_t& parsedLen) const {
int32_t idx = start;
int32_t offset = 0;
UBool parsed = FALSE;
do {
// Prefix part
int32_t len = fGMTPatternPrefix.length();
if (len > 0 && text.caseCompare(idx, len, fGMTPatternPrefix, 0) != 0) {
// prefix match failed
break;
}
idx += len;
// Offset part
offset = parseOffsetFields(text, idx, FALSE, len);
if (len == 0) {
// offset field match failed
break;
}
idx += len;
len = fGMTPatternSuffix.length();
if (len > 0 && text.caseCompare(idx, len, fGMTPatternSuffix, 0) != 0) {
// no suffix match
break;
}
idx += len;
parsed = TRUE;
} while (FALSE);
parsedLen = parsed ? idx - start : 0;
return offset;
}
int32_t
TimeZoneFormat::parseOffsetFields(const UnicodeString& text, int32_t start, UBool /*isShort*/, int32_t& parsedLen) const {
int32_t outLen = 0;
int32_t offset = 0;
int32_t sign = 1;
parsedLen = 0;
int32_t offsetH, offsetM, offsetS;
offsetH = offsetM = offsetS = 0;
for (int32_t patidx = 0; PARSE_GMT_OFFSET_TYPES[patidx] >= 0; patidx++) {
int32_t gmtPatType = PARSE_GMT_OFFSET_TYPES[patidx];
UVector* items = fGMTOffsetPatternItems[gmtPatType];
U_ASSERT(items != NULL);
outLen = parseOffsetFieldsWithPattern(text, start, items, FALSE, offsetH, offsetM, offsetS);
if (outLen > 0) {
sign = (gmtPatType == UTZFMT_PAT_POSITIVE_H || gmtPatType == UTZFMT_PAT_POSITIVE_HM || gmtPatType == UTZFMT_PAT_POSITIVE_HMS) ?
1 : -1;
break;
}
}
if (outLen > 0 && fAbuttingOffsetHoursAndMinutes) {
// When hours field is sabutting minutes field,
// the parse result above may not be appropriate.
// For example, "01020" is parsed as 01:02: above,
// but it should be parsed as 00:10:20.
int32_t tmpLen = 0;
int32_t tmpSign = 1;
int32_t tmpH, tmpM, tmpS;
for (int32_t patidx = 0; PARSE_GMT_OFFSET_TYPES[patidx] >= 0; patidx++) {
int32_t gmtPatType = PARSE_GMT_OFFSET_TYPES[patidx];
UVector* items = fGMTOffsetPatternItems[gmtPatType];
U_ASSERT(items != NULL);
// forcing parse to use single hour digit
tmpLen = parseOffsetFieldsWithPattern(text, start, items, TRUE, tmpH, tmpM, tmpS);
if (tmpLen > 0) {
tmpSign = (gmtPatType == UTZFMT_PAT_POSITIVE_H || gmtPatType == UTZFMT_PAT_POSITIVE_HM || gmtPatType == UTZFMT_PAT_POSITIVE_HMS) ?
1 : -1;
break;
}
}
if (tmpLen > outLen) {
// Better parse result with single hour digit
outLen = tmpLen;
sign = tmpSign;
offsetH = tmpH;
offsetM = tmpM;
offsetS = tmpS;
}
}
if (outLen > 0) {
offset = ((((offsetH * 60) + offsetM) * 60) + offsetS) * 1000 * sign;
parsedLen = outLen;
}
return offset;
}
int32_t
TimeZoneFormat::parseOffsetFieldsWithPattern(const UnicodeString& text, int32_t start,
UVector* patternItems, UBool forceSingleHourDigit, int32_t& hour, int32_t& min, int32_t& sec) const {
UBool failed = FALSE;
int32_t offsetH, offsetM, offsetS;
offsetH = offsetM = offsetS = 0;
int32_t idx = start;
for (int32_t i = 0; i < patternItems->size(); i++) {
int32_t len = 0;
const GMTOffsetField* field = (const GMTOffsetField*)patternItems->elementAt(i);
GMTOffsetField::FieldType fieldType = field->getType();
if (fieldType == GMTOffsetField::TEXT) {
const UChar* patStr = field->getPatternText();
len = u_strlen(patStr);
if (text.caseCompare(idx, len, patStr, 0) != 0) {
failed = TRUE;
break;
}
idx += len;
} else {
if (fieldType == GMTOffsetField::HOUR) {
uint8_t maxDigits = forceSingleHourDigit ? 1 : 2;
offsetH = parseOffsetFieldWithLocalizedDigits(text, idx, 1, maxDigits, 0, MAX_OFFSET_HOUR, len);
} else if (fieldType == GMTOffsetField::MINUTE) {
offsetM = parseOffsetFieldWithLocalizedDigits(text, idx, 2, 2, 0, MAX_OFFSET_MINUTE, len);
} else if (fieldType == GMTOffsetField::SECOND) {
offsetS = parseOffsetFieldWithLocalizedDigits(text, idx, 2, 2, 0, MAX_OFFSET_SECOND, len);
}
if (len == 0) {
failed = TRUE;
break;
}
idx += len;
}
}
if (failed) {
hour = min = sec = 0;
return 0;
}
hour = offsetH;
min = offsetM;
sec = offsetS;
return idx - start;
}
int32_t
TimeZoneFormat::parseAbuttingOffsetFields(const UnicodeString& text, int32_t start, int32_t& parsedLen) const {
int32_t digits[MAX_OFFSET_DIGITS];
int32_t parsed[MAX_OFFSET_DIGITS]; // accumulative offsets
// Parse digits into int[]
int32_t idx = start;
int32_t len = 0;
int32_t numDigits = 0;
for (int32_t i = 0; i < MAX_OFFSET_DIGITS; i++) {
digits[i] = parseSingleLocalizedDigit(text, idx, len);
if (digits[i] < 0) {
break;
}
idx += len;
parsed[i] = idx - start;
numDigits++;
}
if (numDigits == 0) {
parsedLen = 0;
return 0;
}
int32_t offset = 0;
while (numDigits > 0) {
int32_t hour = 0;
int32_t min = 0;
int32_t sec = 0;
U_ASSERT(numDigits > 0 && numDigits <= MAX_OFFSET_DIGITS);
switch (numDigits) {
case 1: // H
hour = digits[0];
break;
case 2: // HH
hour = digits[0] * 10 + digits[1];
break;
case 3: // Hmm
hour = digits[0];
min = digits[1] * 10 + digits[2];
break;
case 4: // HHmm
hour = digits[0] * 10 + digits[1];
min = digits[2] * 10 + digits[3];
break;
case 5: // Hmmss
hour = digits[0];
min = digits[1] * 10 + digits[2];
sec = digits[3] * 10 + digits[4];
break;
case 6: // HHmmss
hour = digits[0] * 10 + digits[1];
min = digits[2] * 10 + digits[3];
sec = digits[4] * 10 + digits[5];
break;
}
if (hour <= MAX_OFFSET_HOUR && min <= MAX_OFFSET_MINUTE && sec <= MAX_OFFSET_SECOND) {
// found a valid combination
offset = hour * MILLIS_PER_HOUR + min * MILLIS_PER_MINUTE + sec * MILLIS_PER_SECOND;
parsedLen = parsed[numDigits - 1];
break;
}
numDigits--;
}
return offset;
}
int32_t
TimeZoneFormat::parseOffsetDefaultLocalizedGMT(const UnicodeString& text, int start, int32_t& parsedLen) const {
int32_t idx = start;
int32_t offset = 0;
int32_t parsed = 0;
do {
// check global default GMT alternatives
int32_t gmtLen = 0;
for (int32_t i = 0; ALT_GMT_STRINGS[i][0] != 0; i++) {
const UChar* gmt = ALT_GMT_STRINGS[i];
int32_t len = u_strlen(gmt);
if (text.caseCompare(start, len, gmt, 0) == 0) {
gmtLen = len;
break;
}
}
if (gmtLen == 0) {
break;
}
idx += gmtLen;
// offset needs a sign char and a digit at minimum
if (idx + 1 >= text.length()) {
break;
}
// parse sign
int32_t sign = 1;
UChar c = text.charAt(idx);
if (c == PLUS) {
sign = 1;
} else if (c == MINUS) {
sign = -1;
} else {
break;
}
idx++;
// offset part
// try the default pattern with the separator first
int32_t lenWithSep = 0;
int32_t offsetWithSep = parseDefaultOffsetFields(text, idx, DEFAULT_GMT_OFFSET_SEP, lenWithSep);
if (lenWithSep == text.length() - idx) {
// maximum match
offset = offsetWithSep * sign;
idx += lenWithSep;
} else {
// try abutting field pattern
int32_t lenAbut = 0;
int32_t offsetAbut = parseAbuttingOffsetFields(text, idx, lenAbut);
if (lenWithSep > lenAbut) {
offset = offsetWithSep * sign;
idx += lenWithSep;
} else {
offset = offsetAbut * sign;
idx += lenAbut;
}
}
parsed = idx - start;
} while (false);
parsedLen = parsed;
return offset;
}
int32_t
TimeZoneFormat::parseDefaultOffsetFields(const UnicodeString& text, int32_t start, UChar separator, int32_t& parsedLen) const {
int32_t max = text.length();
int32_t idx = start;
int32_t len = 0;
int32_t hour = 0, min = 0, sec = 0;
parsedLen = 0;
do {
hour = parseOffsetFieldWithLocalizedDigits(text, idx, 1, 2, 0, MAX_OFFSET_HOUR, len);
if (len == 0) {
break;
}
idx += len;
if (idx + 1 < max && text.charAt(idx) == separator) {
min = parseOffsetFieldWithLocalizedDigits(text, idx + 1, 2, 2, 0, MAX_OFFSET_MINUTE, len);
if (len == 0) {
break;
}
idx += (1 + len);
if (idx + 1 < max && text.charAt(idx) == separator) {
sec = parseOffsetFieldWithLocalizedDigits(text, idx + 1, 2, 2, 0, MAX_OFFSET_SECOND, len);
if (len == 0) {
break;
}
idx += (1 + len);
}
}
} while (FALSE);
if (idx == start) {
return 0;
}
parsedLen = idx - start;
return hour * MILLIS_PER_HOUR + min * MILLIS_PER_MINUTE + sec * MILLIS_PER_SECOND;
}
int32_t
TimeZoneFormat::parseOffsetFieldWithLocalizedDigits(const UnicodeString& text, int32_t start, uint8_t minDigits, uint8_t maxDigits, uint16_t minVal, uint16_t maxVal, int32_t& parsedLen) const {
parsedLen = 0;
int32_t decVal = 0;
int32_t numDigits = 0;
int32_t idx = start;
int32_t digitLen = 0;
while (idx < text.length() && numDigits < maxDigits) {
int32_t digit = parseSingleLocalizedDigit(text, idx, digitLen);
if (digit < 0) {
break;
}
int32_t tmpVal = decVal * 10 + digit;
if (tmpVal > maxVal) {
break;
}
decVal = tmpVal;
numDigits++;
idx += digitLen;
}
// Note: maxVal is checked in the while loop
if (numDigits < minDigits || decVal < minVal) {
decVal = -1;
numDigits = 0;
} else {
parsedLen = idx - start;
}
return decVal;
}
int32_t
TimeZoneFormat::parseSingleLocalizedDigit(const UnicodeString& text, int32_t start, int32_t& len) const {
int32_t digit = -1;
len = 0;
if (start < text.length()) {
UChar32 cp = text.char32At(start);
// First, try digits configured for this instance
for (int32_t i = 0; i < 10; i++) {
if (cp == fGMTOffsetDigits[i]) {
digit = i;
break;
}
}
// If failed, check if this is a Unicode digit
if (digit < 0) {
int32_t tmp = u_charDigitValue(cp);
digit = (tmp >= 0 && tmp <= 9) ? tmp : -1;
}
if (digit >= 0) {
int32_t next = text.moveIndex32(start, 1);
len = next - start;
}
}
return digit;
}
UnicodeString&
TimeZoneFormat::formatOffsetWithAsciiDigits(int32_t offset, UChar sep, OffsetFields minFields, OffsetFields maxFields, UnicodeString& result) {
U_ASSERT(maxFields >= minFields);
U_ASSERT(offset > -MAX_OFFSET && offset < MAX_OFFSET);
UChar sign = PLUS;
if (offset < 0) {
sign = MINUS;
offset = -offset;
}
result.setTo(sign);
int fields[3];
fields[0] = offset / MILLIS_PER_HOUR;
offset = offset % MILLIS_PER_HOUR;
fields[1] = offset / MILLIS_PER_MINUTE;
offset = offset % MILLIS_PER_MINUTE;
fields[2] = offset / MILLIS_PER_SECOND;
U_ASSERT(fields[0] >= 0 && fields[0] <= MAX_OFFSET_HOUR);
U_ASSERT(fields[1] >= 0 && fields[1] <= MAX_OFFSET_MINUTE);
U_ASSERT(fields[2] >= 0 && fields[2] <= MAX_OFFSET_SECOND);
int32_t lastIdx = maxFields;
while (lastIdx > minFields) {
if (fields[lastIdx] != 0) {
break;
}
lastIdx--;
}
for (int32_t idx = 0; idx <= lastIdx; idx++) {
if (sep && idx != 0) {
result.append(sep);
}
result.append((UChar)(0x0030 + fields[idx]/10));
result.append((UChar)(0x0030 + fields[idx]%10));
}
return result;
}
int32_t
TimeZoneFormat::parseAbuttingAsciiOffsetFields(const UnicodeString& text, ParsePosition& pos, OffsetFields minFields, OffsetFields maxFields, UBool fixedHourWidth) {
int32_t start = pos.getIndex();
int32_t minDigits = 2 * (minFields + 1) - (fixedHourWidth ? 0 : 1);
int32_t maxDigits = 2 * (maxFields + 1);
U_ASSERT(maxDigits <= MAX_OFFSET_DIGITS);
int32_t digits[MAX_OFFSET_DIGITS] = {};
int32_t numDigits = 0;
int32_t idx = start;
while (numDigits < maxDigits && idx < text.length()) {
UChar uch = text.charAt(idx);
int32_t digit = DIGIT_VAL(uch);
if (digit < 0) {
break;
}
digits[numDigits] = digit;
numDigits++;
idx++;
}
if (fixedHourWidth && (numDigits & 1)) {
// Fixed digits, so the number of digits must be even number. Truncating.
numDigits--;
}
if (numDigits < minDigits) {
pos.setErrorIndex(start);
return 0;
}
int32_t hour = 0, min = 0, sec = 0;
UBool bParsed = FALSE;
while (numDigits >= minDigits) {
switch (numDigits) {
case 1: //H
hour = digits[0];
break;
case 2: //HH
hour = digits[0] * 10 + digits[1];
break;
case 3: //Hmm
hour = digits[0];
min = digits[1] * 10 + digits[2];
break;
case 4: //HHmm
hour = digits[0] * 10 + digits[1];
min = digits[2] * 10 + digits[3];
break;
case 5: //Hmmss
hour = digits[0];
min = digits[1] * 10 + digits[2];
sec = digits[3] * 10 + digits[4];
break;
case 6: //HHmmss
hour = digits[0] * 10 + digits[1];
min = digits[2] * 10 + digits[3];
sec = digits[4] * 10 + digits[5];
break;
}
if (hour <= MAX_OFFSET_HOUR && min <= MAX_OFFSET_MINUTE && sec <= MAX_OFFSET_SECOND) {
// Successfully parsed
bParsed = true;
break;
}
// Truncating
numDigits -= (fixedHourWidth ? 2 : 1);
hour = min = sec = 0;
}
if (!bParsed) {
pos.setErrorIndex(start);
return 0;
}
pos.setIndex(start + numDigits);
return ((((hour * 60) + min) * 60) + sec) * 1000;
}
int32_t
TimeZoneFormat::parseAsciiOffsetFields(const UnicodeString& text, ParsePosition& pos, UChar sep, OffsetFields minFields, OffsetFields maxFields) {
int32_t start = pos.getIndex();
int32_t fieldVal[] = {0, 0, 0};
int32_t fieldLen[] = {0, -1, -1};
for (int32_t idx = start, fieldIdx = 0; idx < text.length() && fieldIdx <= maxFields; idx++) {
UChar c = text.charAt(idx);
if (c == sep) {
if (fieldIdx == 0) {
if (fieldLen[0] == 0) {
// no hours field
break;
}
// 1 digit hour, move to next field
} else {
if (fieldLen[fieldIdx] != -1) {
// premature minute or seconds field
break;
}
fieldLen[fieldIdx] = 0;
}
continue;
} else if (fieldLen[fieldIdx] == -1) {
// no separator after 2 digit field
break;
}
int32_t digit = DIGIT_VAL(c);
if (digit < 0) {
// not a digit
break;
}
fieldVal[fieldIdx] = fieldVal[fieldIdx] * 10 + digit;
fieldLen[fieldIdx]++;
if (fieldLen[fieldIdx] >= 2) {
// parsed 2 digits, move to next field
fieldIdx++;
}
}
int32_t offset = 0;
int32_t parsedLen = 0;
int32_t parsedFields = -1;
do {
// hour
if (fieldLen[0] == 0) {
break;
}
if (fieldVal[0] > MAX_OFFSET_HOUR) {
offset = (fieldVal[0] / 10) * MILLIS_PER_HOUR;
parsedFields = FIELDS_H;
parsedLen = 1;
break;
}
offset = fieldVal[0] * MILLIS_PER_HOUR;
parsedLen = fieldLen[0];
parsedFields = FIELDS_H;
// minute
if (fieldLen[1] != 2 || fieldVal[1] > MAX_OFFSET_MINUTE) {
break;
}
offset += fieldVal[1] * MILLIS_PER_MINUTE;
parsedLen += (1 + fieldLen[1]);
parsedFields = FIELDS_HM;
// second
if (fieldLen[2] != 2 || fieldVal[2] > MAX_OFFSET_SECOND) {
break;
}
offset += fieldVal[2] * MILLIS_PER_SECOND;
parsedLen += (1 + fieldLen[2]);
parsedFields = FIELDS_HMS;
} while (false);
if (parsedFields < minFields) {
pos.setErrorIndex(start);
return 0;
}
pos.setIndex(start + parsedLen);
return offset;
}
void
TimeZoneFormat::appendOffsetDigits(UnicodeString& buf, int32_t n, uint8_t minDigits) const {
U_ASSERT(n >= 0 && n < 60);
int32_t numDigits = n >= 10 ? 2 : 1;
for (int32_t i = 0; i < minDigits - numDigits; i++) {
buf.append(fGMTOffsetDigits[0]);
}
if (numDigits == 2) {
buf.append(fGMTOffsetDigits[n / 10]);
}
buf.append(fGMTOffsetDigits[n % 10]);
}
// ------------------------------------------------------------------
// Private misc
void
TimeZoneFormat::initGMTPattern(const UnicodeString& gmtPattern, UErrorCode& status) {
if (U_FAILURE(status)) {
return;
}
// This implementation not perfect, but sufficient practically.
int32_t idx = gmtPattern.indexOf(ARG0, ARG0_LEN, 0);
if (idx < 0) {
status = U_ILLEGAL_ARGUMENT_ERROR;
return;
}
fGMTPattern.setTo(gmtPattern);
unquote(gmtPattern.tempSubString(0, idx), fGMTPatternPrefix);
unquote(gmtPattern.tempSubString(idx + ARG0_LEN), fGMTPatternSuffix);
}
UnicodeString&
TimeZoneFormat::unquote(const UnicodeString& pattern, UnicodeString& result) {
if (pattern.indexOf(SINGLEQUOTE) < 0) {
result.setTo(pattern);
return result;
}
result.remove();
UBool isPrevQuote = FALSE;
UBool inQuote = FALSE;
for (int32_t i = 0; i < pattern.length(); i++) {
UChar c = pattern.charAt(i);
if (c == SINGLEQUOTE) {
if (isPrevQuote) {
result.append(c);
isPrevQuote = FALSE;
} else {
isPrevQuote = TRUE;
}
inQuote = !inQuote;
} else {
isPrevQuote = FALSE;
result.append(c);
}
}
return result;
}
UVector*
TimeZoneFormat::parseOffsetPattern(const UnicodeString& pattern, OffsetFields required, UErrorCode& status) {
if (U_FAILURE(status)) {
return NULL;
}
UVector* result = new UVector(deleteGMTOffsetField, NULL, status);
if (result == NULL) {
status = U_MEMORY_ALLOCATION_ERROR;
return NULL;
}
int32_t checkBits = 0;
UBool isPrevQuote = FALSE;
UBool inQuote = FALSE;
UChar textBuf[32];
UnicodeString text(textBuf, 0, UPRV_LENGTHOF(textBuf));
GMTOffsetField::FieldType itemType = GMTOffsetField::TEXT;
int32_t itemLength = 1;
for (int32_t i = 0; i < pattern.length(); i++) {
UChar ch = pattern.charAt(i);
if (ch == SINGLEQUOTE) {
if (isPrevQuote) {
text.append(SINGLEQUOTE);
isPrevQuote = FALSE;
} else {
isPrevQuote = TRUE;
if (itemType != GMTOffsetField::TEXT) {
if (GMTOffsetField::isValid(itemType, itemLength)) {
GMTOffsetField* fld = GMTOffsetField::createTimeField(itemType, (uint8_t)itemLength, status);
result->addElement(fld, status);
if (U_FAILURE(status)) {
break;
}
} else {
status = U_ILLEGAL_ARGUMENT_ERROR;
break;
}
itemType = GMTOffsetField::TEXT;
}
}
inQuote = !inQuote;
} else {
isPrevQuote = FALSE;
if (inQuote) {
text.append(ch);
} else {
GMTOffsetField::FieldType tmpType = GMTOffsetField::getTypeByLetter(ch);
if (tmpType != GMTOffsetField::TEXT) {
// an offset time pattern character
if (tmpType == itemType) {
itemLength++;
} else {
if (itemType == GMTOffsetField::TEXT) {
if (text.length() > 0) {
GMTOffsetField* textfld = GMTOffsetField::createText(text, status);
result->addElement(textfld, status);
if (U_FAILURE(status)) {
break;
}
text.remove();
}
} else {
if (GMTOffsetField::isValid(itemType, itemLength)) {
GMTOffsetField* fld = GMTOffsetField::createTimeField(itemType, itemLength, status);
result->addElement(fld, status);
if (U_FAILURE(status)) {
break;
}
} else {
status = U_ILLEGAL_ARGUMENT_ERROR;
break;
}
}
itemType = tmpType;
itemLength = 1;
checkBits |= tmpType;
}
} else {
// a string literal
if (itemType != GMTOffsetField::TEXT) {
if (GMTOffsetField::isValid(itemType, itemLength)) {
GMTOffsetField* fld = GMTOffsetField::createTimeField(itemType, itemLength, status);
result->addElement(fld, status);
if (U_FAILURE(status)) {
break;
}
} else {
status = U_ILLEGAL_ARGUMENT_ERROR;
break;
}
itemType = GMTOffsetField::TEXT;
}
text.append(ch);
}
}
}
}
// handle last item
if (U_SUCCESS(status)) {
if (itemType == GMTOffsetField::TEXT) {
if (text.length() > 0) {
GMTOffsetField* tfld = GMTOffsetField::createText(text, status);
result->addElement(tfld, status);
}
} else {
if (GMTOffsetField::isValid(itemType, itemLength)) {
GMTOffsetField* fld = GMTOffsetField::createTimeField(itemType, itemLength, status);
result->addElement(fld, status);
} else {
status = U_ILLEGAL_ARGUMENT_ERROR;
}
}
// Check all required fields are set
if (U_SUCCESS(status)) {
int32_t reqBits = 0;
switch (required) {
case FIELDS_H:
reqBits = GMTOffsetField::HOUR;
break;
case FIELDS_HM:
reqBits = GMTOffsetField::HOUR | GMTOffsetField::MINUTE;
break;
case FIELDS_HMS:
reqBits = GMTOffsetField::HOUR | GMTOffsetField::MINUTE | GMTOffsetField::SECOND;
break;
}
if (checkBits == reqBits) {
// all required fields are set, no extra fields
return result;
}
}
}
// error
delete result;
return NULL;
}
UnicodeString&
TimeZoneFormat::expandOffsetPattern(const UnicodeString& offsetHM, UnicodeString& result, UErrorCode& status) {
result.setToBogus();
if (U_FAILURE(status)) {
return result;
}
U_ASSERT(u_strlen(DEFAULT_GMT_OFFSET_MINUTE_PATTERN) == 2);
int32_t idx_mm = offsetHM.indexOf(DEFAULT_GMT_OFFSET_MINUTE_PATTERN, 2, 0);
if (idx_mm < 0) {
// Bad time zone hour pattern data
status = U_ILLEGAL_ARGUMENT_ERROR;
return result;
}
UnicodeString sep;
2012-11-02 19:41:57 +00:00
int32_t idx_H = offsetHM.tempSubString(0, idx_mm).lastIndexOf((UChar)0x0048 /* H */);
if (idx_H >= 0) {
sep = offsetHM.tempSubString(idx_H + 1, idx_mm - (idx_H + 1));
}
result.setTo(offsetHM.tempSubString(0, idx_mm + 2));
result.append(sep);
result.append(DEFAULT_GMT_OFFSET_SECOND_PATTERN, -1);
result.append(offsetHM.tempSubString(idx_mm + 2));
return result;
}
UnicodeString&
TimeZoneFormat::truncateOffsetPattern(const UnicodeString& offsetHM, UnicodeString& result, UErrorCode& status) {
result.setToBogus();
if (U_FAILURE(status)) {
return result;
}
U_ASSERT(u_strlen(DEFAULT_GMT_OFFSET_MINUTE_PATTERN) == 2);
int32_t idx_mm = offsetHM.indexOf(DEFAULT_GMT_OFFSET_MINUTE_PATTERN, 2, 0);
if (idx_mm < 0) {
// Bad time zone hour pattern data
status = U_ILLEGAL_ARGUMENT_ERROR;
return result;
}
UChar HH[] = {0x0048, 0x0048};
int32_t idx_HH = offsetHM.tempSubString(0, idx_mm).lastIndexOf(HH, 2, 0);
if (idx_HH >= 0) {
return result.setTo(offsetHM.tempSubString(0, idx_HH + 2));
}
int32_t idx_H = offsetHM.tempSubString(0, idx_mm).lastIndexOf((UChar)0x0048, 0);
if (idx_H >= 0) {
return result.setTo(offsetHM.tempSubString(0, idx_H + 1));
}
// Bad time zone hour pattern data
status = U_ILLEGAL_ARGUMENT_ERROR;
return result;
}
void
TimeZoneFormat::initGMTOffsetPatterns(UErrorCode& status) {
for (int32_t type = 0; type < UTZFMT_PAT_COUNT; type++) {
switch (type) {
case UTZFMT_PAT_POSITIVE_H:
case UTZFMT_PAT_NEGATIVE_H:
fGMTOffsetPatternItems[type] = parseOffsetPattern(fGMTOffsetPatterns[type], FIELDS_H, status);
break;
case UTZFMT_PAT_POSITIVE_HM:
case UTZFMT_PAT_NEGATIVE_HM:
fGMTOffsetPatternItems[type] = parseOffsetPattern(fGMTOffsetPatterns[type], FIELDS_HM, status);
break;
case UTZFMT_PAT_POSITIVE_HMS:
case UTZFMT_PAT_NEGATIVE_HMS:
fGMTOffsetPatternItems[type] = parseOffsetPattern(fGMTOffsetPatterns[type], FIELDS_HMS, status);
break;
}
}
checkAbuttingHoursAndMinutes();
}
void
TimeZoneFormat::checkAbuttingHoursAndMinutes() {
fAbuttingOffsetHoursAndMinutes= FALSE;
for (int32_t type = 0; type < UTZFMT_PAT_COUNT; type++) {
UBool afterH = FALSE;
UVector *items = fGMTOffsetPatternItems[type];
for (int32_t i = 0; i < items->size(); i++) {
const GMTOffsetField* item = (GMTOffsetField*)items->elementAt(i);
GMTOffsetField::FieldType type = item->getType();
if (type != GMTOffsetField::TEXT) {
if (afterH) {
fAbuttingOffsetHoursAndMinutes = TRUE;
break;
} else if (type == GMTOffsetField::HOUR) {
afterH = TRUE;
}
} else if (afterH) {
break;
}
}
if (fAbuttingOffsetHoursAndMinutes) {
break;
}
}
}
UBool
TimeZoneFormat::toCodePoints(const UnicodeString& str, UChar32* codeArray, int32_t size) {
int32_t count = str.countChar32();
if (count != size) {
return FALSE;
}
for (int32_t idx = 0, start = 0; idx < size; idx++) {
codeArray[idx] = str.char32At(start);
start = str.moveIndex32(start, 1);
}
return TRUE;
}
TimeZone*
TimeZoneFormat::createTimeZoneForOffset(int32_t offset) const {
if (offset == 0) {
// when offset is 0, we should use "Etc/GMT"
return TimeZone::createTimeZone(UnicodeString(TRUE, TZID_GMT, -1));
}
return ZoneMeta::createCustomTimeZone(offset);
}
UTimeZoneFormatTimeType
TimeZoneFormat::getTimeType(UTimeZoneNameType nameType) {
switch (nameType) {
case UTZNM_LONG_STANDARD:
case UTZNM_SHORT_STANDARD:
return UTZFMT_TIME_TYPE_STANDARD;
case UTZNM_LONG_DAYLIGHT:
case UTZNM_SHORT_DAYLIGHT:
return UTZFMT_TIME_TYPE_DAYLIGHT;
default:
return UTZFMT_TIME_TYPE_UNKNOWN;
}
}
UnicodeString&
TimeZoneFormat::getTimeZoneID(const TimeZoneNames::MatchInfoCollection* matches, int32_t idx, UnicodeString& tzID) const {
if (!matches->getTimeZoneIDAt(idx, tzID)) {
UChar mzIDBuf[32];
UnicodeString mzID(mzIDBuf, 0, UPRV_LENGTHOF(mzIDBuf));
if (matches->getMetaZoneIDAt(idx, mzID)) {
fTimeZoneNames->getReferenceZoneID(mzID, fTargetRegion, tzID);
}
}
return tzID;
}
class ZoneIdMatchHandler : public TextTrieMapSearchResultHandler {
public:
ZoneIdMatchHandler();
virtual ~ZoneIdMatchHandler();
UBool handleMatch(int32_t matchLength, const CharacterNode *node, UErrorCode &status);
const UChar* getID();
int32_t getMatchLen();
private:
int32_t fLen;
const UChar* fID;
};
ZoneIdMatchHandler::ZoneIdMatchHandler()
: fLen(0), fID(NULL) {
}
ZoneIdMatchHandler::~ZoneIdMatchHandler() {
}
UBool
ZoneIdMatchHandler::handleMatch(int32_t matchLength, const CharacterNode *node, UErrorCode &status) {
if (U_FAILURE(status)) {
return FALSE;
}
if (node->hasValues()) {
const UChar* id = (const UChar*)node->getValue(0);
if (id != NULL) {
if (fLen < matchLength) {
fID = id;
fLen = matchLength;
}
}
}
return TRUE;
}
const UChar*
ZoneIdMatchHandler::getID() {
return fID;
}
int32_t
ZoneIdMatchHandler::getMatchLen() {
return fLen;
}
static void U_CALLCONV initZoneIdTrie(UErrorCode &status) {
U_ASSERT(gZoneIdTrie == NULL);
ucln_i18n_registerCleanup(UCLN_I18N_TIMEZONEFORMAT, tzfmt_cleanup);
gZoneIdTrie = new TextTrieMap(TRUE, NULL); // No deleter, because values are pooled by ZoneMeta
if (gZoneIdTrie == NULL) {
status = U_MEMORY_ALLOCATION_ERROR;
return;
}
StringEnumeration *tzenum = TimeZone::createEnumeration();
const UnicodeString *id;
while ((id = tzenum->snext(status))) {
const UChar* uid = ZoneMeta::findTimeZoneID(*id);
if (uid) {
gZoneIdTrie->put(uid, const_cast<UChar *>(uid), status);
}
}
delete tzenum;
}
UnicodeString&
TimeZoneFormat::parseZoneID(const UnicodeString& text, ParsePosition& pos, UnicodeString& tzID) const {
UErrorCode status = U_ZERO_ERROR;
umtx_initOnce(gZoneIdTrieInitOnce, &initZoneIdTrie, status);
int32_t start = pos.getIndex();
int32_t len = 0;
tzID.setToBogus();
if (U_SUCCESS(status)) {
LocalPointer<ZoneIdMatchHandler> handler(new ZoneIdMatchHandler());
gZoneIdTrie->search(text, start, handler.getAlias(), status);
len = handler->getMatchLen();
if (len > 0) {
tzID.setTo(handler->getID(), -1);
}
}
if (len > 0) {
pos.setIndex(start + len);
} else {
pos.setErrorIndex(start);
}
return tzID;
}
static void U_CALLCONV initShortZoneIdTrie(UErrorCode &status) {
U_ASSERT(gShortZoneIdTrie == NULL);
ucln_i18n_registerCleanup(UCLN_I18N_TIMEZONEFORMAT, tzfmt_cleanup);
StringEnumeration *tzenum = TimeZone::createTimeZoneIDEnumeration(UCAL_ZONE_TYPE_CANONICAL, NULL, NULL, status);
if (U_SUCCESS(status)) {
gShortZoneIdTrie = new TextTrieMap(TRUE, NULL); // No deleter, because values are pooled by ZoneMeta
if (gShortZoneIdTrie == NULL) {
status = U_MEMORY_ALLOCATION_ERROR;
} else {
const UnicodeString *id;
while ((id = tzenum->snext(status))) {
const UChar* uID = ZoneMeta::findTimeZoneID(*id);
const UChar* shortID = ZoneMeta::getShortID(*id);
if (shortID && uID) {
gShortZoneIdTrie->put(shortID, const_cast<UChar *>(uID), status);
}
}
}
}
delete tzenum;
}
UnicodeString&
TimeZoneFormat::parseShortZoneID(const UnicodeString& text, ParsePosition& pos, UnicodeString& tzID) const {
UErrorCode status = U_ZERO_ERROR;
umtx_initOnce(gShortZoneIdTrieInitOnce, &initShortZoneIdTrie, status);
int32_t start = pos.getIndex();
int32_t len = 0;
tzID.setToBogus();
if (U_SUCCESS(status)) {
LocalPointer<ZoneIdMatchHandler> handler(new ZoneIdMatchHandler());
gShortZoneIdTrie->search(text, start, handler.getAlias(), status);
len = handler->getMatchLen();
if (len > 0) {
tzID.setTo(handler->getID(), -1);
}
}
if (len > 0) {
pos.setIndex(start + len);
} else {
pos.setErrorIndex(start);
}
return tzID;
}
UnicodeString&
TimeZoneFormat::parseExemplarLocation(const UnicodeString& text, ParsePosition& pos, UnicodeString& tzID) const {
int32_t startIdx = pos.getIndex();
int32_t parsedPos = -1;
tzID.setToBogus();
UErrorCode status = U_ZERO_ERROR;
LocalPointer<TimeZoneNames::MatchInfoCollection> exemplarMatches(fTimeZoneNames->find(text, startIdx, UTZNM_EXEMPLAR_LOCATION, status));
if (U_FAILURE(status)) {
pos.setErrorIndex(startIdx);
return tzID;
}
int32_t matchIdx = -1;
if (!exemplarMatches.isNull()) {
for (int32_t i = 0; i < exemplarMatches->size(); i++) {
if (startIdx + exemplarMatches->getMatchLengthAt(i) > parsedPos) {
matchIdx = i;
parsedPos = startIdx + exemplarMatches->getMatchLengthAt(i);
}
}
if (parsedPos > 0) {
pos.setIndex(parsedPos);
getTimeZoneID(exemplarMatches.getAlias(), matchIdx, tzID);
}
}
if (tzID.length() == 0) {
pos.setErrorIndex(startIdx);
}
return tzID;
}
U_NAMESPACE_END
#endif