d79344d97d
X-SVN-Rev: 27644
598 lines
18 KiB
C++
598 lines
18 KiB
C++
/*
|
|
*******************************************************************************
|
|
* Copyright (C) 2007-2010, International Business Machines Corporation and *
|
|
* others. All Rights Reserved. *
|
|
*******************************************************************************
|
|
*/
|
|
|
|
#include "unicode/utypes.h"
|
|
|
|
#if !UCONFIG_NO_FORMATTING
|
|
|
|
#include "zonemeta.h"
|
|
|
|
#include "unicode/timezone.h"
|
|
#include "unicode/ustring.h"
|
|
#include "unicode/putil.h"
|
|
|
|
#include "umutex.h"
|
|
#include "uvector.h"
|
|
#include "cmemory.h"
|
|
#include "gregoimp.h"
|
|
#include "cstring.h"
|
|
#include "ucln_in.h"
|
|
#include "uassert.h"
|
|
|
|
// Mutex handed to umtx_lock()/umtx_unlock()/UMTX_CHECK() by the caching code in this file.
static UMTX gZoneMetaLock = NULL;
|
|
|
|
// Metazone mapping table
// Created lazily by ZoneMeta::getMetazoneMappings(): keys are heap-allocated UChar* time zone
// IDs and values are UVector* mapping lists; both are released through the table's deleters.
|
|
static UHashtable *gOlsonToMeta = NULL;
|
|
// Set to TRUE (under gZoneMetaLock) once gOlsonToMeta has been published.
static UBool gOlsonToMetaInitialized = FALSE;
|
|
|
|
// Country info vectors
// Created lazily by ZoneMeta::getSingleCountry(). They hold borrowed region string pointers
// (no element deleter is installed), one vector per classification result.
|
|
static UVector *gSingleZoneCountries = NULL;
|
|
static UVector *gMultiZonesCountries = NULL;
|
|
// Set to TRUE (under gZoneMetaLock) once both country vectors have been created.
static UBool gCountryInfoVectorsInitialized = FALSE;
|
|
|
|
U_CDECL_BEGIN
|
|
|
|
|
|
/**
|
|
* Cleanup callback func
|
|
*/
|
|
static UBool U_CALLCONV zoneMeta_cleanup(void)
|
|
{
|
|
umtx_destroy(&gZoneMetaLock);
|
|
|
|
if (gOlsonToMeta != NULL) {
|
|
uhash_close(gOlsonToMeta);
|
|
gOlsonToMeta = NULL;
|
|
}
|
|
gOlsonToMetaInitialized = FALSE;
|
|
|
|
delete gSingleZoneCountries;
|
|
delete gMultiZonesCountries;
|
|
gCountryInfoVectorsInitialized = FALSE;
|
|
|
|
return TRUE;
|
|
}
|
|
|
|
/**
|
|
* Deleter for UChar* string
|
|
*/
|
|
static void U_CALLCONV
|
|
deleteUCharString(void *obj) {
|
|
UChar *entry = (UChar*)obj;
|
|
uprv_free(entry);
|
|
}
|
|
|
|
/**
|
|
* Deleter for UVector
|
|
*/
|
|
static void U_CALLCONV
|
|
deleteUVector(void *obj) {
|
|
delete (U_NAMESPACE_QUALIFIER UVector*) obj;
|
|
}
|
|
|
|
/**
|
|
* Deleter for OlsonToMetaMappingEntry
|
|
*/
|
|
static void U_CALLCONV
|
|
deleteOlsonToMetaMappingEntry(void *obj) {
|
|
U_NAMESPACE_QUALIFIER OlsonToMetaMappingEntry *entry = (U_NAMESPACE_QUALIFIER OlsonToMetaMappingEntry*)obj;
|
|
uprv_free(entry);
|
|
}
|
|
|
|
U_CDECL_END
|
|
|
|
U_NAMESPACE_BEGIN
|
|
|
|
// Capacity of the fixed-size stack buffers this file uses for time zone and metazone ID keys.
#define ZID_KEY_MAX 128
|
|
|
|
// Resource names/keys used when reading metazone data (opened via ures_openDirect below).
static const char gMetaZones[] = "metaZones";
|
|
static const char gMetazoneInfo[] = "metazoneInfo";
|
|
static const char gMapTimezonesTag[] = "mapTimezones";
|
|
|
|
// Resource names/keys used by getCanonicalSystemID() to look up the canonical ID alias.
static const char gKeyTypeData[] = "keyTypeData";
|
|
static const char gTypeAliasTag[] = "typeAlias";
|
|
static const char gTimezoneTag[] = "timezone";
|
|
|
|
// Region value that the country lookups below treat as "no specific country".
static const UChar gWorld[] = {0x30, 0x30, 0x31, 0x00}; // "001"
|
|
|
|
// Default validity range applied to a metazone mapping that carries no explicit from/to dates.
static const UChar gDefaultFrom[] = {0x31, 0x39, 0x37, 0x30, 0x2D, 0x30, 0x31, 0x2D, 0x30, 0x31,
|
|
0x20, 0x30, 0x30, 0x3A, 0x30, 0x30, 0x00}; // "1970-01-01 00:00"
|
|
static const UChar gDefaultTo[] = {0x39, 0x39, 0x39, 0x39, 0x2D, 0x31, 0x32, 0x2D, 0x33, 0x31,
|
|
0x20, 0x32, 0x33, 0x3A, 0x35, 0x39, 0x00}; // "9999-12-31 23:59"
|
|
|
|
// Maps an ASCII digit code (0x30..0x39) to its value 0..9, or yields -1 for anything else.
// The argument is evaluated more than once, so it must be free of side effects.
#define ASCII_DIGIT(c) (((c)>=0x30 && (c)<=0x39) ? (c)-0x30 : -1)
|
|
|
|
/*
|
|
* Convert a date string used by metazone mappings to UDate.
|
|
* The format used by CLDR metazone mapping is "yyyy-MM-dd HH:mm".
|
|
*/
|
|
static UDate
|
|
parseDate (const UChar *text, UErrorCode &status) {
|
|
if (U_FAILURE(status)) {
|
|
return 0;
|
|
}
|
|
int32_t len = u_strlen(text);
|
|
if (len != 16 && len != 10) {
|
|
// It must be yyyy-MM-dd HH:mm (length 16) or yyyy-MM-dd (length 10)
|
|
status = U_INVALID_FORMAT_ERROR;
|
|
return 0;
|
|
}
|
|
|
|
int32_t year = 0, month = 0, day = 0, hour = 0, min = 0, n;
|
|
int32_t idx;
|
|
|
|
// "yyyy" (0 - 3)
|
|
for (idx = 0; idx <= 3 && U_SUCCESS(status); idx++) {
|
|
n = ASCII_DIGIT((int32_t)text[idx]);
|
|
if (n >= 0) {
|
|
year = 10*year + n;
|
|
} else {
|
|
status = U_INVALID_FORMAT_ERROR;
|
|
}
|
|
}
|
|
// "MM" (5 - 6)
|
|
for (idx = 5; idx <= 6 && U_SUCCESS(status); idx++) {
|
|
n = ASCII_DIGIT((int32_t)text[idx]);
|
|
if (n >= 0) {
|
|
month = 10*month + n;
|
|
} else {
|
|
status = U_INVALID_FORMAT_ERROR;
|
|
}
|
|
}
|
|
// "dd" (8 - 9)
|
|
for (idx = 8; idx <= 9 && U_SUCCESS(status); idx++) {
|
|
n = ASCII_DIGIT((int32_t)text[idx]);
|
|
if (n >= 0) {
|
|
day = 10*day + n;
|
|
} else {
|
|
status = U_INVALID_FORMAT_ERROR;
|
|
}
|
|
}
|
|
if (len == 16) {
|
|
// "HH" (11 - 12)
|
|
for (idx = 11; idx <= 12 && U_SUCCESS(status); idx++) {
|
|
n = ASCII_DIGIT((int32_t)text[idx]);
|
|
if (n >= 0) {
|
|
hour = 10*hour + n;
|
|
} else {
|
|
status = U_INVALID_FORMAT_ERROR;
|
|
}
|
|
}
|
|
// "mm" (14 - 15)
|
|
for (idx = 14; idx <= 15 && U_SUCCESS(status); idx++) {
|
|
n = ASCII_DIGIT((int32_t)text[idx]);
|
|
if (n >= 0) {
|
|
min = 10*min + n;
|
|
} else {
|
|
status = U_INVALID_FORMAT_ERROR;
|
|
}
|
|
}
|
|
}
|
|
|
|
if (U_SUCCESS(status)) {
|
|
UDate date = Grego::fieldsToDay(year, month - 1, day) * U_MILLIS_PER_DAY
|
|
+ hour * U_MILLIS_PER_HOUR + min * U_MILLIS_PER_MINUTE;
|
|
return date;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
/*
 * Resolve tzid to its canonical system ID and store it in systemID.
 *
 * The ID is first dereferenced through the tz data links; the result is then
 * looked up (with '/' replaced by ':') in keyTypeData/typeAlias/timezone and,
 * when an alias entry exists, the alias value is used instead.
 * If tzid cannot be dereferenced, systemID is emptied and status is set to
 * U_ILLEGAL_ARGUMENT_ERROR. Returns systemID.
 */
UnicodeString& U_EXPORT2
ZoneMeta::getCanonicalSystemID(const UnicodeString &tzid, UnicodeString &systemID, UErrorCode& status) {
    // Dereference the input ID using the tz data first
    const UChar *resolved = TimeZone::dereferOlsonLink(tzid);

    if (resolved != NULL) {
        char key[ZID_KEY_MAX];
        const int32_t idLen = u_strlen(resolved);

        // IDs that do not fit the key buffer skip the CLDR alias lookup.
        if (idLen < (int32_t)sizeof(key)) {
            u_UCharsToChars(resolved, key, idLen + 1 /* include the terminator */);

            // resource keys use ':' where the ID has '/'
            for (char *cursor = key; *cursor != 0; ++cursor) {
                if (*cursor == '/') {
                    *cursor = ':';
                }
            }

            // A failed lookup is not an error: the dereferenced ID is kept.
            UErrorCode lookupStatus = U_ZERO_ERROR;
            UResourceBundle *bundle = ures_openDirect(NULL, gKeyTypeData, &lookupStatus);
            ures_getByKey(bundle, gTypeAliasTag, bundle, &lookupStatus);
            ures_getByKey(bundle, gTimezoneTag, bundle, &lookupStatus);
            const UChar *alias = ures_getStringByKey(bundle, key, NULL, &lookupStatus);
            if (U_SUCCESS(lookupStatus)) {
                // canonical map found
                resolved = alias;
            }
            ures_close(bundle);
        }
    }

    if (resolved != NULL) {
        systemID.setTo(resolved);
    } else {
        systemID.remove();
        status = U_ILLEGAL_ARGUMENT_ERROR;
    }

    return systemID;
}
|
|
|
|
/*
 * Store the region reported by TimeZone::getRegion() for tzid in
 * canonicalCountry, or empty it when that region is "001" (world).
 * Returns canonicalCountry.
 */
UnicodeString& U_EXPORT2
ZoneMeta::getCanonicalCountry(const UnicodeString &tzid, UnicodeString &canonicalCountry) {
    const UChar *zoneRegion = TimeZone::getRegion(tzid);
    const UBool isWorld = (u_strcmp(gWorld, zoneRegion) == 0);

    if (isWorld) {
        canonicalCountry.remove();
        return canonicalCountry;
    }

    canonicalCountry.setTo(zoneRegion, -1);
    return canonicalCountry;
}
|
|
|
|
/*
 * Store the region of tzid in country only when every zone enumerated for
 * that region resolves to the same canonical system ID; otherwise country
 * is emptied. Returns country.
 *
 * The per-region answer is cached in gSingleZoneCountries /
 * gMultiZonesCountries (guarded by gZoneMetaLock). Any error while
 * computing the answer is treated as "multiple zones", i.e. an empty result.
 */
UnicodeString& U_EXPORT2
ZoneMeta::getSingleCountry(const UnicodeString &tzid, UnicodeString &country) {
    // Get canonical country for the zone
    const UChar *region = TimeZone::getRegion(tzid);
    if (u_strcmp(gWorld, region) == 0) {
        // special case - "001"
        country.remove();
        return country;
    }

    // Make sure the cache vectors exist
    UErrorCode status = U_ZERO_ERROR;
    UBool initialized;
    UMTX_CHECK(&gZoneMetaLock, gCountryInfoVectorsInitialized, initialized);
    if (!initialized) {
        // Create empty vectors
        umtx_lock(&gZoneMetaLock);
        {
            if (!gCountryInfoVectorsInitialized) {
                // No deleters for these UVectors, it's a reference to a resource bundle string.
                gSingleZoneCountries = new UVector(NULL, uhash_compareUChars, status);
                if (gSingleZoneCountries == NULL) {
                    status = U_MEMORY_ALLOCATION_ERROR;
                }
                gMultiZonesCountries = new UVector(NULL, uhash_compareUChars, status);
                if (gMultiZonesCountries == NULL) {
                    status = U_MEMORY_ALLOCATION_ERROR;
                }

                if (U_SUCCESS(status)) {
                    gCountryInfoVectorsInitialized = TRUE;
                } else {
                    // Reset the globals so that neither a retry nor the
                    // cleanup callback sees a dangling pointer.
                    delete gSingleZoneCountries;
                    gSingleZoneCountries = NULL;
                    delete gMultiZonesCountries;
                    gMultiZonesCountries = NULL;
                }
            }
        }
        umtx_unlock(&gZoneMetaLock);

        if (U_FAILURE(status)) {
            country.remove();
            return country;
        }

        // The vectors are released by zoneMeta_cleanup(); register it here as
        // well, because this path may run without getMetazoneMappings() ever
        // being called. Registering the same function repeatedly is harmless.
        ucln_i18n_registerCleanup(UCLN_I18N_ZONEMETA, zoneMeta_cleanup);
    }

    // Check if it was already cached
    UBool cached = FALSE;
    UBool multiZones = FALSE;
    umtx_lock(&gZoneMetaLock);
    {
        multiZones = cached = gMultiZonesCountries->contains((void*)region);
        if (!multiZones) {
            cached = gSingleZoneCountries->contains((void*)region);
        }
    }
    umtx_unlock(&gZoneMetaLock);

    if (!cached) {
        // We need to go through all zones associated with the region.
        // This is relatively heavy operation.

        U_ASSERT(u_strlen(region) == 2);

        char buf[] = {0, 0, 0};
        u_UCharsToChars(region, buf, 2);

        StringEnumeration *ids = TimeZone::createEnumeration(buf);
        if (ids == NULL) {
            // enumeration could not be created - handled as an error below
            status = U_MEMORY_ALLOCATION_ERROR;
        } else {
            int32_t idsLen = ids->count(status);
            if (U_SUCCESS(status) && idsLen > 1) {
                // multiple zones are available for the region
                UnicodeString canonical, tmp;
                const UnicodeString *id = ids->snext(status);
                if (id != NULL) {
                    getCanonicalSystemID(*id, canonical, status);
                } else if (U_SUCCESS(status)) {
                    // count() promised elements but none was delivered
                    status = U_INVALID_STATE_ERROR;
                }
                if (U_SUCCESS(status)) {
                    // check if there are any other canonical zone in the group
                    while ((id = ids->snext(status)) != NULL) {
                        getCanonicalSystemID(*id, tmp, status);
                        if (U_FAILURE(status)) {
                            break;
                        }
                        if (canonical != tmp) {
                            // another canonical zone was found
                            multiZones = TRUE;
                            break;
                        }
                    }
                }
            }
        }
        if (U_FAILURE(status)) {
            // no single country by default for any error cases
            multiZones = TRUE;
        }
        delete ids;

        // Cache the result
        umtx_lock(&gZoneMetaLock);
        {
            // Caching is best effort: a failed insert only means the work is
            // repeated on the next call.
            UErrorCode ec = U_ZERO_ERROR;
            UVector *target = multiZones ? gMultiZonesCountries : gSingleZoneCountries;
            if (!target->contains((void*)region)) {
                target->addElement((void*)region, ec);
            }
        }
        umtx_unlock(&gZoneMetaLock);
    }

    if (multiZones) {
        country.remove();
    } else {
        country.setTo(region, -1);
    }
    return country;
}
|
|
|
|
/*
 * Store in result the metazone ID of the first mapping of tzid whose
 * [from, to) interval contains date. result is emptied when tzid has no
 * mappings or none of them covers date. Returns result.
 */
UnicodeString& U_EXPORT2
ZoneMeta::getMetazoneID(const UnicodeString &tzid, UDate date, UnicodeString &result) {
    const UVector *mappings = getMetazoneMappings(tzid);

    if (mappings != NULL) {
        for (int32_t idx = 0; idx < mappings->size(); ++idx) {
            const OlsonToMetaMappingEntry *candidate =
                (const OlsonToMetaMappingEntry*)mappings->elementAt(idx);
            // "from" is inclusive, "to" is exclusive
            if (date >= candidate->from && date < candidate->to) {
                result.setTo(candidate->mzid, -1);
                return result;
            }
        }
    }

    // nothing matched
    result.remove();
    return result;
}
|
|
|
|
/*
 * Return the metazone mappings (a vector of OlsonToMetaMappingEntry) for
 * tzid, building them with createMetazoneMappings() and caching them in
 * gOlsonToMeta on first use.
 *
 * The returned vector is owned by the cache; callers must not delete it.
 * Returns NULL when tzid does not fit a ZID_KEY_MAX buffer (terminator
 * included), when no mappings are available, or on allocation failure.
 */
const UVector* U_EXPORT2
ZoneMeta::getMetazoneMappings(const UnicodeString &tzid) {
    UErrorCode status = U_ZERO_ERROR;
    UChar tzidUChars[ZID_KEY_MAX];
    tzid.extract(tzidUChars, ZID_KEY_MAX, status);
    if (U_FAILURE(status) || status == U_STRING_NOT_TERMINATED_WARNING) {
        return NULL;
    }

    UBool initialized;
    UMTX_CHECK(&gZoneMetaLock, gOlsonToMetaInitialized, initialized);
    if (!initialized) {
        // Build the table outside the lock, then publish it if nobody else did.
        UHashtable *tmpOlsonToMeta = uhash_open(uhash_hashUChars, uhash_compareUChars, NULL, &status);
        if (U_FAILURE(status)) {
            return NULL;
        }
        uhash_setKeyDeleter(tmpOlsonToMeta, deleteUCharString);
        uhash_setValueDeleter(tmpOlsonToMeta, deleteUVector);

        umtx_lock(&gZoneMetaLock);
        {
            if (!gOlsonToMetaInitialized) {
                gOlsonToMeta = tmpOlsonToMeta;
                tmpOlsonToMeta = NULL;
                gOlsonToMetaInitialized = TRUE;
            }
        }
        umtx_unlock(&gZoneMetaLock);

        // OK to call the following multiple times with the same function
        ucln_i18n_registerCleanup(UCLN_I18N_ZONEMETA, zoneMeta_cleanup);
        if (tmpOlsonToMeta != NULL) {
            // another thread published its table first; discard ours
            uhash_close(tmpOlsonToMeta);
        }
    }

    // get the mapping from cache
    const UVector *result = NULL;

    umtx_lock(&gZoneMetaLock);
    {
        result = (UVector*) uhash_get(gOlsonToMeta, tzidUChars);
    }
    umtx_unlock(&gZoneMetaLock);

    if (result != NULL) {
        return result;
    }

    // miss the cache - create new one
    UVector *tmpResult = createMetazoneMappings(tzid);
    if (tmpResult == NULL) {
        // not available
        return NULL;
    }

    // put the new one into the cache
    umtx_lock(&gZoneMetaLock);
    {
        // re-check: another thread may have added the entry in the meantime
        result = (UVector*) uhash_get(gOlsonToMeta, tzidUChars);
        if (result == NULL) {
            // add the one just created
            int32_t tzidLen = tzid.length() + 1;
            UChar *key = (UChar*)uprv_malloc(tzidLen * sizeof(UChar));
            if (key == NULL) {
                // memory allocation error.. just return NULL.
                // tmpResult was never handed to the table, so it is still ours.
                result = NULL;
                delete tmpResult;
            } else {
                tzid.extract(key, tzidLen, status);
                uhash_put(gOlsonToMeta, key, tmpResult, &status);
                // The table has key and value deleters, so uhash_put() adopts
                // both arguments and releases them itself when it fails.
                // Deleting tmpResult here as well would free it twice.
                result = U_FAILURE(status) ? NULL : tmpResult;
            }
        } else {
            // another thread already put the one
            delete tmpResult;
        }
    }
    umtx_unlock(&gZoneMetaLock);

    return result;
}
|
|
|
|
/*
 * Build a new vector of OlsonToMetaMappingEntry for tzid from the
 * metaZones/metazoneInfo resource, keyed by the canonical ID of tzid with
 * '/' replaced by ':'.
 *
 * Each resource item supplies the metazone name at index 0 and, when it has
 * exactly three strings, the from/to dates at indexes 1 and 2; otherwise the
 * default range (gDefaultFrom .. gDefaultTo) applies. Items that cannot be
 * read or whose dates do not parse are skipped.
 *
 * The caller owns the returned vector, whose element deleter frees the
 * entries. Returns NULL when no mapping is available or when memory
 * allocation fails.
 */
UVector*
ZoneMeta::createMetazoneMappings(const UnicodeString &tzid) {
    UVector *mzMappings = NULL;
    UErrorCode status = U_ZERO_ERROR;

    UnicodeString canonicalID;
    UResourceBundle *rb = ures_openDirect(NULL, gMetaZones, &status);
    ures_getByKey(rb, gMetazoneInfo, rb, &status);
    TimeZone::getCanonicalID(tzid, canonicalID, status);

    if (U_SUCCESS(status)) {
        char tzKey[ZID_KEY_MAX];
        int32_t keyLen = canonicalID.extract(0, canonicalID.length(), tzKey, sizeof(tzKey), US_INV);
        if (keyLen >= (int32_t)sizeof(tzKey)) {
            // The ID did not fit, so tzKey is not NUL-terminated and must not
            // be scanned or used as a resource key.
            ures_close(rb);
            return NULL;
        }

        // tzid keys are using ':' as separators
        for (char *p = tzKey; *p != 0; p++) {
            if (*p == '/') {
                *p = ':';
            }
        }

        ures_getByKey(rb, tzKey, rb, &status);

        if (U_SUCCESS(status)) {
            UResourceBundle *mz = NULL;
            while (ures_hasNext(rb)) {
                mz = ures_getNextResource(rb, mz, &status);

                const UChar *mz_name = ures_getStringByIndex(mz, 0, NULL, &status);
                const UChar *mz_from = gDefaultFrom;
                const UChar *mz_to = gDefaultTo;

                if (ures_getSize(mz) == 3) {
                    mz_from = ures_getStringByIndex(mz, 1, NULL, &status);
                    mz_to = ures_getStringByIndex(mz, 2, NULL, &status);
                }

                if (U_FAILURE(status)) {
                    // unreadable item - skip it
                    status = U_ZERO_ERROR;
                    continue;
                }
                // We do not want to use SimpleDateformat to parse boundary dates,
                // because this code could be triggered by the initialization code
                // used by SimpleDateFormat.
                UDate from = parseDate(mz_from, status);
                UDate to = parseDate(mz_to, status);
                if (U_FAILURE(status)) {
                    // malformed date - skip it
                    status = U_ZERO_ERROR;
                    continue;
                }

                // Create the vector before the entry so that a failure here
                // leaves nothing but the vector itself to release.
                if (mzMappings == NULL) {
                    mzMappings = new UVector(deleteOlsonToMetaMappingEntry, NULL, status);
                    if (mzMappings == NULL && U_SUCCESS(status)) {
                        status = U_MEMORY_ALLOCATION_ERROR;
                    }
                    if (U_FAILURE(status)) {
                        // released exactly once, after the loop
                        break;
                    }
                }

                OlsonToMetaMappingEntry *entry = (OlsonToMetaMappingEntry*)uprv_malloc(sizeof(OlsonToMetaMappingEntry));
                if (entry == NULL) {
                    status = U_MEMORY_ALLOCATION_ERROR;
                    break;
                }
                entry->mzid = mz_name;
                entry->from = from;
                entry->to = to;

                mzMappings->addElement(entry, status);
                if (U_FAILURE(status)) {
                    // the vector did not take the entry, so it is still ours
                    uprv_free(entry);
                    break;
                }
            }
            ures_close(mz);
            if (U_FAILURE(status)) {
                // single release point for a partially built vector
                delete mzMappings;
                mzMappings = NULL;
            }
        }
    }
    ures_close(rb);
    return mzMappings;
}
|
|
|
|
/*
 * Look up the time zone ID mapped to metazone mzid in
 * metaZones/mapTimezones and store it in result.
 *
 * When region is 2 or 3 code units long, the key "<mzid>:<region>" is tried
 * first and the plain "<mzid>" key is the fallback if that resource is
 * missing. result is emptied when nothing is found or when mzid is too long
 * for the key buffer. Returns result.
 */
UnicodeString& U_EXPORT2
ZoneMeta::getZoneIdByMetazone(const UnicodeString &mzid, const UnicodeString &region, UnicodeString &result) {

    char *pRegionSuffix = NULL;
    // room for the metazone ID, ':', up to 3 region characters and the terminator
    char mzidChars[ZID_KEY_MAX + 4];
    int32_t mzLen = mzid.extract(0, mzid.length(), mzidChars, ZID_KEY_MAX, US_INV);
    if (mzLen >= ZID_KEY_MAX) {
        // extract() reports the full length even when it does not fit; using
        // it as an index would write outside mzidChars.
        result.remove();
        return result;
    }

    if (region.length() == 2 || region.length() == 3) {
        pRegionSuffix = &mzidChars[mzLen];
        *pRegionSuffix = ':';
        // The suffix starts one past the ':' - the capacity must account for it.
        region.extract(0, region.length(), pRegionSuffix + 1,
                       (int32_t)sizeof(mzidChars) - mzLen - 1, US_INV);
    }

    UErrorCode status = U_ZERO_ERROR;
    const UChar *tzid = NULL;
    int32_t tzidLen = 0;

    UResourceBundle *rb = ures_openDirect(NULL, gMetaZones, &status);
    ures_getByKey(rb, gMapTimezonesTag, rb, &status);
    if (U_SUCCESS(status)) {
        tzid = ures_getStringByKey(rb, mzidChars, &tzidLen, &status);
        if (status == U_MISSING_RESOURCE_ERROR && pRegionSuffix != NULL) {
            status = U_ZERO_ERROR;
            // try key without region
            *pRegionSuffix = 0;
            tzid = ures_getStringByKey(rb, mzidChars, &tzidLen, &status);
        }
    }
    ures_close(rb);

    if (tzid != NULL && tzidLen > 0) {
        result.setTo(tzid, tzidLen);
    } else {
        result.remove();
    }

    return result;
}
|
|
|
|
|
|
U_NAMESPACE_END
|
|
|
|
#endif /* #if !UCONFIG_NO_FORMATTING */
|