| /* |
| ****************************************************************************** |
| * |
| * Copyright (C) 1997-2005, International Business Machines |
| * Corporation and others. All Rights Reserved. |
| * |
| ****************************************************************************** |
| * |
| * FILE NAME : putil.c (previously putil.cpp and ptypes.cpp) |
| * |
| * Date Name Description |
| * 04/14/97 aliu Creation. |
| * 04/24/97 aliu Added getDefaultDataDirectory() and |
| * getDefaultLocaleID(). |
| * 04/28/97 aliu Rewritten to assume Unix and apply general methods |
| * for assumed case. Non-UNIX platforms must be |
| * special-cased. Rewrote numeric methods dealing |
| * with NaN and Infinity to be platform independent |
| * over all IEEE 754 platforms. |
| * 05/13/97 aliu Restored sign of timezone |
| * (semantics are hours West of GMT) |
| * 06/16/98 erm Added IEEE_754 stuff, cleaned up isInfinite, isNan, |
| * nextDouble.. |
| * 07/22/98 stephen Added remainder, max, min, trunc |
| * 08/13/98 stephen Added isNegativeInfinity, isPositiveInfinity |
| * 08/24/98 stephen Added longBitsFromDouble |
| * 09/08/98 stephen Minor changes for Mac Port |
| * 03/02/99 stephen Removed openFile(). Added AS400 support. |
| * Fixed EBCDIC tables |
| * 04/15/99 stephen Converted to C. |
| * 06/28/99 stephen Removed mutex locking in u_isBigEndian(). |
| * 08/04/99 jeffrey R. Added OS/2 changes |
| * 11/15/99 helena Integrated S/390 IEEE support. |
| * 04/26/01 Barry N. OS/400 support for uprv_getDefaultLocaleID |
| * 08/15/01 Steven H. OS/400 support for uprv_getDefaultCodepage |
| ****************************************************************************** |
| */ |
| |
| #ifndef PTX /* the feature-test macros below are skipped entirely when PTX is defined */ |
| |
| /* Define _XOPEN_SOURCE for Solaris and friends, unless the build already set it. */ |
| /* NetBSD needs it to be >= 4 */ |
| #ifndef _XOPEN_SOURCE |
| #define _XOPEN_SOURCE 4 |
| #endif |
| |
| /* Define __USE_POSIX and __USE_XOPEN for Linux and glibc. NOTE(review): double-underscore names are reserved for the implementation and glibc normally derives them itself from _XOPEN_SOURCE -- confirm these are still needed. */ |
| #ifndef __USE_POSIX |
| #define __USE_POSIX |
| #endif |
| #ifndef __USE_XOPEN |
| #define __USE_XOPEN |
| #endif |
| |
| #endif /* PTX */ |
| |
| /* include ICU headers */ |
| #include "unicode/utypes.h" |
| #include "unicode/putil.h" |
| #include "unicode/ustring.h" |
| #include "putilimp.h" |
| #include "uassert.h" |
| #include "umutex.h" |
| #include "cmemory.h" |
| #include "cstring.h" |
| #include "locmap.h" |
| #include "ucln_cmn.h" |
| |
| /* Include standard headers. */ |
| #include <stdio.h> |
| #include <stdlib.h> |
| #include <string.h> |
| #include <math.h> |
| #include <locale.h> |
| #include <float.h> |
| #include <time.h> |
| |
| /* include system headers */ |
| #ifdef U_WINDOWS |
| # define WIN32_LEAN_AND_MEAN |
| # define VC_EXTRALEAN |
| # define NOUSER |
| # define NOSERVICE |
| # define NOIME |
| # define NOMCX |
| # include <windows.h> |
| #elif defined(U_CYGWIN) && defined(__STRICT_ANSI__) |
| /* tzset isn't defined in strict ANSI on Cygwin. */ |
| # undef __STRICT_ANSI__ |
| #elif defined(OS400) |
| # include <float.h> |
| # include <qusec.h> /* error code structure */ |
| # include <qusrjobi.h> |
| # include <qliept.h> /* EPT_CALL macro - this include must be after all other "QSYSINCs" */ |
| #elif defined(XP_MAC) |
| # include <Files.h> |
| # include <IntlResources.h> |
| # include <Script.h> |
| # include <Folders.h> |
| # include <MacTypes.h> |
| # include <TextUtils.h> |
| # define ICU_PREVENT_USER_DATA_OVERRIDE 1 |
| #elif defined(OS390) |
| #include "unicode/ucnv.h" /* Needed for UCNV_SWAP_LFNL_OPTION_STRING */ |
| #elif defined(U_AIX) |
| #elif defined(U_SOLARIS) || defined(U_LINUX) |
| #elif defined(U_HPUX) |
| #elif defined(U_DARWIN) |
| #include <sys/file.h> |
| #include <sys/param.h> |
| #elif defined(U_QNX) |
| #include <sys/neutrino.h> |
| #endif |
| |
| #ifndef U_WINDOWS |
| #include <sys/time.h> |
| #endif |
| |
| /* |
| * Only include langinfo.h if we have a way to get the codeset. If we later |
| * depend on more features, we can test on U_HAVE_NL_LANGINFO. |
| * |
| */ |
| |
| #if U_HAVE_NL_LANGINFO_CODESET |
| #include <langinfo.h> |
| #endif |
| |
| /* Define the extension for data files, again... ("dat", without a leading dot; "again" suggests another definition exists elsewhere in the project -- not visible here.) */ |
| #define DATA_TYPE "dat" |
| |
| /* Leave this copyright notice here! It is not referenced by the code visible in this part of the file; presumably it exists so that U_COPYRIGHT_STRING ends up in the compiled object. */ |
| static const char copyright[] = U_COPYRIGHT_STRING; |
| |
| /* floating point implementations ------------------------------------------- */ |
| |
| /* We return QNAN rather than SNAN (the NaN patterns below have the top mantissa bit set). */ |
| #define SIGN 0x80000000U /* top (sign) bit of a 32-bit word */ |
| #if defined(__GNUC__) || defined(_MSC_VER) |
| /* |
| This is an optimization for when u_topNBytesOfDouble |
| and u_bottomNBytesOfDouble can't be properly optimized by the compiler |
| or when faster infinity and NaN usage is helpful. |
| It is switched on only for GCC and Microsoft compilers; every other |
| compiler takes the byte-poking path further down. |
| */ |
| #define USE_64BIT_DOUBLE_OPTIMIZATION 1 |
| #else |
| #define USE_64BIT_DOUBLE_OPTIMIZATION 0 |
| #endif |
| |
| #if USE_64BIT_DOUBLE_OPTIMIZATION |
| /* gcc 3.2 has an optimization bug (original note, not explained further). The NaN and Infinity bit patterns are kept as 64-bit integer constants and read back through the double pointers fgNan / fgInf. */ |
| static const int64_t gNan64 = INT64_C(0x7FF8000000000000); |
| static const int64_t gInf64 = INT64_C(0x7FF0000000000000); |
| static const double * fgNan = (const double *)(&gNan64); |
| static const double * fgInf = (const double *)(&gInf64); |
| #else |
| |
| #if IEEE_754 |
| #define NAN_TOP ((int16_t)0x7FF8) /* top 16 bits stored into the NaN value by uprv_getNaN() */ |
| #define INF_TOP ((int16_t)0x7FF0) /* top 16 bits stored into the Infinity value by uprv_getInfinity() */ |
| #elif defined(OS390) |
| #define NAN_TOP ((int16_t)0x7F08) /* OS/390 counterpart of the NaN top word */ |
| #define INF_TOP ((int16_t)0x3F00) /* OS/390 counterpart of the Infinity top word */ |
| #endif |
| |
| /* statics: lazily filled in by uprv_getNaN() / uprv_getInfinity(); the flags record whether that has happened yet */ |
| static UBool fgNaNInitialized = FALSE; |
| static UBool fgInfInitialized = FALSE; |
| static double gNan; |
| static double gInf; |
| static double * fgNan = &gNan; |
| static double * fgInf = &gInf; |
| #endif |
| |
| /*--------------------------------------------------------------------------- |
| Platform utilities |
| Our general strategy is to assume we're on a POSIX platform. Platforms which |
| are non-POSIX must declare themselves so. The default POSIX implementation |
| will sometimes work for non-POSIX platforms as well (e.g., the NaN-related |
| functions). |
| ---------------------------------------------------------------------------*/ |
| |
| #if defined(U_WINDOWS) || defined(XP_MAC) || defined(OS400) /* the platforms this file treats as non-POSIX */ |
| # undef U_POSIX_LOCALE |
| #else |
| # define U_POSIX_LOCALE 1 /* everything else is assumed to be POSIX */ |
| #endif |
| |
/* Utilities to get the bits from a double */
#if !USE_64BIT_DOUBLE_OPTIMIZATION
/**
 * Locate the n most significant bytes of a double in memory.
 *
 * @param d pointer to the double to inspect
 * @param n number of bytes wanted
 * @return  pointer to the first of those n bytes: the start of the object on
 *          big-endian builds, or n bytes before its end otherwise
 */
static char*
u_topNBytesOfDouble(double* d, int n)
{
#if U_IS_BIG_ENDIAN
    char *firstByte = (char *)d;
    return firstByte;
#else
    char *pastEnd = (char *)(d + 1);
    return pastEnd - n;
#endif
}
#endif
| |
/**
 * Locate the n least significant bytes of a double in memory.
 *
 * @param d pointer to the double to inspect
 * @param n number of bytes wanted
 * @return  pointer to the first of those n bytes: n bytes before the end of
 *          the object on big-endian builds, or its start otherwise
 */
static char*
u_bottomNBytesOfDouble(double* d, int n)
{
#if U_IS_BIG_ENDIAN
    char *pastEnd = (char *)(d + 1);
    return pastEnd - n;
#else
    char *firstByte = (char *)d;
    return firstByte;
#endif
}
| |
| #if defined(U_WINDOWS) |
| typedef union { |
| int64_t int64; /* the same bits viewed as one 64-bit count */ |
| FILETIME fileTime; /* filled in by GetSystemTimeAsFileTime() in uprv_getUTCtime() */ |
| } FileTimeConversion; /* This is like a ULARGE_INTEGER */ |
| |
| /* Number of 100 nanoseconds from 1/1/1601 to 1/1/1970; subtracted from the Windows time to rebase it onto the 1970 epoch */ |
| #define EPOCH_BIAS INT64_C(116444736000000000) |
| #define HECTONANOSECOND_PER_MILLISECOND 10000 /* 100 ns ticks in one millisecond */ |
| |
| #endif |
| |
| /*--------------------------------------------------------------------------- |
| Universal Implementations |
| These are designed to work on all platforms. Try these, and if they |
| don't work on your platform, then special case your platform with new |
| implementations. |
| ---------------------------------------------------------------------------*/ |
| |
| /* Return UTC (GMT) time measured in milliseconds since 0:00 on 1/1/70.*/ |
| U_CAPI UDate U_EXPORT2 |
| uprv_getUTCtime() |
| { |
| #ifdef XP_MAC |
| time_t t, t1, t2; |
| struct tm tmrec; |
| |
| uprv_memset( &tmrec, 0, sizeof(tmrec) ); |
| tmrec.tm_year = 70; |
| tmrec.tm_mon = 0; |
| tmrec.tm_mday = 1; |
| t1 = mktime(&tmrec); /* seconds of 1/1/1970*/ |
| |
| time(&t); |
| uprv_memcpy( &tmrec, gmtime(&t), sizeof(tmrec) ); |
| t2 = mktime(&tmrec); /* seconds of current GMT*/ |
| return (UDate)(t2 - t1) * U_MILLIS_PER_SECOND; /* GMT (or UTC) in seconds since 1970*/ |
| #elif defined(U_WINDOWS) |
| |
| FileTimeConversion winTime; |
| GetSystemTimeAsFileTime(&winTime.fileTime); |
| return (UDate)((winTime.int64 - EPOCH_BIAS) / HECTONANOSECOND_PER_MILLISECOND); |
| #else |
| /* |
| struct timeval posixTime; |
| gettimeofday(&posixTime, NULL); |
| return (UDate)(((int64_t)posixTime.tv_sec * U_MILLIS_PER_SECOND) + (posixTime.tv_usec/1000)); |
| */ |
| time_t epochtime; |
| time(&epochtime); |
| return (UDate)epochtime * U_MILLIS_PER_SECOND; |
| #endif |
| } |
| |
| /*----------------------------------------------------------------------------- |
| IEEE 754 |
| These methods detect and return NaN and infinity values for doubles |
| conforming to IEEE 754. Platforms which support this standard include X86, |
| Mac 680x0, Mac PowerPC, AIX RS/6000, and most others. |
| If this doesn't work on your platform, you have non-IEEE floating-point, and |
| will need to code your own versions. A naive implementation is to return 0.0 |
| for getNaN and getInfinity, and false for isNaN and isInfinite. |
| ---------------------------------------------------------------------------*/ |
| |
| U_CAPI UBool U_EXPORT2 |
| uprv_isNaN(double number) |
| { |
| #if IEEE_754 |
| #if USE_64BIT_DOUBLE_OPTIMIZATION |
| /* gcc 3.2 has an optimization bug */ |
| /* Infinity is 0x7FF0000000000000U. Anything greater than that is a NaN */ |
| return (UBool)(((*((int64_t *)&number)) & U_INT64_MAX) > gInf64); |
| |
| #else |
| /* This should work in theory, but it doesn't, so we resort to the more*/ |
| /* complicated method below.*/ |
| /* return number != number;*/ |
| |
| /* You can't return number == getNaN() because, by definition, NaN != x for*/ |
| /* all x, including NaN (that is, NaN != NaN). So instead, we compare*/ |
| /* against the known bit pattern. We must be careful of endianism here.*/ |
| /* The pattern we are looking for id:*/ |
| |
| /* 7FFy yyyy yyyy yyyy (some y non-zero)*/ |
| |
| /* There are two different kinds of NaN, but we ignore the distinction*/ |
| /* here. Note that the y value must be non-zero; if it is zero, then we*/ |
| /* have infinity.*/ |
| |
| uint32_t highBits = *(uint32_t*)u_topNBytesOfDouble(&number, |
| sizeof(uint32_t)); |
| uint32_t lowBits = *(uint32_t*)u_bottomNBytesOfDouble(&number, |
| sizeof(uint32_t)); |
| |
| return (UBool)(((highBits & 0x7FF00000L) == 0x7FF00000L) && |
| (((highBits & 0x000FFFFFL) != 0) || (lowBits != 0))); |
| #endif |
| |
| #elif defined(OS390) |
| uint32_t highBits = *(uint32_t*)u_topNBytesOfDouble(&number, |
| sizeof(uint32_t)); |
| uint32_t lowBits = *(uint32_t*)u_bottomNBytesOfDouble(&number, |
| sizeof(uint32_t)); |
| |
| return ((highBits & 0x7F080000L) == 0x7F080000L) && |
| (lowBits == 0x00000000L); |
| |
| #else |
| /* If your platform doesn't support IEEE 754 but *does* have an NaN value,*/ |
| /* you'll need to replace this default implementation with what's correct*/ |
| /* for your platform.*/ |
| return number != number; |
| #endif |
| } |
| |
| U_CAPI UBool U_EXPORT2 |
| uprv_isInfinite(double number) |
| { |
| #if IEEE_754 |
| #if USE_64BIT_DOUBLE_OPTIMIZATION |
| /* gcc 3.2 has an optimization bug */ |
| return (UBool)(((*((int64_t *)&number)) & U_INT64_MAX) == gInf64); |
| #else |
| |
| /* We know the top bit is the sign bit, so we mask that off in a copy of */ |
| /* the number and compare against infinity. [LIU]*/ |
| /* The following approach doesn't work for some reason, so we go ahead and */ |
| /* scrutinize the pattern itself. */ |
| /* double a = number; */ |
| /* *(int8_t*)u_topNBytesOfDouble(&a, 1) &= 0x7F;*/ |
| /* return a == uprv_getInfinity();*/ |
| /* Instead, We want to see either:*/ |
| |
| /* 7FF0 0000 0000 0000*/ |
| /* FFF0 0000 0000 0000*/ |
| |
| uint32_t highBits = *(uint32_t*)u_topNBytesOfDouble(&number, |
| sizeof(uint32_t)); |
| uint32_t lowBits = *(uint32_t*)u_bottomNBytesOfDouble(&number, |
| sizeof(uint32_t)); |
| |
| return (UBool)(((highBits & ~SIGN) == 0x7FF00000U) && |
| (lowBits == 0x00000000U)); |
| #endif |
| |
| #elif defined(OS390) |
| uint32_t highBits = *(uint32_t*)u_topNBytesOfDouble(&number, |
| sizeof(uint32_t)); |
| uint32_t lowBits = *(uint32_t*)u_bottomNBytesOfDouble(&number, |
| sizeof(uint32_t)); |
| |
| return ((highBits & ~SIGN) == 0x70FF0000L) && (lowBits == 0x00000000L); |
| |
| #else |
| /* If your platform doesn't support IEEE 754 but *does* have an infinity*/ |
| /* value, you'll need to replace this default implementation with what's*/ |
| /* correct for your platform.*/ |
| return number == (2.0 * number); |
| #endif |
| } |
| |
| U_CAPI UBool U_EXPORT2 |
| uprv_isPositiveInfinity(double number) |
| { |
| #if IEEE_754 || defined(OS390) |
| return (UBool)(number > 0 && uprv_isInfinite(number)); |
| #else |
| return uprv_isInfinite(number); |
| #endif |
| } |
| |
| U_CAPI UBool U_EXPORT2 |
| uprv_isNegativeInfinity(double number) |
| { |
| #if IEEE_754 || defined(OS390) |
| return (UBool)(number < 0 && uprv_isInfinite(number)); |
| |
| #else |
| uint32_t highBits = *(uint32_t*)u_topNBytesOfDouble(&number, |
| sizeof(uint32_t)); |
| return((highBits & SIGN) && uprv_isInfinite(number)); |
| |
| #endif |
| } |
| |
| U_CAPI double U_EXPORT2 |
| uprv_getNaN() |
| { |
| #if IEEE_754 || defined(OS390) |
| #if !USE_64BIT_DOUBLE_OPTIMIZATION |
| if (!fgNaNInitialized) { |
| /* This variable is always initialized with the same value, |
| so a mutex isn't needed. */ |
| int i; |
| int8_t* p = (int8_t*)fgNan; |
| for(i = 0; i < sizeof(double); ++i) |
| *p++ = 0; |
| *(int16_t*)u_topNBytesOfDouble(fgNan, sizeof(NAN_TOP)) = NAN_TOP; |
| fgNaNInitialized = TRUE; |
| } |
| #endif |
| return *fgNan; |
| #else |
| /* If your platform doesn't support IEEE 754 but *does* have an NaN value,*/ |
| /* you'll need to replace this default implementation with what's correct*/ |
| /* for your platform.*/ |
| return 0.0; |
| #endif |
| } |
| |
| U_CAPI double U_EXPORT2 |
| uprv_getInfinity() |
| { |
| #if IEEE_754 || defined(OS390) |
| #if !USE_64BIT_DOUBLE_OPTIMIZATION |
| if (!fgInfInitialized) |
| { |
| /* This variable is always initialized with the same value, |
| so a mutex isn't needed. */ |
| int i; |
| int8_t* p = (int8_t*)fgInf; |
| for(i = 0; i < sizeof(double); ++i) |
| *p++ = 0; |
| *(int16_t*)u_topNBytesOfDouble(fgInf, sizeof(INF_TOP)) = INF_TOP; |
| fgInfInitialized = TRUE; |
| } |
| #endif |
| return *fgInf; |
| #else |
| /* If your platform doesn't support IEEE 754 but *does* have an infinity*/ |
| /* value, you'll need to replace this default implementation with what's*/ |
| /* correct for your platform.*/ |
| return 0.0; |
| #endif |
| } |
| |
| U_CAPI double U_EXPORT2 |
| uprv_floor(double x) |
| { |
| return floor(x); |
| } |
| |
| U_CAPI double U_EXPORT2 |
| uprv_ceil(double x) |
| { |
| return ceil(x); |
| } |
| |
| U_CAPI double U_EXPORT2 |
| uprv_round(double x) |
| { |
| return uprv_floor(x + 0.5); |
| } |
| |
| U_CAPI double U_EXPORT2 |
| uprv_fabs(double x) |
| { |
| return fabs(x); |
| } |
| |
| U_CAPI double U_EXPORT2 |
| uprv_modf(double x, double* y) |
| { |
| return modf(x, y); |
| } |
| |
| U_CAPI double U_EXPORT2 |
| uprv_fmod(double x, double y) |
| { |
| return fmod(x, y); |
| } |
| |
| U_CAPI double U_EXPORT2 |
| uprv_pow(double x, double y) |
| { |
| /* This is declared as "double pow(double x, double y)" */ |
| return pow(x, y); |
| } |
| |
| U_CAPI double U_EXPORT2 |
| uprv_pow10(int32_t x) |
| { |
| return pow(10.0, (double)x); |
| } |
| |
| U_CAPI double U_EXPORT2 |
| uprv_fmax(double x, double y) |
| { |
| #if IEEE_754 |
| int32_t lowBits; |
| |
| /* first handle NaN*/ |
| if(uprv_isNaN(x) || uprv_isNaN(y)) |
| return uprv_getNaN(); |
| |
| /* check for -0 and 0*/ |
| lowBits = *(uint32_t*) u_bottomNBytesOfDouble(&x, sizeof(uint32_t)); |
| if(x == 0.0 && y == 0.0 && (lowBits & SIGN)) |
| return y; |
| |
| #endif |
| |
| /* this should work for all flt point w/o NaN and Infpecial cases */ |
| return (x > y ? x : y); |
| } |
| |
| U_CAPI int32_t U_EXPORT2 |
| uprv_max(int32_t x, int32_t y) |
| { |
| return (x > y ? x : y); |
| } |
| |
| U_CAPI double U_EXPORT2 |
| uprv_fmin(double x, double y) |
| { |
| #if IEEE_754 |
| int32_t lowBits; |
| |
| /* first handle NaN*/ |
| if(uprv_isNaN(x) || uprv_isNaN(y)) |
| return uprv_getNaN(); |
| |
| /* check for -0 and 0*/ |
| lowBits = *(uint32_t*) u_bottomNBytesOfDouble(&y, sizeof(uint32_t)); |
| if(x == 0.0 && y == 0.0 && (lowBits & SIGN)) |
| return y; |
| |
| #endif |
| |
| /* this should work for all flt point w/o NaN and Inf special cases */ |
| return (x > y ? y : x); |
| } |
| |
| U_CAPI int32_t U_EXPORT2 |
| uprv_min(int32_t x, int32_t y) |
| { |
| return (x > y ? y : x); |
| } |
| |
| /** |
| * Truncates the given double. |
| * trunc(3.3) = 3.0, trunc (-3.3) = -3.0 |
| * This is different than calling floor() or ceil(): |
| * floor(3.3) = 3, floor(-3.3) = -4 |
| * ceil(3.3) = 4, ceil(-3.3) = -3 |
| */ |
| U_CAPI double U_EXPORT2 |
| uprv_trunc(double d) |
| { |
| #if IEEE_754 |
| int32_t lowBits; |
| |
| /* handle error cases*/ |
| if(uprv_isNaN(d)) |
| return uprv_getNaN(); |
| if(uprv_isInfinite(d)) |
| return uprv_getInfinity(); |
| |
| lowBits = *(uint32_t*) u_bottomNBytesOfDouble(&d, sizeof(uint32_t)); |
| if( (d == 0.0 && (lowBits & SIGN)) || d < 0) |
| return ceil(d); |
| else |
| return floor(d); |
| |
| #else |
| return d >= 0 ? floor(d) : ceil(d); |
| |
| #endif |
| } |
| |
| /** |
| * Return the largest positive number that can be represented by an integer |
| * type of arbitrary bit length. |
| */ |
| U_CAPI double U_EXPORT2 |
| uprv_maxMantissa(void) |
| { |
| return pow(2.0, DBL_MANT_DIG + 1.0) - 1.0; |
| } |
| |
| /** |
| * Return the floor of the log base 10 of a given double. |
| * This method compensates for inaccuracies which arise naturally when |
| * computing logs, and always give the correct value. The parameter |
| * must be positive and finite. |
| * (Thanks to Alan Liu for supplying this function.) |
| */ |
| U_CAPI int16_t U_EXPORT2 |
| uprv_log10(double d) |
| { |
| #ifdef OS400 |
| /* We don't use the normal implementation because you can't underflow */ |
| /* a double otherwise an underflow exception occurs */ |
| return log10(d); |
| #else |
| /* The reason this routine is needed is that simply taking the*/ |
| /* log and dividing by log10 yields a result which may be off*/ |
| /* by 1 due to rounding errors. For example, the naive log10*/ |
| /* of 1.0e300 taken this way is 299, rather than 300.*/ |
| double alog10 = log(d) / log(10.0); |
| int16_t ailog10 = (int16_t) floor(alog10); |
| |
| /* Positive logs could be too small, e.g. 0.99 instead of 1.0*/ |
| if (alog10 > 0 && d >= pow(10.0, (double)(ailog10 + 1))) |
| ++ailog10; |
| |
| /* Negative logs could be too big, e.g. -0.99 instead of -1.0*/ |
| else if (alog10 < 0 && d < pow(10.0, (double)(ailog10))) |
| --ailog10; |
| |
| return ailog10; |
| #endif |
| } |
| |
| U_CAPI double U_EXPORT2 |
| uprv_log(double d) |
| { |
| return log(d); |
| } |
| |
#if 0
/* This isn't used. If it's readded, readd putiltst.c tests */
/**
 * Count the digits to the right of the decimal point in the "%+.9g"
 * rendering of x, taking a scientific-notation exponent into account.
 * Never returns a negative count.
 */
U_CAPI int32_t U_EXPORT2
uprv_digitsAfterDecimal(double x)
{
    char text[20];
    char *cursor;
    int32_t length, pointIndex, fractionDigits;
    int32_t exponent = 0;

    /* cheat and use the string-format routine to get a string representation
       (it handles mathematical inaccuracy better than we can), then find out
       how many characters are to the right of the decimal point */
    length = sprintf(text, "%+.9g", x);

    /* text[0] is the sign; walk over the integer digits that follow it */
    cursor = text + 1;
    while (isdigit(*cursor)) {
        ++cursor;
    }

    pointIndex = (int32_t)(cursor - text);
    fractionDigits = (int32_t)(length - pointIndex - 1);

    /* if the number's string representation is in scientific notation, find
       the exponent and take it into account */
    cursor = uprv_strchr(text, 'e');
    if (cursor != 0) {
        int16_t exponentIndex = (int16_t)(cursor - text);

        fractionDigits -= length - exponentIndex;
        exponent = (int32_t)(atol(cursor + 1));
    }

    /* the string representation may still have spurious decimal digits in it,
       so we cut off at the ninth digit to the right of the decimal, and have
       to search backward from there to the first non-zero digit */
    if (fractionDigits > 9) {
        fractionDigits = 9;
        while (fractionDigits > 0 && text[pointIndex + fractionDigits] == '0') {
            --fractionDigits;
        }
    }

    fractionDigits -= exponent;
    return (fractionDigits < 0) ? 0 : fractionDigits;
}
#endif
| |
| /*--------------------------------------------------------------------------- |
| Platform-specific Implementations |
| Try these, and if they don't work on your platform, then special case your |
| platform with new implementations. |
| ---------------------------------------------------------------------------*/ |
| |
| /* Win32 time zone detection ------------------------------------------------ */ |
| |
| #ifdef U_WINDOWS |
| |
| /* |
| This code attempts to detect the Windows time zone, as set in the |
| Windows Date and Time control panel. It attempts to work on |
| multiple flavors of Windows (9x, Me, NT, 2000, XP) and on localized |
| installs. It works by directly interrogating the registry and |
| comparing the data there with the data returned by the |
| GetTimeZoneInformation API, along with some other strategies. The |
| registry contains time zone data under one of two keys (depending on |
| the flavor of Windows): |
| |
| HKLM\SOFTWARE\Microsoft\Windows\CurrentVersion\Time Zones\ |
| HKLM\SOFTWARE\Microsoft\Windows NT\CurrentVersion\Time Zones\ |
| |
| Under this key are several subkeys, one for each time zone. These |
| subkeys are named "Pacific" on Win9x/Me and "Pacific Standard Time" |
| on WinNT/2k/XP. There are some other wrinkles; see the code for |
| details. The subkey name is NOT LOCALIZED, allowing us to support |
| localized installs. |
| |
| Under the subkey are data values. We care about: |
| |
| Std Standard time display name, localized |
| TZI Binary block of data |
| |
| The TZI data is of particular interest. It contains the offset, two |
| more offsets for standard and daylight time, and the start and end |
| rules. This is the same data returned by the GetTimeZoneInformation |
| API. The API may modify the data on the way out, so we have to be |
| careful, but essentially we do a binary comparison against the TZI |
| blocks of various registry keys. When we find a match, we know what |
| time zone Windows is set to. Since the registry key is not |
| localized, we can then translate the key through a simple table |
| lookup into the corresponding ICU time zone. |
| |
| This strategy doesn't always work because there are zones which |
| share an offset and rules, so more than one TZI block will match. |
| For example, both Tokyo and Seoul are at GMT+9 with no DST rules; |
| their TZI blocks are identical. For these cases, we fall back to a |
| name lookup. We attempt to match the display name as stored in the |
| registry for the current zone to the display name stored in the |
| registry for various Windows zones. By comparing the registry data |
| directly we avoid conversion complications. |
| |
| Author: Alan Liu |
| Since: ICU 2.6 |
| Based on original code by Carl Brown <cbrown@xnetinc.com> |
| */ |
| |
| /** |
| * Layout of the binary registry data under the "TZI" key. |
| * Per the overview comment in this file it holds the offset, two more |
| * offsets for standard and daylight time, and the start and end rules. |
| */ |
| typedef struct { |
| LONG Bias; /* the zone offset */ |
| LONG StandardBias; /* additional offset for standard time */ |
| LONG DaylightBias; /* additional offset for daylight time. Tweaked by GetTimeZoneInformation */ |
| SYSTEMTIME StandardDate; /* one of the two transition rules -- presumably the switch to standard time */ |
| SYSTEMTIME DaylightDate; /* the other transition rule -- presumably the switch to daylight time */ |
| } TZI; |
| |
| typedef struct { /* one row of ZONE_MAP: an ICU zone ID paired with a Windows zone ID */ |
| const char* icuid; /* ICU zone ID, e.g. "America/Los_Angeles" */ |
| const char* winid; /* Windows zone ID without the " Standard Time" suffix, e.g. "Pacific" */ |
| } WindowsICUMap; |
| |
| /** |
| * Mapping between Windows zone IDs and ICU zone IDs. This list has |
| * been mechanically checked; all zone offsets match (most important) |
| * and city names match the display city names (where possible). The |
| * presence or absence of DST differs in some cases, but this is |
| * acceptable as long as the zone is semantically the same (which has |
| * been manually checked). |
| * |
| * Windows 9x/Me zone IDs are listed as "Pacific" rather than "Pacific |
| * Standard Time", which is seen in NT/2k/XP. This is fixed-up at |
| * runtime as needed. The one exception is "Mexico Standard Time 2", |
| * which is not present on Windows 9x/Me. |
| * |
| * Zones that are not unique under Offset+Rules should be grouped |
| * together for efficiency (see code below). In addition, rules MUST |
| * be grouped so that all zones of a single offset are together. |
| * |
| * Comments list S(tandard) or D(aylight), as declared by Windows, |
| * followed by the display name (data from Windows XP). |
| * |
| * NOTE: Etc/GMT+12 is CORRECT for offset GMT-12:00. Consult |
| * documentation elsewhere for an explanation. |
| */ |
| static const WindowsICUMap ZONE_MAP[] = { |
| "Etc/GMT+12", "Dateline", /* S (GMT-12:00) International Date Line West */ |
| |
| "Pacific/Apia", "Samoa", /* S (GMT-11:00) Midway Island, Samoa */ |
| |
| "Pacific/Honolulu", "Hawaiian", /* S (GMT-10:00) Hawaii */ |
| |
| "America/Anchorage", "Alaskan", /* D (GMT-09:00) Alaska */ |
| |
| "America/Los_Angeles", "Pacific", /* D (GMT-08:00) Pacific Time (US & Canada); Tijuana */ |
| |
| "America/Phoenix", "US Mountain", /* S (GMT-07:00) Arizona */ |
| "America/Denver", "Mountain", /* D (GMT-07:00) Mountain Time (US & Canada) */ |
| "America/Chihuahua", "Mexico Standard Time 2", /* D (GMT-07:00) Chihuahua, La Paz, Mazatlan */ |
| |
| "America/Managua", "Central America", /* S (GMT-06:00) Central America */ |
| "America/Regina", "Canada Central", /* S (GMT-06:00) Saskatchewan */ |
| "America/Mexico_City", "Mexico", /* D (GMT-06:00) Guadalajara, Mexico City, Monterrey */ |
| "America/Chicago", "Central", /* D (GMT-06:00) Central Time (US & Canada) */ |
| |
| "America/Indianapolis", "US Eastern", /* S (GMT-05:00) Indiana (East) */ |
| "America/Bogota", "SA Pacific", /* S (GMT-05:00) Bogota, Lima, Quito */ |
| "America/New_York", "Eastern", /* D (GMT-05:00) Eastern Time (US & Canada) */ |
| |
| "America/Caracas", "SA Western", /* S (GMT-04:00) Caracas, La Paz */ |
| "America/Santiago", "Pacific SA", /* D (GMT-04:00) Santiago */ |
| "America/Halifax", "Atlantic", /* D (GMT-04:00) Atlantic Time (Canada) */ |
| |
| "America/St_Johns", "Newfoundland", /* D (GMT-03:30) Newfoundland */ |
| |
| "America/Buenos_Aires", "SA Eastern", /* S (GMT-03:00) Buenos Aires, Georgetown */ |
| "America/Godthab", "Greenland", /* D (GMT-03:00) Greenland */ |
| "America/Sao_Paulo", "E. South America", /* D (GMT-03:00) Brasilia */ |
| |
| "America/Noronha", "Mid-Atlantic", /* D (GMT-02:00) Mid-Atlantic */ |
| |
| "Atlantic/Cape_Verde", "Cape Verde", /* S (GMT-01:00) Cape Verde Is. */ |
| "Atlantic/Azores", "Azores", /* D (GMT-01:00) Azores */ |
| |
| "Africa/Casablanca", "Greenwich", /* S (GMT) Casablanca, Monrovia */ |
| "Europe/London", "GMT", /* D (GMT) Greenwich Mean Time : Dublin, Edinburgh, Lisbon, London */ |
| |
| "Africa/Lagos", "W. Central Africa", /* S (GMT+01:00) West Central Africa */ |
| "Europe/Berlin", "W. Europe", /* D (GMT+01:00) Amsterdam, Berlin, Bern, Rome, Stockholm, Vienna */ |
| "Europe/Paris", "Romance", /* D (GMT+01:00) Brussels, Copenhagen, Madrid, Paris */ |
| "Europe/Sarajevo", "Central European", /* D (GMT+01:00) Sarajevo, Skopje, Warsaw, Zagreb */ |
| "Europe/Belgrade", "Central Europe", /* D (GMT+01:00) Belgrade, Bratislava, Budapest, Ljubljana, Prague */ |
| |
| "Africa/Johannesburg", "South Africa", /* S (GMT+02:00) Harare, Pretoria */ |
| "Asia/Jerusalem", "Israel", /* S (GMT+02:00) Jerusalem */ |
| "Europe/Istanbul", "GTB", /* D (GMT+02:00) Athens, Istanbul, Minsk */ |
| "Europe/Helsinki", "FLE", /* D (GMT+02:00) Helsinki, Kyiv, Riga, Sofia, Tallinn, Vilnius */ |
| "Africa/Cairo", "Egypt", /* D (GMT+02:00) Cairo */ |
| "Europe/Bucharest", "E. Europe", /* D (GMT+02:00) Bucharest */ |
| |
| "Africa/Nairobi", "E. Africa", /* S (GMT+03:00) Nairobi */ |
| "Asia/Riyadh", "Arab", /* S (GMT+03:00) Kuwait, Riyadh */ |
| "Europe/Moscow", "Russian", /* D (GMT+03:00) Moscow, St. Petersburg, Volgograd */ |
| "Asia/Baghdad", "Arabic", /* D (GMT+03:00) Baghdad */ |
| |
| "Asia/Tehran", "Iran", /* D (GMT+03:30) Tehran */ |
| |
| "Asia/Muscat", "Arabian", /* S (GMT+04:00) Abu Dhabi, Muscat */ |
| "Asia/Tbilisi", "Caucasus", /* D (GMT+04:00) Baku, Tbilisi, Yerevan */ |
| |
| "Asia/Kabul", "Afghanistan", /* S (GMT+04:30) Kabul */ |
| |
| "Asia/Karachi", "West Asia", /* S (GMT+05:00) Islamabad, Karachi, Tashkent */ |
| "Asia/Yekaterinburg", "Ekaterinburg", /* D (GMT+05:00) Ekaterinburg */ |
| |
| "Asia/Calcutta", "India", /* S (GMT+05:30) Chennai, Kolkata, Mumbai, New Delhi */ |
| |
| "Asia/Katmandu", "Nepal", /* S (GMT+05:45) Kathmandu */ |
| |
| "Asia/Colombo", "Sri Lanka", /* S (GMT+06:00) Sri Jayawardenepura */ |
| "Asia/Dhaka", "Central Asia", /* S (GMT+06:00) Astana, Dhaka */ |
| "Asia/Novosibirsk", "N. Central Asia", /* D (GMT+06:00) Almaty, Novosibirsk */ |
| |
| "Asia/Rangoon", "Myanmar", /* S (GMT+06:30) Rangoon */ |
| |
| "Asia/Bangkok", "SE Asia", /* S (GMT+07:00) Bangkok, Hanoi, Jakarta */ |
| "Asia/Krasnoyarsk", "North Asia", /* D (GMT+07:00) Krasnoyarsk */ |
| |
| "Australia/Perth", "W. Australia", /* S (GMT+08:00) Perth */ |
| "Asia/Taipei", "Taipei", /* S (GMT+08:00) Taipei */ |
| "Asia/Singapore", "Singapore", /* S (GMT+08:00) Kuala Lumpur, Singapore */ |
| "Asia/Hong_Kong", "China", /* S (GMT+08:00) Beijing, Chongqing, Hong Kong, Urumqi */ |
| "Asia/Irkutsk", "North Asia East", /* D (GMT+08:00) Irkutsk, Ulaan Bataar */ |
| |
| "Asia/Tokyo", "Tokyo", /* S (GMT+09:00) Osaka, Sapporo, Tokyo */ |
| "Asia/Seoul", "Korea", /* S (GMT+09:00) Seoul */ |
| "Asia/Yakutsk", "Yakutsk", /* D (GMT+09:00) Yakutsk */ |
| |
| "Australia/Darwin", "AUS Central", /* S (GMT+09:30) Darwin */ |
| "Australia/Adelaide", "Cen. Australia", /* D (GMT+09:30) Adelaide */ |
| |
| "Pacific/Guam", "West Pacific", /* S (GMT+10:00) Guam, Port Moresby */ |
| "Australia/Brisbane", "E. Australia", /* S (GMT+10:00) Brisbane */ |
| "Asia/Vladivostok", "Vladivostok", /* D (GMT+10:00) Vladivostok */ |
| "Australia/Hobart", "Tasmania", /* D (GMT+10:00) Hobart */ |
| "Australia/Sydney", "AUS Eastern", /* D (GMT+10:00) Canberra, Melbourne, Sydney */ |
| |
| "Asia/Magadan", "Central Pacific", /* S (GMT+11:00) Magadan, Solomon Is., New Caledonia */ |
| |
| "Pacific/Fiji", "Fiji", /* S (GMT+12:00) Fiji, Kamchatka, Marshall Is. */ |
| "Pacific/Auckland", "New Zealand", /* D (GMT+12:00) Auckland, Wellington */ |
| |
| "Pacific/Tongatapu", "Tonga", /* S (GMT+13:00) Nuku'alofa */ |
| NULL, NULL |
| }; |
| |
| typedef struct { /* one row of ZONE_REMAP: a Windows zone ID and the alternate ID to retry with */ |
| const char* winid; /* Windows zone ID as it appears in ZONE_MAP */ |
| const char* altwinid; /* alternate Windows ID, prefixed with '-' or '+' (see ZONE_REMAP) */ |
| } WindowsZoneRemap; |
| |
| /** |
| * If a lookup fails, we attempt to remap certain Windows ids to |
| * alternate Windows ids. If the alternate listed here begins with |
| * '-', we use it as is (without the '-'). If it begins with '+', we |
| * append a " Standard Time" if appropriate. |
| */ |
| static const WindowsZoneRemap ZONE_REMAP[] = { |
| "Central European", "-Warsaw", |
| "Central Europe", "-Prague Bratislava", |
| "China", "-Beijing", |
| |
| "Greenwich", "+GMT", |
| "GTB", "+GFT", |
| "Arab", "+Saudi Arabia", |
| "SE Asia", "+Bangkok", |
| "AUS Eastern", "+Sydney", |
| NULL, NULL, |
| }; |
| |
| /** |
| * Various registry keys and key fragments. |
| */ |
| static const char CURRENT_ZONE_REGKEY[] = "SYSTEM\\CurrentControlSet\\Control\\TimeZoneInformation\\"; /* key describing the currently selected zone -- presumably under HKLM; confirm at the point of use */ |
| static const char STANDARD_NAME_REGKEY[] = "StandardName"; /* presumably the value under CURRENT_ZONE_REGKEY that holds the standard-time display name */ |
| static const char STANDARD_TIME_REGKEY[] = " Standard Time"; /* suffix that NT/2k/XP zone subkeys carry and 9x/Me ones do not; note the leading space */ |
| static const char TZI_REGKEY[] = "TZI"; /* value holding the binary TZI block */ |
| static const char STD_REGKEY[] = "Std"; /* value holding the localized standard-time display name */ |
| |
| /** |
| * HKLM subkeys used to probe for the flavor of Windows. Note that we |
| * specifically check for the "GMT" zone subkey; this is present on |
| * NT, but on XP has become "GMT Standard Time". We need to |
| * discriminate between these cases. |
| * |
| * The entries are laid out in flavor order (WIN_9X_ME_TYPE, then |
| * WIN_NT_TYPE); there is no entry for WIN_2K_XP_TYPE, which is the |
| * flavor assumed when neither probe matches. |
| */ |
| static const char* const WIN_TYPE_PROBE_REGKEY[] = { |
| /* WIN_9X_ME_TYPE */ |
| "SOFTWARE\\Microsoft\\Windows\\CurrentVersion\\Time Zones", |
| |
| /* WIN_NT_TYPE */ |
| "SOFTWARE\\Microsoft\\Windows NT\\CurrentVersion\\Time Zones\\GMT" |
| |
| /* otherwise: WIN_2K_XP_TYPE */ |
| }; |
| |
/**
 * Root subkeys (under HKLM) below which the individual time zone
 * keys live. Index 0 is used for WIN_9X_ME_TYPE, index 1 for every
 * other flavor of Windows. Each entry ends with a backslash so that
 * a zone name can be appended directly.
 */
static const char* const TZ_REGKEY[] = {
    "SOFTWARE\\Microsoft\\Windows\\CurrentVersion\\Time Zones\\",    /* WIN_9X_ME_TYPE */
    "SOFTWARE\\Microsoft\\Windows NT\\CurrentVersion\\Time Zones\\"  /* WIN_NT_TYPE | WIN_2K_XP_TYPE */
};
| |
/**
 * Flavor of Windows, from our perspective. This is not a real OS
 * version; it only describes how the time zone information is laid
 * out in the registry.
 */
enum {
    WIN_9X_ME_TYPE = 0,  /* zones under "...\Windows\CurrentVersion\Time Zones" */
    WIN_NT_TYPE    = 1,  /* "Windows NT" root, with a plain "GMT" zone subkey */
    WIN_2K_XP_TYPE = 2   /* anything else */
};
| |
| /** |
| * Auxiliary Windows time zone function. Attempts to open the given |
| * Windows time zone ID as a registry key. Returns ERROR_SUCCESS if |
| * successful. Caller must close the registry key. Handles |
| * variations in the resource layout in different flavors of Windows. |
| * |
| * @param hkey output parameter to receive opened registry key |
| * @param winid Windows zone ID, e.g., "Pacific", without the |
| * " Standard Time" suffix (if any). Special case "Mexico Standard Time 2" |
| * allowed. |
| * @param winType Windows flavor (WIN_9X_ME_TYPE, etc.) |
| * @return ERROR_SUCCESS upon success |
| */ |
| static LONG openTZRegKey(HKEY *hkey, const char* winid, int winType) { |
| LONG result; |
| char subKeyName[96]; |
| char* name; |
| int i; |
| |
| uprv_strcpy(subKeyName, TZ_REGKEY[(winType == WIN_9X_ME_TYPE) ? 0 : 1]); |
| name = &subKeyName[strlen(subKeyName)]; |
| uprv_strcat(subKeyName, winid); |
| if (winType != WIN_9X_ME_TYPE) { |
| /* Don't modify "Mexico Standard Time 2", which does not occur |
| on WIN_9X_ME_TYPE. Also, if the type is WIN_NT_TYPE, then |
| in practice this means the GMT key is not followed by |
| " Standard Time", so don't append in that case. */ |
| int isMexico2 = (winid[uprv_strlen(winid)- 1] == '2'); |
| if (!isMexico2 && |
| !(winType == WIN_NT_TYPE && uprv_strcmp(winid, "GMT") == 0)) { |
| uprv_strcat(subKeyName, STANDARD_TIME_REGKEY); |
| } |
| } |
| result = RegOpenKeyEx(HKEY_LOCAL_MACHINE, |
| subKeyName, |
| 0, |
| KEY_QUERY_VALUE, |
| hkey); |
| |
| if (result != ERROR_SUCCESS) { |
| /* If the primary lookup fails, try to remap the Windows zone |
| ID, according to the remapping table. */ |
| for (i=0; ZONE_REMAP[i].winid; ++i) { |
| if (uprv_strcmp(winid, ZONE_REMAP[i].winid) == 0) { |
| uprv_strcpy(name, ZONE_REMAP[i].altwinid + 1); |
| if (*(ZONE_REMAP[i].altwinid) == '+' && |
| winType != WIN_9X_ME_TYPE) { |
| uprv_strcat(subKeyName, STANDARD_TIME_REGKEY); |
| } |
| result = RegOpenKeyEx(HKEY_LOCAL_MACHINE, |
| subKeyName, |
| 0, |
| KEY_QUERY_VALUE, |
| hkey); |
| break; |
| } |
| } |
| } |
| |
| return result; |
| } |
| |
| /** |
| * Main Windows time zone detection function. Returns the Windows |
| * time zone, translated to an ICU time zone, or NULL upon failure. |
| */ |
| static const char* detectWindowsTimeZone() { |
| int winType; |
| LONG result; |
| HKEY hkey; |
| TZI tziKey; |
| TZI tziReg; |
| DWORD cbData = sizeof(TZI); |
| TIME_ZONE_INFORMATION apiTZI; |
| char stdName[32]; |
| DWORD stdNameSize; |
| char stdRegName[64]; |
| DWORD stdRegNameSize; |
| int firstMatch, lastMatch; |
| int j; |
| |
| /* Detect the version of windows by trying to open a sequence of |
| probe keys. We don't use the OS version API because what we |
| really want to know is how the registry is laid out. |
| Specifically, is it 9x/Me or not, and is it "GMT" or "GMT |
| Standard Time". */ |
| for (winType=0; winType<2; ++winType) { |
| result = RegOpenKeyEx(HKEY_LOCAL_MACHINE, |
| WIN_TYPE_PROBE_REGKEY[winType], |
| 0, |
| KEY_QUERY_VALUE, |
| &hkey); |
| RegCloseKey(hkey); |
| if (result == ERROR_SUCCESS) { |
| break; |
| } |
| } |
| |
| /* Obtain TIME_ZONE_INFORMATION from the API, and then convert it |
| to TZI. We could also interrogate the registry directly; we do |
| this below if needed. */ |
| uprv_memset(&apiTZI, 0, sizeof(apiTZI)); |
| GetTimeZoneInformation(&apiTZI); |
| tziKey.Bias = apiTZI.Bias; |
| uprv_memcpy((char *)&tziKey.StandardDate, (char*)&apiTZI.StandardDate, |
| sizeof(apiTZI.StandardDate)); |
| uprv_memcpy((char *)&tziKey.DaylightDate, (char*)&apiTZI.DaylightDate, |
| sizeof(apiTZI.DaylightDate)); |
| |
| /* For each zone that can be identified by Offset+Rules, see if we |
| have a match. Continue scanning after finding a match, |
| recording the index of the first and the last match. We have |
| to do this because some zones are not unique under |
| Offset+Rules. */ |
| firstMatch = lastMatch = -1; |
| for (j=0; ZONE_MAP[j].icuid; j++) { |
| result = openTZRegKey(&hkey, ZONE_MAP[j].winid, winType); |
| if (result == ERROR_SUCCESS) { |
| result = RegQueryValueEx(hkey, |
| TZI_REGKEY, |
| NULL, |
| NULL, |
| (LPBYTE)&tziReg, |
| &cbData); |
| } |
| RegCloseKey(hkey); |
| if (result == ERROR_SUCCESS) { |
| /* Assume that offsets are grouped together, and bail out |
| when we've scanned everything with a matching |
| offset. */ |
| if (firstMatch >= 0 && tziKey.Bias != tziReg.Bias) { |
| break; |
| } |
| /* Windows alters the DaylightBias in some situations. |
| Using the bias and the rules suffices, so overwrite |
| these unreliable fields. */ |
| tziKey.StandardBias = tziReg.StandardBias; |
| tziKey.DaylightBias = tziReg.DaylightBias; |
| if (uprv_memcmp((char *)&tziKey, (char*)&tziReg, |
| sizeof(tziKey)) == 0) { |
| if (firstMatch < 0) { |
| firstMatch = j; |
| } |
| lastMatch = j; |
| } |
| } |
| } |
| |
| /* This should never happen; if it does it means our table doesn't |
| match Windows AT ALL, perhaps because this is post-XP? */ |
| if (firstMatch < 0) { |
| return NULL; |
| } |
| |
| if (firstMatch != lastMatch) { |
| /* Offset+Rules lookup yielded >= 2 matches. Try to match the |
| localized display name. Get the name from the registry |
| (not the API). This avoids conversion issues. Use the |
| standard name, since Windows modifies the daylight name to |
| match the standard name if there is no DST. */ |
| result = RegOpenKeyEx(HKEY_LOCAL_MACHINE, |
| CURRENT_ZONE_REGKEY, |
| 0, |
| KEY_QUERY_VALUE, |
| &hkey); |
| if (result == ERROR_SUCCESS) { |
| stdNameSize = sizeof(stdName); |
| result = RegQueryValueEx(hkey, |
| (LPTSTR)STANDARD_NAME_REGKEY, |
| NULL, |
| NULL, |
| (LPBYTE)stdName, |
| &stdNameSize); |
| RegCloseKey(hkey); |
| |
| /* Scan through the Windows time zone data in the registry |
| again (just the range of zones with matching TZIs) and |
| look for a standard display name match. */ |
| for (j=firstMatch; j<=lastMatch; j++) { |
| result = openTZRegKey(&hkey, ZONE_MAP[j].winid, winType); |
| if (result == ERROR_SUCCESS) { |
| stdRegNameSize = sizeof(stdRegName); |
| result = RegQueryValueEx(hkey, |
| (LPTSTR)STD_REGKEY, |
| NULL, |
| NULL, |
| (LPBYTE)stdRegName, |
| &stdRegNameSize); |
| } |
| RegCloseKey(hkey); |
| if (result == ERROR_SUCCESS && |
| stdRegNameSize == stdNameSize && |
| uprv_memcmp(stdName, stdRegName, stdNameSize) == 0) { |
| firstMatch = j; /* record the match */ |
| break; |
| } |
| } |
| } else { |
| RegCloseKey(hkey); /* should never get here */ |
| } |
| } |
| |
| return ZONE_MAP[firstMatch].icuid; |
| } |
| |
| #endif /*U_WINDOWS*/ |
| |
| /* Generic time zone layer -------------------------------------------------- */ |
| |
| /* Time zone utilities */ |
| U_CAPI void U_EXPORT2 |
| uprv_tzset() |
| { |
| #ifdef U_TZSET |
| U_TZSET(); |
| #else |
| /* no initialization*/ |
| #endif |
| } |
| |
| U_CAPI int32_t U_EXPORT2 |
| uprv_timezone() |
| { |
| #ifdef U_TIMEZONE |
| return U_TIMEZONE; |
| #else |
| time_t t, t1, t2; |
| struct tm tmrec; |
| UBool dst_checked; |
| int32_t tdiff = 0; |
| |
| time(&t); |
| uprv_memcpy( &tmrec, localtime(&t), sizeof(tmrec) ); |
| dst_checked = (tmrec.tm_isdst != 0); /* daylight savings time is checked*/ |
| t1 = mktime(&tmrec); /* local time in seconds*/ |
| uprv_memcpy( &tmrec, gmtime(&t), sizeof(tmrec) ); |
| t2 = mktime(&tmrec); /* GMT (or UTC) in seconds*/ |
| tdiff = t2 - t1; |
| /* imitate NT behaviour, which returns same timezone offset to GMT for |
| winter and summer*/ |
| if (dst_checked) |
| tdiff += 3600; |
| return tdiff; |
| #endif |
| } |
| |
| /* Note that U_TZNAME does *not* have to be tzname, but if it is, |
| some platforms need to have it declared here. */ |
| |
| #if defined(U_TZNAME) && (defined(U_IRIX) || defined(U_DARWIN) || defined(U_CYGWIN)) |
| /* RS6000 and others reject char **tzname. */ |
| extern U_IMPORT char *U_TZNAME[]; |
| #endif |
| |
| #if defined(U_DARWIN) /* For Mac OS X */ |
| #define TZZONELINK "/etc/localtime" |
| #define TZZONEINFO "/usr/share/zoneinfo/" |
| static char *gTimeZoneBuffer = NULL; /* Heap allocated */ |
| #endif |
| |
| U_CAPI const char* U_EXPORT2 |
| uprv_tzname(int n) |
| { |
| #ifdef U_WINDOWS |
| char* id = (char*) detectWindowsTimeZone(); |
| if (id != NULL) { |
| return id; |
| } |
| #endif |
| |
| #if defined(U_DARWIN) |
| int ret; |
| |
| char *tzenv; |
| |
| tzenv = getenv("TZFILE"); |
| if (tzenv != NULL) { |
| return tzenv; |
| } |
| |
| #if 0 |
| /* TZ is often set to "PST8PDT" or similar, so we cannot use it. Alan */ |
| tzenv = getenv("TZ"); |
| if (tzenv != NULL) { |
| return tzenv; |
| } |
| #endif |
| |
| /* Caller must handle threading issues */ |
| if (gTimeZoneBuffer == NULL) { |
| gTimeZoneBuffer = (char *) uprv_malloc(MAXPATHLEN + 2); |
| |
| ret = readlink(TZZONELINK, gTimeZoneBuffer, MAXPATHLEN + 2); |
| if (0 < ret) { |
| gTimeZoneBuffer[ret] = '\0'; |
| if (uprv_strncmp(gTimeZoneBuffer, TZZONEINFO, sizeof(TZZONEINFO) - 1) == 0) { |
| return (gTimeZoneBuffer += sizeof(TZZONEINFO) - 1); |
| } |
| } |
| |
| uprv_free(gTimeZoneBuffer); |
| gTimeZoneBuffer = NULL; |
| } |
| #endif |
| |
| #ifdef U_TZNAME |
| return U_TZNAME[n]; |
| #else |
| return ""; |
| #endif |
| } |
| |
| /* Get and set the ICU data directory --------------------------------------- */ |
| |
| static char *gDataDirectory = NULL; |
| #if U_POSIX_LOCALE |
| static char *gCorrectedPOSIXLocale = NULL; /* Heap allocated */ |
| #endif |
| |
| static UBool U_CALLCONV putil_cleanup(void) |
| { |
| if (gDataDirectory && *gDataDirectory) { |
| uprv_free(gDataDirectory); |
| } |
| gDataDirectory = NULL; |
| #if U_POSIX_LOCALE |
| if (gCorrectedPOSIXLocale) { |
| uprv_free(gCorrectedPOSIXLocale); |
| gCorrectedPOSIXLocale = NULL; |
| } |
| #endif |
| return TRUE; |
| } |
| |
| /* |
| * Set the data directory. |
| * Make a copy of the passed string, and set the global data dir to point to it. |
| * TODO: see bug #2849, regarding thread safety. |
| */ |
| U_CAPI void U_EXPORT2 |
| u_setDataDirectory(const char *directory) { |
| char *newDataDir; |
| int32_t length; |
| |
| if(directory==NULL || *directory==0) { |
| /* A small optimization to prevent the malloc and copy when the |
| shared library is used, and this is a way to make sure that NULL |
| is never returned. |
| */ |
| newDataDir = (char *)""; |
| } |
| else { |
| length=(int32_t)uprv_strlen(directory); |
| newDataDir = (char *)uprv_malloc(length + 2); |
| uprv_strcpy(newDataDir, directory); |
| |
| #if (U_FILE_SEP_CHAR != U_FILE_ALT_SEP_CHAR) |
| { |
| char *p; |
| while(p = uprv_strchr(newDataDir, U_FILE_ALT_SEP_CHAR)) { |
| *p = U_FILE_SEP_CHAR; |
| } |
| } |
| #endif |
| } |
| |
| umtx_lock(NULL); |
| if (gDataDirectory && *gDataDirectory) { |
| uprv_free(gDataDirectory); |
| } |
| gDataDirectory = newDataDir; |
| ucln_common_registerCleanup(UCLN_COMMON_PUTIL, putil_cleanup); |
| umtx_unlock(NULL); |
| } |
| |
| U_CAPI UBool U_EXPORT2 |
| uprv_pathIsAbsolute(const char *path) |
| { |
| if(!path || !*path) { |
| return FALSE; |
| } |
| |
| if(*path == U_FILE_SEP_CHAR) { |
| return TRUE; |
| } |
| |
| #if (U_FILE_SEP_CHAR != U_FILE_ALT_SEP_CHAR) |
| if(*path == U_FILE_ALT_SEP_CHAR) { |
| return TRUE; |
| } |
| #endif |
| |
| #if defined(U_WINDOWS) |
| if( (((path[0] >= 'A') && (path[0] <= 'Z')) || |
| ((path[0] >= 'a') && (path[0] <= 'z'))) && |
| path[1] == ':' ) { |
| return TRUE; |
| } |
| #endif |
| |
| return FALSE; |
| } |
| |
| U_CAPI const char * U_EXPORT2 |
| u_getDataDirectory(void) { |
| const char *path = NULL; |
| |
| /* if we have the directory, then return it immediately */ |
| umtx_lock(NULL); |
| path = gDataDirectory; |
| umtx_unlock(NULL); |
| |
| if(path) { |
| return path; |
| } |
| |
| /* |
| When ICU_PREVENT_USER_DATA_OVERRIDE is defined, users aren't allowed to |
| override ICU's data with the ICU_DATA environment variable. This prevents |
| problems where multiple custom copies of ICU's specific version of data |
| are installed on a system. Either the application must define the data |
| directory with u_setDataDirectory, define ICU_DATA_DIR when compiling |
| ICU, set the data with udata_setCommonData or trust that all of the |
| required data is contained in ICU's data library that contains |
| the entry point defined by U_ICUDATA_ENTRY_POINT. |
| |
| There may also be some platforms where environment variables |
| are not allowed. |
| */ |
| # if !defined(ICU_PREVENT_USER_DATA_OVERRIDE) |
| /* First try to get the environment variable */ |
| path=getenv("ICU_DATA"); |
| # endif |
| |
| /* ICU_DATA_DIR may be set as a compile option */ |
| # ifdef ICU_DATA_DIR |
| if(path==NULL || *path==0) { |
| path=ICU_DATA_DIR; |
| } |
| # endif |
| |
| if(path==NULL) { |
| /* It looks really bad, set it to something. */ |
| path = ""; |
| } |
| |
| u_setDataDirectory(path); |
| return gDataDirectory; |
| } |
| |
| |
| |
| |
| |
| /* Macintosh-specific locale information ------------------------------------ */ |
| #ifdef XP_MAC |
| |
/**
 * One row of the Macintosh locale table. A row matches when each of
 * its first four fields is either MAC_LC_MAGIC_NUMBER (wildcard) or
 * equal to the corresponding value obtained from the system.
 */
typedef struct {
    int32_t script;
    int32_t region;
    int32_t lang;
    int32_t date_region;
    const char* posixID;    /* locale ID returned for a matching row */
} mac_lc_rec;

/* Todo: This will be updated with a newer version from www.unicode.org web
   page when it's available.*/
#define MAC_LC_MAGIC_NUMBER (-5)    /* wildcard: matches any value */
#define MAC_LC_INIT_NUMBER  (-9)    /* value not (yet) obtained from the system */

/* Rows are scanned in order and the first match wins, so the catch-all
   fallback must stay last. Regions without a known locale ID are listed
   as comments only. */
static const mac_lc_rec mac_lc_recs[] = {
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER,  0, "en_US" }, /* United States */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER,  1, "fr_FR" }, /* France */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER,  2, "en_GB" }, /* Great Britain */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER,  3, "de_DE" }, /* Germany */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER,  4, "it_IT" }, /* Italy */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER,  5, "nl_NL" }, /* Netherlands */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER,  6, "fr_BE" }, /* French for Belgium or Luxembourg */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER,  7, "sv_SE" }, /* Sweden */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER,  9, "da_DK" }, /* Denmark */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 10, "pt_PT" }, /* Portugal */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 11, "fr_CA" }, /* French Canada */
    /* Israel: this row used to carry "is_IS", which is the Icelandic
       locale (see region 21 below), not a locale for Israel. */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 13, "he_IL" }, /* Israel */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 14, "ja_JP" }, /* Japan */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 15, "en_AU" }, /* Australia */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 16, "ar_AE" }, /* the Arabic world (?) */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 17, "fi_FI" }, /* Finland */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 18, "fr_CH" }, /* French for Switzerland */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 19, "de_CH" }, /* German for Switzerland */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 20, "el_GR" }, /* Greece */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 21, "is_IS" }, /* Iceland */
    /* 22: Malta -- no locale ID assigned */
    /* 23: Cyprus -- no locale ID assigned */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 24, "tr_TR" }, /* Turkey */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 25, "sh_YU" }, /* Croatian system for Yugoslavia */
    /* 33: Hindi system for India -- no locale ID assigned */
    /* 34: Pakistan -- no locale ID assigned */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 41, "lt_LT" }, /* Lithuania */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 42, "pl_PL" }, /* Poland */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 43, "hu_HU" }, /* Hungary */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 44, "et_EE" }, /* Estonia */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 45, "lv_LV" }, /* Latvia */
    /* 46: Lapland  [Ask Rich for the data. HS] -- no locale ID assigned */
    /* 47: Faeroe Islands -- no locale ID assigned */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 48, "fa_IR" }, /* Iran */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 49, "ru_RU" }, /* Russia */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 50, "en_IE" }, /* Ireland */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 51, "ko_KR" }, /* Korea */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 52, "zh_CN" }, /* People's Republic of China */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 53, "zh_TW" }, /* Taiwan */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, 54, "th_TH" }, /* Thailand */

    /* fallback is en_US */
    { MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER, MAC_LC_MAGIC_NUMBER,
      MAC_LC_MAGIC_NUMBER, "en_US" }
};
| |
| #endif |
| |
| #if U_POSIX_LOCALE |
/*
 * Return just the POSIX id, whatever happens to be in it.
 *
 * The id is looked up once, from LC_ALL, then LANG, then
 * setlocale(LC_ALL, NULL), and remembered for later calls. If nothing
 * is found "en_US" is returned; if the id is "C" or contains a space
 * or a slash, "en_US_POSIX" is returned instead.
 */
static const char *uprv_getPOSIXID(void)
{
    static const char* posixID = NULL;

    if (posixID == NULL) {
        posixID = getenv("LC_ALL");
    }
    if (posixID == NULL) {
        posixID = getenv("LANG");
    }
    if (posixID == NULL) {
        /*
         * On Solaris two different calls to setlocale can result in
         * different values. Only get this value once.
         */
        posixID = setlocale(LC_ALL, NULL);
    }

    if (posixID == NULL) {
        /* Nothing worked.  Give it a nice value. */
        posixID = "en_US";
    }
    else if (uprv_strcmp("C", posixID) == 0
          || uprv_strchr(posixID, ' ') != NULL
          || uprv_strchr(posixID, '/') != NULL)
    {
        /* HPUX returns 'C C C C C C C' */
        /* Solaris can return /en_US/C/C/C/C/C on the second try. */
        /* Maybe we got some garbage.  Give it a nice value. */
        posixID = "en_US_POSIX";
    }

    return posixID;
}
| #endif |
| |
| /* NOTE: The caller should handle thread safety */ |
| U_CAPI const char* U_EXPORT2 |
| uprv_getDefaultLocaleID() |
| { |
| #if U_POSIX_LOCALE |
| /* |
| Note that: (a '!' means the ID is improper somehow) |
| LC_ALL ----> default_loc codepage |
| -------------------------------------------------------- |
| ab.CD ab CD |
| ab@CD ab__CD - |
| ab@CD.EF ab__CD EF |
| |
| ab_CD.EF@GH ab_CD_GH EF |
| |
| Some 'improper' ways to do the same as above: |
| ! ab_CD@GH.EF ab_CD_GH EF |
| ! ab_CD.EF@GH.IJ ab_CD_GH EF |
| ! ab_CD@ZZ.EF@GH.IJ ab_CD_GH EF |
| |
| _CD@GH _CD_GH - |
| _CD.EF@GH _CD_GH EF |
| |
| The variant cannot have dots in it. |
| The 'rightmost' variant (@xxx) wins. |
| The leftmost codepage (.xxx) wins. |
| */ |
| char *correctedPOSIXLocale = 0; |
| const char* posixID = uprv_getPOSIXID(); |
| const char *p; |
| const char *q; |
| int32_t len; |
| |
| /* Format: (no spaces) |
| ll [ _CC ] [ . MM ] [ @ VV] |
| |
| l = lang, C = ctry, M = charmap, V = variant |
| */ |
| |
| if (gCorrectedPOSIXLocale != NULL) { |
| return gCorrectedPOSIXLocale; |
| } |
| |
| if ((p = uprv_strchr(posixID, '.')) != NULL) { |
| /* assume new locale can't be larger than old one? */ |
| correctedPOSIXLocale = uprv_malloc(uprv_strlen(posixID)); |
| uprv_strncpy(correctedPOSIXLocale, posixID, p-posixID); |
| correctedPOSIXLocale[p-posixID] = 0; |
| |
| /* do not copy after the @ */ |
| if ((p = uprv_strchr(correctedPOSIXLocale, '@')) != NULL) { |
| correctedPOSIXLocale[p-correctedPOSIXLocale] = 0; |
| } |
| } |
| |
| /* Note that we scan the *uncorrected* ID. */ |
| if ((p = uprv_strrchr(posixID, '@')) != NULL) { |
| if (correctedPOSIXLocale == NULL) { |
| correctedPOSIXLocale = uprv_malloc(uprv_strlen(posixID)); |
| uprv_strncpy(correctedPOSIXLocale, posixID, p-posixID); |
| correctedPOSIXLocale[p-posixID] = 0; |
| } |
| p++; |
| |
| /* Take care of any special cases here.. */ |
| if (!uprv_strcmp(p, "nynorsk")) { |
| p = "NY"; |
| |
| /* Should we assume no_NO_NY instead of possible no__NY? |
| * if (!uprv_strcmp(correctedPOSIXLocale, "no")) { |
| * uprv_strcpy(correctedPOSIXLocale, "no_NO"); |
| * } |
| */ |
| } |
| |
| if (uprv_strchr(correctedPOSIXLocale,'_') == NULL) { |
| uprv_strcat(correctedPOSIXLocale, "__"); /* aa@b -> aa__b */ |
| } |
| else { |
| uprv_strcat(correctedPOSIXLocale, "_"); /* aa_CC@b -> aa_CC_b */ |
| } |
| |
| if ((q = uprv_strchr(p, '.')) != NULL) { |
| /* How big will the resulting string be? */ |
| len = (int32_t)(uprv_strlen(correctedPOSIXLocale) + (q-p)); |
| uprv_strncat(correctedPOSIXLocale, p, q-p); |
| correctedPOSIXLocale[len] = 0; |
| } |
| else { |
| /* Anything following the @ sign */ |
| uprv_strcat(correctedPOSIXLocale, p); |
| } |
| |
| /* Should there be a map from 'no@nynorsk' -> no_NO_NY here? |
| * How about 'russian' -> 'ru'? |
| */ |
| } |
| |
| /* Was a correction made? */ |
| if (correctedPOSIXLocale != NULL) { |
| posixID = correctedPOSIXLocale; |
| } |
| else { |
| /* copy it, just in case the original pointer goes away. See j2395 */ |
| correctedPOSIXLocale = (char *)uprv_malloc(uprv_strlen(posixID) + 1); |
| posixID = uprv_strcpy(correctedPOSIXLocale, posixID); |
| } |
| |
| if (gCorrectedPOSIXLocale == NULL) { |
| gCorrectedPOSIXLocale = correctedPOSIXLocale; |
| ucln_common_registerCleanup(UCLN_COMMON_PUTIL, putil_cleanup); |
| correctedPOSIXLocale = NULL; |
| } |
| |
| if (correctedPOSIXLocale != NULL) { /* Was already set - clean up. */ |
| uprv_free(correctedPOSIXLocale); |
| } |
| |
| return posixID; |
| |
| #elif defined(U_WINDOWS) |
| UErrorCode status = U_ZERO_ERROR; |
| LCID id = GetThreadLocale(); |
| const char* locID = uprv_convertToPosix(id, &status); |
| |
| if (U_FAILURE(status)) { |
| locID = "en_US"; |
| } |
| return locID; |
| |
| #elif defined(XP_MAC) |
| int32_t script = MAC_LC_INIT_NUMBER; |
| /* = IntlScript(); or GetScriptManagerVariable(smSysScript);*/ |
| int32_t region = MAC_LC_INIT_NUMBER; |
| /* = GetScriptManagerVariable(smRegionCode);*/ |
| int32_t lang = MAC_LC_INIT_NUMBER; |
| /* = GetScriptManagerVariable(smScriptLang);*/ |
| int32_t date_region = MAC_LC_INIT_NUMBER; |
| const char* posixID = 0; |
| int32_t count = sizeof(mac_lc_recs) / sizeof(mac_lc_rec); |
| int32_t i; |
| Intl1Hndl ih; |
| |
| ih = (Intl1Hndl) GetIntlResource(1); |
| if (ih) |
| date_region = ((uint16_t)(*ih)->intl1Vers) >> 8; |
| |
| for (i = 0; i < count; i++) { |
| if ( ((mac_lc_recs[i].script == MAC_LC_MAGIC_NUMBER) |
| || (mac_lc_recs[i].script == script)) |
| && ((mac_lc_recs[i].region == MAC_LC_MAGIC_NUMBER) |
| || (mac_lc_recs[i].region == region)) |
| && ((mac_lc_recs[i].lang == MAC_LC_MAGIC_NUMBER) |
| || (mac_lc_recs[i].lang == lang)) |
| && ((mac_lc_recs[i].date_region == MAC_LC_MAGIC_NUMBER) |
| || (mac_lc_recs[i].date_region == date_region)) |
| ) |
| { |
| posixID = mac_lc_recs[i].posixID; |
| break; |
| } |
| } |
| |
| return posixID; |
| |
| #elif defined(OS400) |
| /* locales are process scoped and are by definition thread safe */ |
| static char correctedLocale[64]; |
| const char *localeID = getenv("LC_ALL"); |
| char *p; |
| |
| if (localeID == NULL) |
| localeID = getenv("LANG"); |
| if (localeID == NULL) |
| localeID = setlocale(LC_ALL, NULL); |
| /* Make sure we have something... */ |
| if (localeID == NULL) |
| return "en_US_POSIX"; |
| |
| /* Extract the locale name from the path. */ |
| if((p = uprv_strrchr(localeID, '/')) != NULL) |
| { |
| /* Increment p to start of locale name. */ |
| p++; |
| localeID = p; |
| } |
| |
| /* Copy to work location. */ |
| uprv_strcpy(correctedLocale, localeID); |
| |
| /* Strip off the '.locale' extension. */ |
| if((p = uprv_strchr(correctedLocale, '.')) != NULL) { |
| *p = 0; |
| } |
| |
| /* Upper case the locale name. */ |
| T_CString_toUpperCase(correctedLocale); |
| |
| /* See if we are using the POSIX locale. Any of the |
| * following are equivalent and use the same QLGPGCMA |
| * (POSIX) locale. |
| * QLGPGCMA2 means UCS2 |
| * QLGPGCMA_4 means UTF-32 |
| * QLGPGCMA_8 means UTF-8 |
| */ |
| if ((uprv_strcmp("C", correctedLocale) == 0) || |
| (uprv_strcmp("POSIX", correctedLocale) == 0) || |
| (uprv_strncmp("QLGPGCMA", correctedLocale, 8) == 0)) |
| { |
| uprv_strcpy(correctedLocale, "en_US_POSIX"); |
| } |
| else |
| { |
| int16_t LocaleLen; |
| |
| /* Lower case the lang portion. */ |
| for(p = correctedLocale; *p != 0 && *p != '_'; p++) |
| { |
| *p = uprv_tolower(*p); |
| } |
| |
| /* Adjust for Euro. After '_E' add 'URO'. */ |
| LocaleLen = uprv_strlen(correctedLocale); |
| if (correctedLocale[LocaleLen - 2] == '_' && |
| correctedLocale[LocaleLen - 1] == 'E') |
| { |
| uprv_strcat(correctedLocale, "URO"); |
| } |
| |
| /* If using Lotus-based locale then convert to |
| * equivalent non Lotus. |
| */ |
| else if (correctedLocale[LocaleLen - 2] == '_' && |
| correctedLocale[LocaleLen - 1] == 'L') |
| { |
| correctedLocale[LocaleLen - 2] = 0; |
| } |
| |
| /* There are separate simplified and traditional |
| * locales called zh_HK_S and zh_HK_T. |
| */ |
| else if (uprv_strncmp(correctedLocale, "zh_HK", 5) == 0) |
| { |
| uprv_strcpy(correctedLocale, "zh_HK"); |
| } |
| |
| /* A special zh_CN_GBK locale... |
| */ |
| else if (uprv_strcmp(correctedLocale, "zh_CN_GBK") == 0) |
| { |
| uprv_strcpy(correctedLocale, "zh_CN"); |
| } |
| |
| } |
| |
| return correctedLocale; |
| #endif |
| |
| } |
| |
| |
/*
 * Determines the name of the default codepage of the platform. The
 * implementation is selected at compile time. Every variant returns
 * either a string literal or a pointer to a function-local static
 * buffer, so the result must not be freed and may be overwritten by
 * a later call.
 */
static const char*
int_getDefaultCodepage(void)
{
#if defined(OS400)
    uint32_t ccsid = 37; /* Default to ibm-37 */
    static char codepage[64];
    Qwc_JOBI0400_t jobinfo;
    Qus_EC_t error = { sizeof(Qus_EC_t) }; /* SPI error code */

    EPT_CALL(QUSRJOBI)(&jobinfo, sizeof(jobinfo), "JOBI0400",
        "*                         ", "                ", &error);

    if (error.Bytes_Available == 0) {
        if (jobinfo.Coded_Char_Set_ID != 0xFFFF) {
            ccsid = (uint32_t)jobinfo.Coded_Char_Set_ID;
        }
        else if (jobinfo.Default_Coded_Char_Set_Id != 0xFFFF) {
            ccsid = (uint32_t)jobinfo.Default_Coded_Char_Set_Id;
        }
        /* else use the default */
    }
    /* ccsid is unsigned; print it with a matching conversion */
    sprintf(codepage,"ibm-%u", (unsigned int)ccsid);
    return codepage;

#elif defined(OS390)
    static char codepage[64];
    sprintf(codepage,"%s" UCNV_SWAP_LFNL_OPTION_STRING, nl_langinfo(CODESET));
    return codepage;

#elif defined(XP_MAC)
    return "ibm-1275"; /* TODO: Macintosh Roman. There must be a better way. fixme! */

#elif defined(U_WINDOWS)
    static char codepage[64];
    /* GetACP() returns an unsigned value; print it with a matching conversion */
    sprintf(codepage, "windows-%u", (unsigned int)GetACP());
    return codepage;

#elif U_POSIX_LOCALE
    static char codesetName[100];
    char *name = NULL;
    char *euro = NULL;
    const char *localeName = NULL;

    uprv_memset(codesetName, 0, sizeof(codesetName));

    /* Check setlocale before the environment variables
       because the application may have set it first */
    /* setlocale needs "" and not NULL for Linux and Solaris */
    localeName = setlocale(LC_CTYPE, "");
    if (localeName != NULL && (name = (uprv_strchr(localeName, '.'))) != NULL) {
        /* strip the locale name and look at the suffix only */
        name = uprv_strncpy(codesetName, name+1, sizeof(codesetName));
        codesetName[sizeof(codesetName)-1] = 0;
        if ((euro = (uprv_strchr(name, '@'))) != NULL) {
           *euro = 0;
        }
        /* if we can find the codeset name from setlocale, return that. */
        if (*name) {
            return name;
        }
    }

#if U_HAVE_NL_LANGINFO_CODESET
    if (*codesetName) {
        uprv_memset(codesetName, 0, sizeof(codesetName));
    }
    /* When available, check nl_langinfo first because it usually gives more
       useful names. It depends on LC_CTYPE and not LANG or LC_ALL */
    {
        const char *codeset = nl_langinfo(U_NL_LANGINFO_CODESET);
        /* An empty answer carries no information; fall through to the
           remaining lookups instead of returning an empty name. */
        if (codeset != NULL && *codeset != 0) {
            uprv_strncpy(codesetName, codeset, sizeof(codesetName));
            codesetName[sizeof(codesetName)-1] = 0;
            return codesetName;
        }
    }
#endif

    /* Try a locale specified by the user.
       This is usually underspecified and usually checked by setlocale already. */
    if (*codesetName) {
        uprv_memset(codesetName, 0, sizeof(codesetName));
    }
    localeName = uprv_getPOSIXID();
    if (localeName != NULL && (name = (uprv_strchr(localeName, '.'))) != NULL) {
        /* strip the locale name and look at the suffix only */
        name = uprv_strncpy(codesetName, name+1, sizeof(codesetName));
        codesetName[sizeof(codesetName)-1] = 0;
        if ((euro = (uprv_strchr(name, '@'))) != NULL) {
           *euro = 0;
        }
        /* if we can find the codeset name, return that. */
        if (*name) {
            return name;
        }
    }

    if (*codesetName == 0)
    {
        /* if the table lookup failed, return US ASCII (ISO 646). */
        uprv_strcpy(codesetName, "US-ASCII");
    }
    return codesetName;
#else
    return "US-ASCII";
#endif
}
| |
| |
| U_CAPI const char* U_EXPORT2 |
| uprv_getDefaultCodepage() |
| { |
| static char const *name = NULL; |
| umtx_lock(NULL); |
| if (name == NULL) { |
| name = int_getDefaultCodepage(); |
| } |
| umtx_unlock(NULL); |
| return name; |
| } |
| |
| |
| /* end of platform-specific implementation -------------- */ |
| |
| /* version handling --------------------------------------------------------- */ |
| |
| U_CAPI void U_EXPORT2 |
| u_versionFromString(UVersionInfo versionArray, const char *versionString) { |
| char *end; |
| uint16_t part=0; |
| |
| if(versionArray==NULL) { |
| return; |
| } |
| |
| if(versionString!=NULL) { |
| for(;;) { |
| versionArray[part]=(uint8_t)uprv_strtoul(versionString, &end, 10); |
| if(end==versionString || ++part==U_MAX_VERSION_LENGTH || *end!=U_VERSION_DELIMITER) { |
| break; |
| } |
| versionString=end+1; |
| } |
| } |
| |
| while(part<U_MAX_VERSION_LENGTH) { |
| versionArray[part++]=0; |
| } |
| } |
| |
| U_CAPI void U_EXPORT2 |
| u_versionToString(UVersionInfo versionArray, char *versionString) { |
| uint16_t count, part; |
| uint8_t field; |
| |
| if(versionString==NULL) { |
| return; |
| } |
| |
| if(versionArray==NULL) { |
| versionString[0]=0; |
| return; |
| } |
| |
| /* count how many fields need to be written */ |
| for(count=4; count>0 && versionArray[count-1]==0; --count) { |
| } |
| |
| if(count <= 1) { |
| count = 2; |
| } |
| |
| /* write the first part */ |
| /* write the decimal field value */ |
| field=versionArray[0]; |
| if(field>=100) { |
| *versionString++=(char)('0'+field/100); |
| field%=100; |
| } |
| if(field>=10) { |
| *versionString++=(char)('0'+field/10); |
| field%=10; |
| } |
| *versionString++=(char)('0'+field); |
| |
| /* write the following parts */ |
| for(part=1; part<count; ++part) { |
| /* write a dot first */ |
| *versionString++=U_VERSION_DELIMITER; |
| |
| /* write the decimal field value */ |
| field=versionArray[part]; |
| if(field>=100) { |
| *versionString++=(char)('0'+field/100); |
| field%=100; |
| } |
| if(field>=10) { |
| *versionString++=(char)('0'+field/10); |
| field%=10; |
| } |
| *versionString++=(char)('0'+field); |
| } |
| |
| /* NUL-terminate */ |
| *versionString=0; |
| } |
| |
| U_CAPI void U_EXPORT2 |
| u_getVersion(UVersionInfo versionArray) { |
| u_versionFromString(versionArray, U_ICU_VERSION); |
| } |
| |
| /* |
| * Hey, Emacs, please set the following: |
| * |
| * Local Variables: |
| * indent-tabs-mode: nil |
| * End: |
| * |
| */ |