src/com/ibm/icu/util/ULocale.java - external/github.com/unicode-org/icu - Git at Google

 /*
 ******************************************************************************
 * Copyright (C) 2003-2009, International Business Machines Corporation and   *
 * others. All Rights Reserved.                                               *
 ******************************************************************************
 */

 package com.ibm.icu.util;

 import java.io.Serializable;
 import java.text.ParseException;
 import java.util.Collections;
 import java.util.Comparator;
 import java.util.Iterator;
 import java.util.Locale;
 import java.util.Map;
 import java.util.MissingResourceException;
 import java.util.Set;
 import java.util.TreeMap;

 import com.ibm.icu.impl.ICUCache;
 import com.ibm.icu.impl.ICUResourceBundle;
 import com.ibm.icu.impl.LocaleUtility;
 import com.ibm.icu.impl.SimpleCache;
 import com.ibm.icu.impl.Utility;
 import com.ibm.icu.impl.locale.AsciiUtil;
 import com.ibm.icu.impl.locale.BaseLocale;
 import com.ibm.icu.impl.locale.InternalLocaleBuilder;
 import com.ibm.icu.impl.locale.LanguageTag;
 import com.ibm.icu.impl.locale.LocaleExtensions;
 import com.ibm.icu.impl.locale.LocaleSyntaxException;
 import com.ibm.icu.impl.locale.LanguageTag.Extension;

 /**
  * A class analogous to {@link java.util.Locale} that provides additional
  * support for ICU protocol.  In ICU 3.0 this class is enhanced to support
  * RFC 3066 language identifiers.
  *
  * <p>Many classes and services in ICU follow a factory idiom, in
  * which a factory method or object responds to a client request with
  * an object.  The request includes a locale (the <i>requested</i>
  * locale), and the returned object is constructed using data for that
  * locale.  The system may lack data for the requested locale, in
  * which case the locale fallback mechanism will be invoked until a
  * populated locale is found (the <i>valid</i> locale).  Furthermore,
  * even when a populated locale is found (the <i>valid</i> locale),
  * further fallback may be required to reach a locale containing the
  * specific data required by the service (the <i>actual</i> locale).
  *
  * <p>ULocale performs <b>'normalization'</b> and <b>'canonicalization'</b> of locale ids.
  * Normalization 'cleans up' ICU locale ids as follows:
  * <ul>
  * <li>language, script, country, variant, and keywords are properly cased<br>
  * (lower, title, upper, upper, and lower case respectively)</li>
  * <li>hyphens used as separators are converted to underscores</li>
  * <li>three-letter language and country ids are converted to two-letter
  * equivalents where available</li>
  * <li>surrounding spaces are removed from keywords and values</li>
  * <li>if there are multiple keywords, they are put in sorted order</li>
  * </ul>
  * Canonicalization additionally performs the following:
  * <ul>
  * <li>POSIX ids are converted to ICU format IDs</li>
  * <li>'grandfathered' 3066 ids are converted to ICU standard form</li>
  * <li>'PREEURO' and 'EURO' variants are converted to currency keyword form, with the currency
  * id appropriate to the country of the locale (for PREEURO) or EUR (for EURO).</li>
  * </ul>
  * <p>All ULocale constructors automatically normalize the locale id.  To handle
  * POSIX ids, <code>canonicalize</code> can be called to convert the id
  * to canonical form, or the <code>canonicalInstance</code> factory method
  * can be called.</p>
  *
  * <p>This class provides selectors {@link #VALID_LOCALE} and {@link
  * #ACTUAL_LOCALE} intended for use in methods named
  * <tt>getLocale()</tt>.  These methods exist in several ICU classes,
  * including {@link com.ibm.icu.util.Calendar}, {@link
  * com.ibm.icu.util.Currency}, {@link com.ibm.icu.text.UFormat},
  * {@link com.ibm.icu.text.BreakIterator}, {@link
  * com.ibm.icu.text.Collator}, {@link
  * com.ibm.icu.text.DateFormatSymbols}, and {@link
  * com.ibm.icu.text.DecimalFormatSymbols} and their subclasses, if
  * any.  Once an object of one of these classes has been created,
  * <tt>getLocale()</tt> may be called on it to determine the valid and
  * actual locale arrived at during the object's construction.
  *
  * <p>Note: The <tt>getLocale()</tt> method will be implemented in ICU
  * 3.0; ICU 2.8 contains a partial preview implementation.  The
  * <i>actual</i> locale is returned correctly, but the <i>valid</i>
  * locale is not, in most cases.
  *
  * @see java.util.Locale
  * @author weiv
  * @author Alan Liu
  * @author Ram Viswanadha
  * @stable ICU 2.8
  */
 public final class ULocale implements Serializable {
     // Serialization version id, generated with serialver from jdk1.4.2_05.
     // Keep this value fixed so that previously serialized instances stay readable.
     private static final long serialVersionUID = 3715177670352309217L;

     /**
      * Useful constant for language: locale id <code>"en"</code>, paired with
      * {@link java.util.Locale#ENGLISH}.
      * @stable ICU 3.0
      */
     public static final ULocale ENGLISH = new ULocale("en", Locale.ENGLISH);

     /**
      * Useful constant for language: locale id <code>"fr"</code>, paired with
      * {@link java.util.Locale#FRENCH}.
      * @stable ICU 3.0
      */
     public static final ULocale FRENCH = new ULocale("fr", Locale.FRENCH);

     /**
      * Useful constant for language: locale id <code>"de"</code>, paired with
      * {@link java.util.Locale#GERMAN}.
      * @stable ICU 3.0
      */
     public static final ULocale GERMAN = new ULocale("de", Locale.GERMAN);

     /**
      * Useful constant for language: locale id <code>"it"</code>, paired with
      * {@link java.util.Locale#ITALIAN}.
      * @stable ICU 3.0
      */
     public static final ULocale ITALIAN = new ULocale("it", Locale.ITALIAN);

     /**
      * Useful constant for language: locale id <code>"ja"</code>, paired with
      * {@link java.util.Locale#JAPANESE}.
      * @stable ICU 3.0
      */
     public static final ULocale JAPANESE = new ULocale("ja", Locale.JAPANESE);

     /**
      * Useful constant for language: locale id <code>"ko"</code>, paired with
      * {@link java.util.Locale#KOREAN}.
      * @stable ICU 3.0
      */
     public static final ULocale KOREAN = new ULocale("ko", Locale.KOREAN);

     /**
      * Useful constant for language: locale id <code>"zh"</code>, paired with
      * {@link java.util.Locale#CHINESE}.
      * @stable ICU 3.0
      */
     public static final ULocale CHINESE = new ULocale("zh", Locale.CHINESE);

     /**
      * Useful constant for language: locale id <code>"zh_Hans"</code>.  Note that
      * the paired Java locale is the language-only {@link java.util.Locale#CHINESE},
      * not <code>Locale.SIMPLIFIED_CHINESE</code>.
      * @stable ICU 3.0
      */
     public static final ULocale SIMPLIFIED_CHINESE = new ULocale("zh_Hans", Locale.CHINESE);

     /**
      * Useful constant for language: locale id <code>"zh_Hant"</code>.  Note that
      * the paired Java locale is the language-only {@link java.util.Locale#CHINESE},
      * not <code>Locale.TRADITIONAL_CHINESE</code>.
      * @stable ICU 3.0
      */
     public static final ULocale TRADITIONAL_CHINESE = new ULocale("zh_Hant", Locale.CHINESE);

     /**
      * Useful constant for country/region: locale id <code>"fr_FR"</code>, paired with
      * {@link java.util.Locale#FRANCE}.
      * @stable ICU 3.0
      */
     public static final ULocale FRANCE = new ULocale("fr_FR", Locale.FRANCE);

     /**
      * Useful constant for country/region: locale id <code>"de_DE"</code>, paired with
      * {@link java.util.Locale#GERMANY}.
      * @stable ICU 3.0
      */
     public static final ULocale GERMANY = new ULocale("de_DE", Locale.GERMANY);

     /**
      * Useful constant for country/region: locale id <code>"it_IT"</code>, paired with
      * {@link java.util.Locale#ITALY}.
      * @stable ICU 3.0
      */
     public static final ULocale ITALY = new ULocale("it_IT", Locale.ITALY);

     /**
      * Useful constant for country/region: locale id <code>"ja_JP"</code>, paired with
      * {@link java.util.Locale#JAPAN}.
      * @stable ICU 3.0
      */
     public static final ULocale JAPAN = new ULocale("ja_JP", Locale.JAPAN);

     /**
      * Useful constant for country/region: locale id <code>"ko_KR"</code>, paired with
      * {@link java.util.Locale#KOREA}.
      * @stable ICU 3.0
      */
     public static final ULocale KOREA = new ULocale("ko_KR", Locale.KOREA);

     /**
      * Useful constant for country/region: locale id <code>"zh_Hans_CN"</code>
      * (the id carries an explicit script subtag), paired with
      * {@link java.util.Locale#CHINA}.
      * @stable ICU 3.0
      */
     public static final ULocale CHINA = new ULocale("zh_Hans_CN", Locale.CHINA);

     /**
      * Useful constant for country/region: an alias of {@link #CHINA}; both names
      * refer to the same <code>ULocale</code> instance.
      * @stable ICU 3.0
      */
     public static final ULocale PRC = CHINA;

     /**
      * Useful constant for country/region: locale id <code>"zh_Hant_TW"</code>
      * (the id carries an explicit script subtag), paired with
      * {@link java.util.Locale#TAIWAN}.
      * @stable ICU 3.0
      */
     public static final ULocale TAIWAN = new ULocale("zh_Hant_TW", Locale.TAIWAN);

     /**
      * Useful constant for country/region: locale id <code>"en_GB"</code>, paired with
      * {@link java.util.Locale#UK}.
      * @stable ICU 3.0
      */
     public static final ULocale UK = new ULocale("en_GB", Locale.UK);

     /**
      * Useful constant for country/region: locale id <code>"en_US"</code>, paired with
      * {@link java.util.Locale#US}.
      * @stable ICU 3.0
      */
     public static final ULocale US = new ULocale("en_US", Locale.US);

     /**
      * Useful constant for country/region: locale id <code>"en_CA"</code>, paired with
      * {@link java.util.Locale#CANADA}.
      * @stable ICU 3.0
      */
     public static final ULocale CANADA = new ULocale("en_CA", Locale.CANADA);

     /**
      * Useful constant for country/region: locale id <code>"fr_CA"</code>, paired with
      * {@link java.util.Locale#CANADA_FRENCH}.
      * @stable ICU 3.0
      */
     public static final ULocale CANADA_FRENCH = new ULocale("fr_CA", Locale.CANADA_FRENCH);

     /**
      * Handy constant: the empty string.
      */
     private static final String EMPTY_STRING = "";

     // The underscore character as a named constant.
     // Used in both ULocale and IDParser, so moved up here.
     private static final char UNDERSCORE            = '_';

     // Default empty locale: a java.util.Locale with empty language and country.
     // Declared before ROOT because ROOT's initializer reads it.
     private static final Locale EMPTY_LOCALE = new Locale("", "");

     /**
      * The root ULocale: locale id <code>"root"</code>, paired with a
      * {@link java.util.Locale} whose language and country are both empty.
      * @stable ICU 2.8
      */
     public static final ULocale ROOT = new ULocale("root", EMPTY_LOCALE);

     // Shared cache instance.
     // NOTE(review): presumably caches ULocale instances by locale id - confirm against its users.
     private static final SimpleCache CACHE = new SimpleCache();

     /**
      * Cache the locale.  The field is transient, so it is excluded from the
      * default serialized form.
      */
     private transient Locale locale;

     /**
      * The raw localeID that we were passed in.
      */
     private String localeID;

     /**
      * Tables used in normalizing portions of the id.
      */
     /* tables updated per http://lcweb.loc.gov/standards/iso639-2/
        to include the revisions up to 2001/7/27 *CWB*/
     /* The 3 character codes are the terminology codes like RFC 3066.
        This is compatible with prior ICU codes */
     /* "in" "iw" "ji" "jw" & "sh" have been withdrawn but are still in
        the table but now at the end of the table because
        3 character codes are duplicates.  This avoids bad searches
        going from 3 to 2 character codes.*/
     /* The range qaa-qtz is reserved for local use. */

     // Guard field for the lazily built language tables.  It is volatile and is
     // assigned LAST by initLanguageTables(), so a thread that observes a non-null
     // value here is guaranteed to also observe the four companion tables below.
     private static volatile String[] _languages;
     private static String[] _replacementLanguages;
     private static String[] _obsoleteLanguages;
     private static String[] _languages3;
     private static String[] _obsoleteLanguages3;

     /**
      * Lazily builds the language-code lookup tables (<code>_languages</code>,
      * <code>_replacementLanguages</code>, <code>_obsoleteLanguages</code>,
      * <code>_languages3</code> and <code>_obsoleteLanguages3</code>) the first
      * time they are needed, so that the tables are not created unless we have to.
      *
      * <p>Callers must invoke this method before reading any of those fields.
      * The method is safe to call from multiple threads: initialization uses
      * double-checked locking on <code>ULocale.class</code>, with the volatile
      * guard field <code>_languages</code> published only after every other
      * table has been assigned.  Calling it again after initialization is a
      * cheap no-op.
      */
     private static void initLanguageTables() {
         if (_languages == null) {

             /* This list MUST be in sorted order, and MUST contain the two-letter codes
                if one exists otherwise use the three letter code */
             String[] tempLanguages = {
                 "aa",  "ab",  "ace", "ach", "ada", "ady", "ae",  "af",  "afa",
                 "afh", "ak",  "akk", "ale", "alg", "am",  "an",  "ang", "apa",
                 "ar",  "arc", "arn", "arp", "art", "arw", "as",  "ast",
                 "ath", "aus", "av",  "awa", "ay",  "az",  "ba",  "bad",
                 "bai", "bal", "ban", "bas", "bat", "be",  "bej",
                 "bem", "ber", "bg",  "bh",  "bho", "bi",  "bik", "bin",
                 "bla", "bm",  "bn",  "bnt", "bo",  "br",  "bra", "bs",
                 "btk", "bua", "bug", "byn", "ca",  "cad", "cai", "car", "cau",
                 "ce",  "ceb", "cel", "ch",  "chb", "chg", "chk", "chm",
                 "chn", "cho", "chp", "chr", "chy", "cmc", "co",  "cop",
                 "cpe", "cpf", "cpp", "cr",  "crh", "crp", "cs",  "csb", "cu",  "cus",
                 "cv",  "cy",  "da",  "dak", "dar", "day", "de",  "del", "den",
                 "dgr", "din", "doi", "dra", "dsb", "dua", "dum", "dv",  "dyu",
                 "dz",  "ee",  "efi", "egy", "eka", "el",  "elx", "en",
                 "enm", "eo",  "es",  "et",  "eu",  "ewo", "fa",
                 "fan", "fat", "ff",  "fi",  "fiu", "fj",  "fo",  "fon",
                 "fr",  "frm", "fro", "fur", "fy",  "ga",  "gaa", "gay",
                 "gba", "gd",  "gem", "gez", "gil", "gl",  "gmh", "gn",
                 "goh", "gon", "gor", "got", "grb", "grc", "gu",  "gv",
                 "gwi", "ha",  "hai", "haw", "he",  "hi",  "hil", "him",
                 "hit", "hmn", "ho",  "hr",  "hsb", "ht",  "hu",  "hup", "hy",  "hz",
                 "ia",  "iba", "id",  "ie",  "ig",  "ii",  "ijo", "ik",
                 "ilo", "inc", "ine", "inh", "io",  "ira", "iro", "is",  "it",
                 "iu",  "ja",  "jbo", "jpr", "jrb", "jv",  "ka",  "kaa", "kab",
                 "kac", "kam", "kar", "kaw", "kbd", "kg",  "kha", "khi",
                 "kho", "ki",  "kj",  "kk",  "kl",  "km",  "kmb", "kn",
                 "ko",  "kok", "kos", "kpe", "kr",  "krc", "kro", "kru", "ks",
                 "ku",  "kum", "kut", "kv",  "kw",  "ky",  "la",  "lad",
                 "lah", "lam", "lb",  "lez", "lg",  "li",  "ln",  "lo",  "lol",
                 "loz", "lt",  "lu",  "lua", "lui", "lun", "luo", "lus",
                 "lv",  "mad", "mag", "mai", "mak", "man", "map", "mas",
                 "mdf", "mdr", "men", "mg",  "mga", "mh",  "mi",  "mic", "min",
                 "mis", "mk",  "mkh", "ml",  "mn",  "mnc", "mni", "mno",
                 "mo",  "moh", "mos", "mr",  "ms",  "mt",  "mul", "mun",
                 "mus", "mwr", "my",  "myn", "myv", "na",  "nah", "nai", "nap",
                 "nb",  "nd",  "nds", "ne",  "new", "ng",  "nia", "nic",
                 "niu", "nl",  "nn",  "no",  "nog", "non", "nr",  "nso", "nub",
                 "nv",  "nwc", "ny",  "nym", "nyn", "nyo", "nzi", "oc",  "oj",
                 "om",  "or",  "os",  "osa", "ota", "oto", "pa",  "paa",
                 "pag", "pal", "pam", "pap", "pau", "peo", "phi", "phn",
                 "pi",  "pl",  "pon", "pra", "pro", "ps",  "pt",  "qu",
                 "raj", "rap", "rar", "rm",  "rn",  "ro",  "roa", "rom",
                 "ru",  "rup", "rw",  "sa",  "sad", "sah", "sai", "sal", "sam",
                 "sas", "sat", "sc",  "sco", "sd",  "se",  "sel", "sem",
                 "sg",  "sga", "sgn", "shn", "si",  "sid", "sio", "sit",
                 "sk",  "sl",  "sla", "sm",  "sma", "smi", "smj", "smn",
                 "sms", "sn",  "snk", "so",  "sog", "son", "sq",  "sr",
                 "srr", "ss",  "ssa", "st",  "su",  "suk", "sus", "sux",
                 "sv",  "sw",  "syr", "ta",  "tai", "te",  "tem", "ter",
                 "tet", "tg",  "th",  "ti",  "tig", "tiv", "tk",  "tkl",
                 "tl",  "tlh", "tli", "tmh", "tn",  "to",  "tog", "tpi", "tr",
                 "ts",  "tsi", "tt",  "tum", "tup", "tut", "tvl", "tw",
                 "ty",  "tyv", "udm", "ug",  "uga", "uk",  "umb", "und", "ur",
                 "uz",  "vai", "ve",  "vi",  "vo",  "vot", "wa",  "wak",
                 "wal", "war", "was", "wen", "wo",  "xal", "xh",  "yao", "yap",
                 "yi",  "yo",  "ypk", "za",  "zap", "zen", "zh",  "znd",
                 "zu",  "zun",
             };

             /* Parallel to tempObsoleteLanguages below: entry i here is the
                replacement for obsolete code i there. */
             String[] tempReplacementLanguages = {
                 "id", "he", "yi", "jv", "sr", "nb",/* replacement language codes */
             };

             String[] tempObsoleteLanguages = {
                 "in", "iw", "ji", "jw", "sh", "no",    /* obsolete language codes */
             };

             /* This list MUST contain a three-letter code for every two-letter code in the
                list above, and they MUST be in the same order (i.e., the same language must
                be in the same place in both lists)! */
             String[] tempLanguages3 = {
                 /*"aa",  "ab",  "ace", "ach", "ada", "ady", "ae",  "af",  "afa",    */
                 "aar", "abk", "ace", "ach", "ada", "ady", "ave", "afr", "afa",
                 /*"afh", "ak",  "akk", "ale", "alg", "am",  "an",  "ang", "apa",    */
                 "afh", "aka", "akk", "ale", "alg", "amh", "arg", "ang", "apa",
                 /*"ar",  "arc", "arn", "arp", "art", "arw", "as",  "ast",    */
                 "ara", "arc", "arn", "arp", "art", "arw", "asm", "ast",
                 /*"ath", "aus", "av",  "awa", "ay",  "az",  "ba",  "bad",    */
                 "ath", "aus", "ava", "awa", "aym", "aze", "bak", "bad",
                 /*"bai", "bal", "ban", "bas", "bat", "be",  "bej",    */
                 "bai", "bal", "ban", "bas", "bat", "bel", "bej",
                 /*"bem", "ber", "bg",  "bh",  "bho", "bi",  "bik", "bin",    */
                 "bem", "ber", "bul", "bih", "bho", "bis", "bik", "bin",
                 /*"bla", "bm",  "bn",  "bnt", "bo",  "br",  "bra", "bs",     */
                 "bla", "bam",  "ben", "bnt", "bod", "bre", "bra", "bos",
                 /*"btk", "bua", "bug", "byn", "ca",  "cad", "cai", "car", "cau",    */
                 "btk", "bua", "bug", "byn", "cat", "cad", "cai", "car", "cau",
                 /*"ce",  "ceb", "cel", "ch",  "chb", "chg", "chk", "chm",    */
                 "che", "ceb", "cel", "cha", "chb", "chg", "chk", "chm",
                 /*"chn", "cho", "chp", "chr", "chy", "cmc", "co",  "cop",    */
                 "chn", "cho", "chp", "chr", "chy", "cmc", "cos", "cop",
                 /*"cpe", "cpf", "cpp", "cr",  "crh", "crp", "cs",  "csb", "cu",  "cus",    */
                 "cpe", "cpf", "cpp", "cre", "crh", "crp", "ces", "csb", "chu", "cus",
                 /*"cv",  "cy",  "da",  "dak", "dar", "day", "de",  "del", "den",    */
                 "chv", "cym", "dan", "dak", "dar", "day", "deu", "del", "den",
                 /*"dgr", "din", "doi", "dra", "dsb", "dua", "dum", "dv",  "dyu",    */
                 "dgr", "din", "doi", "dra", "dsb", "dua", "dum", "div", "dyu",
                 /*"dz",  "ee",  "efi", "egy", "eka", "el",  "elx", "en",     */
                 "dzo", "ewe", "efi", "egy", "eka", "ell", "elx", "eng",
                 /*"enm", "eo",  "es",  "et",  "eu",  "ewo", "fa",     */
                 "enm", "epo", "spa", "est", "eus", "ewo", "fas",
                 /*"fan", "fat", "ff",  "fi",  "fiu", "fj",  "fo",  "fon",    */
                 "fan", "fat", "ful", "fin", "fiu", "fij", "fao", "fon",
                 /*"fr",  "frm", "fro", "fur", "fy",  "ga",  "gaa", "gay",    */
                 "fra", "frm", "fro", "fur", "fry", "gle", "gaa", "gay",
                 /*"gba", "gd",  "gem", "gez", "gil", "gl",  "gmh", "gn",     */
                 "gba", "gla", "gem", "gez", "gil", "glg", "gmh", "grn",
                 /*"goh", "gon", "gor", "got", "grb", "grc", "gu",  "gv",     */
                 "goh", "gon", "gor", "got", "grb", "grc", "guj", "glv",
                 /*"gwi", "ha",  "hai", "haw", "he",  "hi",  "hil", "him",    */
                 "gwi", "hau", "hai", "haw", "heb", "hin", "hil", "him",
                 /*"hit", "hmn", "ho",  "hr",  "hsb", "ht",  "hu",  "hup", "hy",  "hz",     */
                 "hit", "hmn", "hmo", "hrv", "hsb", "hat", "hun", "hup", "hye", "her",
                 /*"ia",  "iba", "id",  "ie",  "ig",  "ii",  "ijo", "ik",     */
                 "ina", "iba", "ind", "ile", "ibo", "iii", "ijo", "ipk",
                 /*"ilo", "inc", "ine", "inh", "io",  "ira", "iro", "is",  "it",      */
                 "ilo", "inc", "ine", "inh", "ido", "ira", "iro", "isl", "ita",
                 /*"iu",  "ja",  "jbo", "jpr", "jrb", "jv",  "ka",  "kaa", "kab",   */
                 "iku", "jpn", "jbo", "jpr", "jrb", "jaw", "kat", "kaa", "kab",
                 /*"kac", "kam", "kar", "kaw", "kbd", "kg",  "kha", "khi",    */
                 "kac", "kam", "kar", "kaw", "kbd", "kon", "kha", "khi",
                 /*"kho", "ki",  "kj",  "kk",  "kl",  "km",  "kmb", "kn",     */
                 "kho", "kik", "kua", "kaz", "kal", "khm", "kmb", "kan",
                 /*"ko",  "kok", "kos", "kpe", "kr",  "krc", "kro", "kru", "ks",     */
                 "kor", "kok", "kos", "kpe", "kau", "krc", "kro", "kru", "kas",
                 /*"ku",  "kum", "kut", "kv",  "kw",  "ky",  "la",  "lad",    */
                 "kur", "kum", "kut", "kom", "cor", "kir", "lat", "lad",
                 /*"lah", "lam", "lb",  "lez", "lg",  "li",  "ln",  "lo",  "lol",    */
                 "lah", "lam", "ltz", "lez", "lug", "lim", "lin", "lao", "lol",
                 /*"loz", "lt",  "lu",  "lua", "lui", "lun", "luo", "lus",    */
                 "loz", "lit", "lub", "lua", "lui", "lun", "luo", "lus",
                 /*"lv",  "mad", "mag", "mai", "mak", "man", "map", "mas",    */
                 "lav", "mad", "mag", "mai", "mak", "man", "map", "mas",
                 /*"mdf", "mdr", "men", "mg",  "mga", "mh",  "mi",  "mic", "min",    */
                 "mdf", "mdr", "men", "mlg", "mga", "mah", "mri", "mic", "min",
                 /*"mis", "mk",  "mkh", "ml",  "mn",  "mnc", "mni", "mno",    */
                 "mis", "mkd", "mkh", "mal", "mon", "mnc", "mni", "mno",
                 /*"mo",  "moh", "mos", "mr",  "ms",  "mt",  "mul", "mun",    */
                 "mol", "moh", "mos", "mar", "msa", "mlt", "mul", "mun",
                 /*"mus", "mwr", "my",  "myn", "myv", "na",  "nah", "nai", "nap",    */
                 "mus", "mwr", "mya", "myn", "myv", "nau", "nah", "nai", "nap",
                 /*"nb",  "nd",  "nds", "ne",  "new", "ng",  "nia", "nic",    */
                 "nob", "nde", "nds", "nep", "new", "ndo", "nia", "nic",
                 /*"niu", "nl",  "nn",  "no",  "nog", "non", "nr",  "nso", "nub",    */
                 "niu", "nld", "nno", "nor", "nog", "non", "nbl", "nso", "nub",
                 /*"nv",  "nwc", "ny",  "nym", "nyn", "nyo", "nzi", "oc",  "oj",     */
                 "nav", "nwc", "nya", "nym", "nyn", "nyo", "nzi", "oci", "oji",
                 /*"om",  "or",  "os",  "osa", "ota", "oto", "pa",  "paa",    */
                 "orm", "ori", "oss", "osa", "ota", "oto", "pan", "paa",
                 /*"pag", "pal", "pam", "pap", "pau", "peo", "phi", "phn",    */
                 "pag", "pal", "pam", "pap", "pau", "peo", "phi", "phn",
                 /*"pi",  "pl",  "pon", "pra", "pro", "ps",  "pt",  "qu",     */
                 "pli", "pol", "pon", "pra", "pro", "pus", "por", "que",
                 /*"raj", "rap", "rar", "rm",  "rn",  "ro",  "roa", "rom",    */
                 "raj", "rap", "rar", "roh", "run", "ron", "roa", "rom",
                 /*"ru",  "rup", "rw",  "sa",  "sad", "sah", "sai", "sal", "sam",    */
                 "rus", "rup", "kin", "san", "sad", "sah", "sai", "sal", "sam",
                 /*"sas", "sat", "sc",  "sco", "sd",  "se",  "sel", "sem",    */
                 "sas", "sat", "srd", "sco", "snd", "sme", "sel", "sem",
                 /*"sg",  "sga", "sgn", "shn", "si",  "sid", "sio", "sit",    */
                 "sag", "sga", "sgn", "shn", "sin", "sid", "sio", "sit",
                 /*"sk",  "sl",  "sla", "sm",  "sma", "smi", "smj", "smn",    */
                 "slk", "slv", "sla", "smo", "sma", "smi", "smj", "smn",
                 /*"sms", "sn",  "snk", "so",  "sog", "son", "sq",  "sr",     */
                 "sms", "sna", "snk", "som", "sog", "son", "sqi", "srp",
                 /*"srr", "ss",  "ssa", "st",  "su",  "suk", "sus", "sux",    */
                 "srr", "ssw", "ssa", "sot", "sun", "suk", "sus", "sux",
                 /*"sv",  "sw",  "syr", "ta",  "tai", "te",  "tem", "ter",    */
                 "swe", "swa", "syr", "tam", "tai", "tel", "tem", "ter",
                 /*"tet", "tg",  "th",  "ti",  "tig", "tiv", "tk",  "tkl",    */
                 "tet", "tgk", "tha", "tir", "tig", "tiv", "tuk", "tkl",
                 /*"tl",  "tlh", "tli", "tmh", "tn",  "to",  "tog", "tpi", "tr",     */
                 "tgl", "tlh", "tli", "tmh", "tsn", "ton", "tog", "tpi", "tur",
                 /*"ts",  "tsi", "tt",  "tum", "tup", "tut", "tvl", "tw",     */
                 "tso", "tsi", "tat", "tum", "tup", "tut", "tvl", "twi",
                 /*"ty",  "tyv", "udm", "ug",  "uga", "uk",  "umb", "und", "ur",     */
                 "tah", "tyv", "udm", "uig", "uga", "ukr", "umb", "und", "urd",
                 /*"uz",  "vai", "ve",  "vi",  "vo",  "vot", "wa",  "wak",    */
                 "uzb", "vai", "ven", "vie", "vol", "vot", "wln", "wak",
                 /*"wal", "war", "was", "wen", "wo",  "xal", "xh",  "yao", "yap",    */
                 "wal", "war", "was", "wen", "wol", "xal", "xho", "yao", "yap",
                 /*"yi",  "yo",  "ypk", "za",  "zap", "zen", "zh",  "znd",    */
                 "yid", "yor", "ypk", "zha", "zap", "zen", "zho", "znd",
                 /*"zu",  "zun",                                              */
                 "zul", "zun",
             };

             /* NOTE(review): tempObsoleteLanguages has six entries (the last is "no")
                but this table has only five, so there is no three-letter entry at
                the index of "no".  Left as-is because "no" is also present in the
                main table above; confirm that no caller indexes this table with a
                position found in _obsoleteLanguages without consulting the main
                tables first. */
             String[] tempObsoleteLanguages3 = {
                 /* "in",  "iw",  "ji",  "jw",  "sh", */
                 "ind", "heb", "yid", "jaw", "srp",
             };

             synchronized (ULocale.class) {
                 // Re-check under the lock: another thread may have finished
                 // initialization while this one was building its temporaries.
                 if (_languages == null) {
                     _replacementLanguages = tempReplacementLanguages;
                     _obsoleteLanguages = tempObsoleteLanguages;
                     _languages3 = tempLanguages3;
                     _obsoleteLanguages3 = tempObsoleteLanguages3;
                     // Assign the volatile guard field LAST.  If it were set first,
                     // a concurrent caller could pass the unlocked null check above
                     // and read the companion tables while they are still null.
                     _languages = tempLanguages;
                 }
             }
         }
     }

     private static String[] _countries;
     private static String[] _deprecatedCountries;
     private static String[] _replacementCountries;
     private static String[] _obsoleteCountries;
     private static String[] _countries3;
     private static String[] _obsoleteCountries3;

     // Avoid initializing country tables unless we have to.
     private static void initCountryTables() {
         if (_countries == null) {
             /* ZR(ZAR) is now CD(COD) and FX(FXX) is PS(PSE) as per
                http://www.evertype.com/standards/iso3166/iso3166-1-en.html
                added new codes keeping the old ones for compatibility
                updated to include 1999/12/03 revisions *CWB*/

             /* RO(ROM) is now RO(ROU) according to
                http://www.iso.org/iso/en/prods-services/iso3166ma/03updates-on-iso-3166/nlv3e-rou.html
             */

             /* This list MUST be in sorted order, and MUST contain only two-letter codes! */
             String[] tempCountries = {
                 "AD",  "AE",  "AF",  "AG",  "AI",  "AL",  "AM",  "AN",
                 "AO",  "AQ",  "AR",  "AS",  "AT",  "AU",  "AW",  "AX",  "AZ",
                 "BA",  "BB",  "BD",  "BE",  "BF",  "BG",  "BH",  "BI",
                 "BJ",  "BL",  "BM",  "BN",  "BO",  "BR",  "BS",  "BT",  "BV",
                 "BW",  "BY",  "BZ",  "CA",  "CC",  "CD",  "CF",  "CG",
                 "CH",  "CI",  "CK",  "CL",  "CM",  "CN",  "CO",  "CR",
                 "CU",  "CV",  "CX",  "CY",  "CZ",  "DE",  "DJ",  "DK",
                 "DM",  "DO",  "DZ",  "EC",  "EE",  "EG",  "EH",  "ER",
                 "ES",  "ET",  "FI",  "FJ",  "FK",  "FM",  "FO",  "FR",
                 "GA",  "GB",  "GD",  "GE",  "GF",  "GG",  "GH",  "GI",  "GL",
                 "GM",  "GN",  "GP",  "GQ",  "GR",  "GS",  "GT",  "GU",
                 "GW",  "GY",  "HK",  "HM",  "HN",  "HR",  "HT",  "HU",
                 "ID",  "IE",  "IL",  "IM",  "IN",  "IO",  "IQ",  "IR",  "IS",
                 "IT",  "JE",  "JM",  "JO",  "JP",  "KE",  "KG",  "KH",  "KI",
                 "KM",  "KN",  "KP",  "KR",  "KW",  "KY",  "KZ",  "LA",
                 "LB",  "LC",  "LI",  "LK",  "LR",  "LS",  "LT",  "LU",
                 "LV",  "LY",  "MA",  "MC",  "MD",  "ME",  "MF",  "MG",  "MH",  "MK",
                 "ML",  "MM",  "MN",  "MO",  "MP",  "MQ",  "MR",  "MS",
                 "MT",  "MU",  "MV",  "MW",  "MX",  "MY",  "MZ",  "NA",
                 "NC",  "NE",  "NF",  "NG",  "NI",  "NL",  "NO",  "NP",
                 "NR",  "NU",  "NZ",  "OM",  "PA",  "PE",  "PF",  "PG",
                 "PH",  "PK",  "PL",  "PM",  "PN",  "PR",  "PS",  "PT",
                 "PW",  "PY",  "QA",  "RE",  "RO",  "RS",  "RU",  "RW",  "SA",
                 "SB",  "SC",  "SD",  "SE",  "SG",  "SH",  "SI",  "SJ",
                 "SK",  "SL",  "SM",  "SN",  "SO",  "SR",  "ST",  "SV",
                 "SY",  "SZ",  "TC",  "TD",  "TF",  "TG",  "TH",  "TJ",
                 "TK",  "TL",  "TM",  "TN",  "TO",  "TR",  "TT",  "TV",
                 "TW",  "TZ",  "UA",  "UG",  "UM",  "US",  "UY",  "UZ",
                 "VA",  "VC",  "VE",  "VG",  "VI",  "VN",  "VU",  "WF",
                 "WS",  "YE",  "YT",  "ZA",  "ZM",  "ZW",
             };

             /* this table is used for 3 letter codes */
             String[] tempObsoleteCountries = {
                 "FX",  "CS",  "RO",  "TP",  "YU",  "ZR",  /* obsolete country codes */
             };

             String[] tempDeprecatedCountries = {
                "BU", "CS", "DY", "FX", "HV", "NH", "RH", "TP", "YU", "ZR" /* deprecated country list */
             };
             String[] tempReplacementCountries = {
            /*  "BU", "CS", "DY", "FX", "HV", "NH", "RH", "TP", "YU", "ZR" */
                "MM", "RS", "BJ", "FR", "BF", "VU", "ZW", "TL", "RS", "CD",   /* replacement country codes */
             };

             /* This list MUST contain a three-letter code for every two-letter code in
                the above list, and they MUST be listed in the same order! */
             String[] tempCountries3 = {
                 /*  "AD",  "AE",  "AF",  "AG",  "AI",  "AL",  "AM",  "AN",     */
                     "AND", "ARE", "AFG", "ATG", "AIA", "ALB", "ARM", "ANT",
                 /*  "AO",  "AQ",  "AR",  "AS",  "AT",  "AU",  "AW",  "AX",  "AZ",     */
                     "AGO", "ATA", "ARG", "ASM", "AUT", "AUS", "ABW", "ALA", "AZE",
                 /*  "BA",  "BB",  "BD",  "BE",  "BF",  "BG",  "BH",  "BI",     */
                     "BIH", "BRB", "BGD", "BEL", "BFA", "BGR", "BHR", "BDI",
                 /*  "BJ",  "BL",  "BM",  "BN",  "BO",  "BR",  "BS",  "BT",  "BV",     */
                     "BEN", "BLM", "BMU", "BRN", "BOL", "BRA", "BHS", "BTN", "BVT",
                 /*  "BW",  "BY",  "BZ",  "CA",  "CC",  "CD",  "CF",  "CG",     */
                     "BWA", "BLR", "BLZ", "CAN", "CCK", "COD", "CAF", "COG",
                 /*  "CH",  "CI",  "CK",  "CL",  "CM",  "CN",  "CO",  "CR",     */
                     "CHE", "CIV", "COK", "CHL", "CMR", "CHN", "COL", "CRI",
                 /*  "CU",  "CV",  "CX",  "CY",  "CZ",  "DE",  "DJ",  "DK",     */
                     "CUB", "CPV", "CXR", "CYP", "CZE", "DEU", "DJI", "DNK",
                 /*  "DM",  "DO",  "DZ",  "EC",  "EE",  "EG",  "EH",  "ER",     */
                     "DMA", "DOM", "DZA", "ECU", "EST", "EGY", "ESH", "ERI",
                 /*  "ES",  "ET",  "FI",  "FJ",  "FK",  "FM",  "FO",  "FR",     */
                     "ESP", "ETH", "FIN", "FJI", "FLK", "FSM", "FRO", "FRA",
                 /*  "GA",  "GB",  "GD",  "GE",  "GF",  "GG",  "GH",  "GI",  "GL",     */
                     "GAB", "GBR", "GRD", "GEO", "GUF", "GGY", "GHA", "GIB", "GRL",
                 /*  "GM",  "GN",  "GP",  "GQ",  "GR",  "GS",  "GT",  "GU",     */
                     "GMB", "GIN", "GLP", "GNQ", "GRC", "SGS", "GTM", "GUM",
                 /*  "GW",  "GY",  "HK",  "HM",  "HN",  "HR",  "HT",  "HU",     */
                     "GNB", "GUY", "HKG", "HMD", "HND", "HRV", "HTI", "HUN",
                 /*  "ID",  "IE",  "IL",  "IM",  "IN",  "IO",  "IQ",  "IR",  "IS" */
                     "IDN", "IRL", "ISR", "IMN", "IND", "IOT", "IRQ", "IRN", "ISL",
                 /*  "IT",  "JE",  "JM",  "JO",  "JP",  "KE",  "KG",  "KH",  "KI",     */
                     "ITA", "JEY", "JAM", "JOR", "JPN", "KEN", "KGZ", "KHM", "KIR",
                 /*  "KM",  "KN",  "KP",  "KR",  "KW",  "KY",  "KZ",  "LA",     */
                     "COM", "KNA", "PRK", "KOR", "KWT", "CYM", "KAZ", "LAO",
                 /*  "LB",  "LC",  "LI",  "LK",  "LR",  "LS",  "LT",  "LU",     */
                     "LBN", "LCA", "LIE", "LKA", "LBR", "LSO", "LTU", "LUX",
                 /*  "LV",  "LY",  "MA",  "MC",  "MD",  "ME",  "MF",  "MG",  "MH",  "MK",     */
                     "LVA", "LBY", "MAR", "MCO", "MDA", "MNE", "MAF", "MDG", "MHL", "MKD",
                 /*  "ML",  "MM",  "MN",  "MO",  "MP",  "MQ",  "MR",  "MS",     */
                     "MLI", "MMR", "MNG", "MAC", "MNP", "MTQ", "MRT", "MSR",
                 /*  "MT",  "MU",  "MV",  "MW",  "MX",  "MY",  "MZ",  "NA",     */
                     "MLT", "MUS", "MDV", "MWI", "MEX", "MYS", "MOZ", "NAM",
                 /*  "NC",  "NE",  "NF",  "NG",  "NI",  "NL",  "NO",  "NP",     */
                     "NCL", "NER", "NFK", "NGA", "NIC", "NLD", "NOR", "NPL",
                 /*  "NR",  "NU",  "NZ",  "OM",  "PA",  "PE",  "PF",  "PG",     */
                     "NRU", "NIU", "NZL", "OMN", "PAN", "PER", "PYF", "PNG",
                 /*  "PH",  "PK",  "PL",  "PM",  "PN",  "PR",  "PS",  "PT",     */
                     "PHL", "PAK", "POL", "SPM", "PCN", "PRI", "PSE", "PRT",
                 /*  "PW",  "PY",  "QA",  "RE",  "RO",  "RS",  "RU",  "RW",  "SA",     */
                     "PLW", "PRY", "QAT", "REU", "ROU", "SRB", "RUS", "RWA", "SAU",
                 /*  "SB",  "SC",  "SD",  "SE",  "SG",  "SH",  "SI",  "SJ",     */
                     "SLB", "SYC", "SDN", "SWE", "SGP", "SHN", "SVN", "SJM",
                 /*  "SK",  "SL",  "SM",  "SN",  "SO",  "SR",  "ST",  "SV",     */
                     "SVK", "SLE", "SMR", "SEN", "SOM", "SUR", "STP", "SLV",
                 /*  "SY",  "SZ",  "TC",  "TD",  "TF",  "TG",  "TH",  "TJ",     */
                     "SYR", "SWZ", "TCA", "TCD", "ATF", "TGO", "THA", "TJK",
                 /*  "TK",  "TL",  "TM",  "TN",  "TO",  "TR",  "TT",  "TV",     */
                     "TKL", "TLS", "TKM", "TUN", "TON", "TUR", "TTO", "TUV",
                 /*  "TW",  "TZ",  "UA",  "UG",  "UM",  "US",  "UY",  "UZ",     */
                     "TWN", "TZA", "UKR", "UGA", "UMI", "USA", "URY", "UZB",
                 /*  "VA",  "VC",  "VE",  "VG",  "VI",  "VN",  "VU",  "WF",     */
                     "VAT", "VCT", "VEN", "VGB", "VIR", "VNM", "VUT", "WLF",
                 /*  "WS",  "YE",  "YT",  "ZA",  "ZM",  "ZW"          */
                     "WSM", "YEM", "MYT", "ZAF", "ZMB", "ZWE",
             };

             String[] tempObsoleteCountries3 = {
                 /*"FX",  "CS",  "RO",  "TP",  "YU",  "ZR",   */
                 "FXX", "SCG", "ROM", "TMP", "YUG", "ZAR",
             };

             synchronized (ULocale.class) {
                 if (_countries == null) {
                     _countries = tempCountries;
                     _deprecatedCountries = tempDeprecatedCountries;
                     _replacementCountries = tempReplacementCountries;
                     _obsoleteCountries = tempObsoleteCountries;
                     _countries3 = tempCountries3;
                     _obsoleteCountries3 = tempObsoleteCountries3;
                 }
             }
         }
     }

     // Filled in lazily by initCANONICALIZE_MAP().  Each row is
     // { normalized id, canonicalized id, keyword, keyword value }.
     private static String[][] CANONICALIZE_MAP;
     // Filled in lazily by initCANONICALIZE_MAP().  Each row is
     // { normalized variant id, keyword, keyword value }.
     private static String[][] variantsToKeywords;

     /**
      * Lazily creates the canonicalization tables <code>CANONICALIZE_MAP</code> and
      * <code>variantsToKeywords</code>.  Each table is built in a local array and is
      * then stored into its static field while holding the <code>ULocale.class</code>
      * lock, and only if the field is still null at that point.
      */
     private static void initCANONICALIZE_MAP() {
         if (CANONICALIZE_MAP == null) {
             /*
              * This table lists locale ids that need special handling during
              * canonicalization.  The 1st item is the normalized id.  The 2nd item
              * is the canonicalized id.  The 3rd is the keyword.  The 4th is the
              * keyword value.  Entries without an associated keyword use null for
              * the 3rd and 4th items.
              */
             String[][] tempCANONICALIZE_MAP = {
 //              { EMPTY_STRING,     "en_US_POSIX", null, null }, /* .NET name */
                 { "C",              "en_US_POSIX", null, null }, /* POSIX name */
                 { "art_LOJBAN",     "jbo", null, null }, /* registered name */
                 { "az_AZ_CYRL",     "az_Cyrl_AZ", null, null }, /* .NET name */
                 { "az_AZ_LATN",     "az_Latn_AZ", null, null }, /* .NET name */
                 { "ca_ES_PREEURO",  "ca_ES", "currency", "ESP" },
                 { "cel_GAULISH",    "cel__GAULISH", null, null }, /* registered name */
                 { "de_1901",        "de__1901", null, null }, /* registered name */
                 { "de_1906",        "de__1906", null, null }, /* registered name */
                 { "de__PHONEBOOK",  "de", "collation", "phonebook" }, /* Old ICU name */
                 { "de_AT_PREEURO",  "de_AT", "currency", "ATS" },
                 { "de_DE_PREEURO",  "de_DE", "currency", "DEM" },
                 /* pre-euro currency of Luxembourg is LUF, same as fr_LU_PREEURO below */
                 { "de_LU_PREEURO",  "de_LU", "currency", "LUF" },
                 { "el_GR_PREEURO",  "el_GR", "currency", "GRD" },
                 { "en_BOONT",       "en__BOONT", null, null }, /* registered name */
                 { "en_SCOUSE",      "en__SCOUSE", null, null }, /* registered name */
                 { "en_BE_PREEURO",  "en_BE", "currency", "BEF" },
                 { "en_IE_PREEURO",  "en_IE", "currency", "IEP" },
                 { "es__TRADITIONAL", "es", "collation", "traditional" }, /* Old ICU name */
                 { "es_ES_PREEURO",  "es_ES", "currency", "ESP" },
                 { "eu_ES_PREEURO",  "eu_ES", "currency", "ESP" },
                 { "fi_FI_PREEURO",  "fi_FI", "currency", "FIM" },
                 { "fr_BE_PREEURO",  "fr_BE", "currency", "BEF" },
                 { "fr_FR_PREEURO",  "fr_FR", "currency", "FRF" },
                 { "fr_LU_PREEURO",  "fr_LU", "currency", "LUF" },
                 { "ga_IE_PREEURO",  "ga_IE", "currency", "IEP" },
                 { "gl_ES_PREEURO",  "gl_ES", "currency", "ESP" },
                 { "hi__DIRECT",     "hi", "collation", "direct" }, /* Old ICU name */
                 { "it_IT_PREEURO",  "it_IT", "currency", "ITL" },
                 { "ja_JP_TRADITIONAL", "ja_JP", "calendar", "japanese" },
 //              { "nb_NO_NY",       "nn_NO", null, null },
                 { "nl_BE_PREEURO",  "nl_BE", "currency", "BEF" },
                 { "nl_NL_PREEURO",  "nl_NL", "currency", "NLG" },
                 { "pt_PT_PREEURO",  "pt_PT", "currency", "PTE" },
                 { "sl_ROZAJ",       "sl__ROZAJ", null, null }, /* registered name */
                 { "sr_SP_CYRL",     "sr_Cyrl_RS", null, null }, /* .NET name */
                 { "sr_SP_LATN",     "sr_Latn_RS", null, null }, /* .NET name */
                 { "sr_YU_CYRILLIC", "sr_Cyrl_RS", null, null }, /* Linux name */
                 { "th_TH_TRADITIONAL", "th_TH", "calendar", "buddhist" }, /* Old ICU name */
                 { "uz_UZ_CYRILLIC", "uz_Cyrl_UZ", null, null }, /* Linux name */
                 { "uz_UZ_CYRL",     "uz_Cyrl_UZ", null, null }, /* .NET name */
                 { "uz_UZ_LATN",     "uz_Latn_UZ", null, null }, /* .NET name */
                 { "zh_CHS",         "zh_Hans", null, null }, /* .NET name */
                 { "zh_CHT",         "zh_Hant", null, null }, /* .NET name */
                 { "zh_GAN",         "zh__GAN", null, null }, /* registered name */
                 { "zh_GUOYU",       "zh", null, null }, /* registered name */
                 { "zh_HAKKA",       "zh__HAKKA", null, null }, /* registered name */
                 { "zh_MIN",         "zh__MIN", null, null }, /* registered name */
                 { "zh_MIN_NAN",     "zh__MINNAN", null, null }, /* registered name */
                 { "zh_WUU",         "zh__WUU", null, null }, /* registered name */
                 { "zh_XIANG",       "zh__XIANG", null, null }, /* registered name */
                 { "zh_YUE",         "zh__YUE", null, null } /* registered name */
             };

             // Store the table only if no other thread has stored one in the meantime.
             synchronized (ULocale.class) {
                 if (CANONICALIZE_MAP == null) {
                     CANONICALIZE_MAP = tempCANONICALIZE_MAP;
                 }
             }
         }
         if (variantsToKeywords == null) {
             /*
              * This table maps variants to keyword/value pairs.  The first item
              * is the normalized variant id.  The second item is the keyword and
              * the third item is the keyword value.
              */
             String[][] tempVariantsToKeywords = {
                     { "EURO",   "currency", "EUR" },
                     { "PINYIN", "collation", "pinyin" }, /* Solaris variant */
                     { "STROKE", "collation", "stroke" }  /* Solaris variant */
             };

             // Store the table only if no other thread has stored one in the meantime.
             synchronized (ULocale.class) {
                 if (variantsToKeywords == null) {
                     variantsToKeywords = tempVariantsToKeywords;
                 }
             }
         }
     }

     /*
      * This table is used for mapping between ICU and special Java
      * locales.  When an ICU locale matches <minimum base> with
      * <keyword>/<value>, the ICU locale is mapped to <Java> locale.
      * For example, both ja_JP@calendar=japanese and ja@calendar=japanese
      * are mapped to Java locale "ja_JP_JP".  ICU locale "nn" is mapped
      * to Java locale "no_NO_NY".
      *
      * Column order in each row:
      *   [0] Java locale string, [1] ICU base name, [2] keyword (may be null),
      *   [3] keyword value (may be null), [4] minimum ICU base name.
      */
     private static final String[][] _javaLocaleMap = {
     //  { <Java>,       <ICU base>, <keyword>,  <value>,    <minimum base>
         { "ja_JP_JP",   "ja_JP",    "calendar", "japanese", "ja"},
         { "no_NO_NY",   "nn_NO",    null,       null,       "nn"},
         { "th_TH_TH",   "th_TH",    "numbers",  "thai",     "th"},
     };

     /**
      * Internal constructor that stores the given locale ID and JDK locale
      * exactly as passed; the ID is not normalized here.
      */
     private ULocale(String localeID, Locale locale) {
         this.locale = locale;
         this.localeID = localeID;
     }

     /**
      * Build a ULocale that wraps a {@link java.util.Locale}.  The locale ID is
      * the normalized name of the ULocale that {@link #forLocale} yields for
      * <code>loc</code>; <code>loc</code> itself is kept as the JDK locale.
      * @param loc a JDK locale
      * @stable ICU 2.8
      * @internal
      */
     private ULocale(Locale loc) {
         ULocale mapped = forLocale(loc);
         this.localeID = getName(mapped.toString());
         this.locale = loc;
     }

     /**
      * Return a ULocale object for a {@link java.util.Locale}.
      * Results are cached per <code>Locale</code>.  The current default
      * ULocale is reused when <code>loc</code> is its JDK locale instance,
      * an empty locale string yields the root locale, and the special Java
      * locales listed in <code>_javaLocaleMap</code> are translated to their
      * ICU form.
      * @param loc a JDK locale
      * @return the matching ULocale, or null if <code>loc</code> is null
      * @stable ICU 3.2
      */
     public static ULocale forLocale(Locale loc) {
         if (loc == null) {
             return null;
         }

         ULocale cached = (ULocale)CACHE.get(loc);
         if (cached != null) {
             return cached;
         }

         ULocale created;
         if (defaultULocale != null && loc == defaultULocale.locale) {
             created = defaultULocale;
         } else {
             String id = loc.toString();
             if (id.length() == 0) {
                 created = ROOT;
             } else {
                 // Translate special Java locales (first column) to their ICU form.
                 for (int row = 0; row < _javaLocaleMap.length; row++) {
                     String[] entry = _javaLocaleMap[row];
                     if (entry[0].equals(id)) {
                         IDParser parser = new IDParser(entry[1]);
                         parser.setKeywordValue(entry[2], entry[3]);
                         id = parser.getName();
                         break;
                     }
                 }
                 created = new ULocale(id, loc);
             }
         }
         CACHE.put(loc, created);
         return created;
     }

     /**
      * Construct a ULocale from a RFC 3066 locale ID.  A locale ID is made of
      * optional language, script, country, and variant fields, in that order
      * and separated by underscores, optionally followed by a keyword list.
      * A script is four characters long, which tells it apart from a
      * two-character country code; the remaining fields are identified by
      * their position.  The keyword list starts at '@' and holds
      * keyword/value pairs separated by semicolons (';').
      * <p>
      * The localeID is normalized but not canonicalized by this constructor.
      * For example, "zh__pinyin" is kept as is rather than being turned into
      * "zh@collation=pinyin", and by default ICU only recognizes the latter
      * as specifying pinyin collation.  Use {@link #createCanonical}
      * or {@link #canonicalize} if you need to canonicalize the localeID.
      *
      * @param localeID string representation of the locale, e.g:
      * "en_US", "sy_Cyrl_YU", "zh__pinyin", "es_ES@currency=EUR;collation=traditional"
      * @stable ICU 2.8
      */
     public ULocale(String localeID) {
         String normalizedID = getName(localeID);
         this.localeID = normalizedID;
     }

     /**
      * Convenience overload of ULocale(String, String, String) for
      * compatibility with java.util.Locale.  Equivalent to calling the
      * three-argument constructor with a null third component.
      * @param a first component of the locale id
      * @param b second component of the locale id
      * @see #ULocale(String, String, String)
      * @stable ICU 3.4
      */
     public ULocale(String a, String b) {
         this(a, b, null);
     }

     /**
      * Construct a ULocale from the three 'fields' a, b, and c.  Non-empty
      * fields are joined with underscores into a localeID of the form a_b_c,
      * and that ID is then treated like the argument of
      * <code>ULocale(String localeID)</code>.
      *
      * <p>Java locale strings made of language, country, and variant are
      * handled by this form: a country code is shorter than four letters and
      * therefore is not taken for a script code.  When a script code is
      * present, the last argument ('c') is taken as the country code.  This
      * constructor is recommended only to ease porting; clients should
      * prefer the single-argument constructor when they have a localeID.
      * @param a first component of the locale id
      * @param b second component of the locale id
      * @param c third component of the locale id
      * @see #ULocale(String)
      * @stable ICU 3.0
      */
     public ULocale(String a, String b, String c) {
         String joinedID = lscvToID(a, b, c, EMPTY_STRING);
         localeID = getName(joinedID);
     }

     /**
      * Canonicalize the given id and create a ULocale from the result.
      * @param nonCanonicalID the locale id to canonicalize
      * @return the locale created from the canonical version of the ID.
      * @stable ICU 3.0
      */
     public static ULocale createCanonical(String nonCanonicalID) {
         String canonicalID = canonicalize(nonCanonicalID);
         return new ULocale(canonicalID, (Locale)null);
     }

     /**
      * Join language, script, country and variant into a locale ID.  Null or
      * empty parts are left out.  Script and country are each preceded by an
      * underscore.  A variant is preceded by one underscore, or by two when
      * there is no country, so that it stays in the variant position.
      */
     private static String lscvToID(String lang, String script, String country, String variant) {
         boolean hasLang = lang != null && lang.length() > 0;
         boolean hasScript = script != null && script.length() > 0;
         boolean hasCountry = country != null && country.length() > 0;
         boolean hasVariant = variant != null && variant.length() > 0;

         StringBuffer id = new StringBuffer();
         if (hasLang) {
             id.append(lang);
         }
         if (hasScript) {
             id.append(UNDERSCORE).append(script);
         }
         if (hasCountry) {
             id.append(UNDERSCORE).append(country);
         }
         if (hasVariant) {
             if (!hasCountry) {
                 // placeholder for the missing country field
                 id.append(UNDERSCORE);
             }
             id.append(UNDERSCORE).append(variant);
         }
         return id.toString();
     }

     /**
      * Convert this ULocale object to a {@link java.util.Locale}.
      * The result is computed on first use and stored in this object.  ICU
      * locales that match a row of <code>_javaLocaleMap</code> are converted
      * to the special Java locale of that row; the script is not carried
      * over to the JDK locale.
      * @return a JDK locale that either exactly represents this object
      * or is the closest approximation.
      * @stable ICU 2.8
      */
     public Locale toLocale() {
         if (locale != null) {
             return locale;
         }

         IDParser parser = new IDParser(localeID);
         String baseName = parser.getBaseName();
         for (int row = 0; row < _javaLocaleMap.length; row++) {
             String[] entry = _javaLocaleMap[row];
             boolean baseMatches = baseName.equals(entry[1]) || baseName.equals(entry[4]);
             if (!baseMatches) {
                 continue;
             }
             boolean keywordMatches;
             if (entry[2] == null) {
                 // no keyword required for this row
                 keywordMatches = true;
             } else {
                 String value = parser.getKeywordValue(entry[2]);
                 keywordMatches = value != null && value.equals(entry[3]);
             }
             if (keywordMatches) {
                 parser = new IDParser(entry[0]);
                 break;
             }
         }
         String[] fields = parser.getLanguageScriptCountryVariant();
         locale = new Locale(fields[0], fields[2], fields[3]);
         return locale;
     }

     // Cache used by getName(String): locale ID string -> normalized name.
     private static ICUCache nameCache = new SimpleCache();
     /**
      * Keep our own default ULocale.  defaultLocale holds the JDK default
      * locale that getDefault() compares against Locale.getDefault() to
      * detect that the JDK default has changed.
      */
     private static Locale defaultLocale = Locale.getDefault();
     private static ULocale defaultULocale = new ULocale(defaultLocale);

     /**
      * Returns the current default ULocale.  If the JDK default locale no
      * longer equals the one recorded here, the default ULocale is rebuilt
      * from the new JDK default before it is returned.
      * @stable ICU 2.8
      */
     public static ULocale getDefault() {
         synchronized (ULocale.class) {
             final Locale jdkDefault = Locale.getDefault();
             final boolean unchanged = defaultLocale.equals(jdkDefault);
             if (!unchanged) {
                 defaultLocale = jdkDefault;
                 defaultULocale = new ULocale(jdkDefault);
             }
             return defaultULocale;
         }
     }

     /**
      * Sets the default ULocale.  This also sets the default Locale.
      * If the caller does not have write permission to the
      * user.language property, a security exception will be thrown,
      * and the default ULocale will remain unchanged.
      * <p>
      * The JDK locale derived from <code>newLocale</code> is also recorded as
      * the JDK default known to this class, so that a following
      * {@link #getDefault()} returns <code>newLocale</code> itself instead of
      * a ULocale rebuilt from the JDK locale.
      * @param newLocale the new default locale
      * @throws SecurityException
      *        if a security manager exists and its
      *        <code>checkPermission</code> method doesn't allow the operation.
      * @throws NullPointerException if <code>newLocale</code> is null
      * @see SecurityManager#checkPermission(java.security.Permission)
      * @see java.util.PropertyPermission
      * @stable ICU 3.0
      */
     public static synchronized void setDefault(ULocale newLocale){
         Locale newJdkDefault = newLocale.toLocale();
         // May throw SecurityException; our own state is only touched afterwards.
         Locale.setDefault(newJdkDefault);
         defaultLocale = newJdkDefault;
         defaultULocale = newLocale;
     }

     /**
      * This is for compatibility with Locale-- in actuality, since ULocale is
      * immutable, there is no reason to clone it, so this API returns 'this'.
      * @return this same ULocale instance; no copy is made.
      * @stable ICU 3.0
      */
     public Object clone() {
         return this;
     }

     /**
      * Returns the hash code of this locale, which is the hash code of its
      * locale ID string.
      * @stable ICU 3.0
      */
     public int hashCode() {
         return this.localeID.hashCode();
     }

     /**
      * Compares this locale with another object.  The result is true when
      * the other object is a ULocale with the same full name, or a String
      * localeID equal to the full name.  Names are not canonicalized, so
      * two ULocales that function identically might not compare equal.
      *
      * @return true if this Locale is equal to the specified object.
      * @stable ICU 3.0
      */
     public boolean equals(Object obj) {
         if (obj == this) {
             return true;
         }
         final String otherID;
         if (obj instanceof ULocale) {
             otherID = ((ULocale)obj).localeID;
         } else if (obj instanceof String) {
             otherID = (String)obj;
         } else {
             return false;
         }
         return localeID.equals(otherID);
     }

     /**
      * Returns a list of all installed locales, as reported by
      * <code>ICUResourceBundle.getAvailableULocales()</code>.
      * @stable ICU 3.0
      */
     public static ULocale[] getAvailableLocales() {
         ULocale[] installed = ICUResourceBundle.getAvailableULocales();
         return installed;
     }

     private static VersionInfo gCLDRVersion = null;

     /**
      * Returns the current CLDR version.  The version is read from the
      * "cldrVersion" entry of the "supplementalData" bundle on the first call
      * and remembered for later calls.
      * @draft ICU 4.2
      * @provisional This API might change or be removed in a future release.
      */
     public static VersionInfo getCLDRVersion() {
         if (gCLDRVersion != null) {
             return gCLDRVersion;
         }
         // fetching this data should be idempotent.
         // from ZoneMeta.java
         UResourceBundle supplemental = UResourceBundle.getBundleInstance(
                 ICUResourceBundle.ICU_BASE_NAME,
                 "supplementalData",
                 ICUResourceBundle.ICU_DATA_CLASS_LOADER);
         String versionText = supplemental.get("cldrVersion").getString();
         gCLDRVersion = VersionInfo.getInstance(versionText);
         return gCLDRVersion;
     }

     /**
      * Returns a list of all 2-letter country codes defined in ISO 3166.
      * Can be used to create Locales.  The returned array is a copy, so the
      * caller may modify it freely.
      * @stable ICU 3.0
      */
     public static String[] getISOCountries() {
         initCountryTables();
         String[] copy = (String[])_countries.clone();
         return copy;
     }

     /**
      * Returns a list of all 2-letter language codes defined in ISO 639.
      * Can be used to create Locales.  The returned array is a copy, so the
      * caller may modify it freely.
      * [NOTE:  ISO 639 is not a stable standard-- some languages' codes have changed.
      * The list this function returns includes both the new and the old codes for the
      * languages whose codes have changed.]
      * @stable ICU 3.0
      */
     public static String[] getISOLanguages() {
         initLanguageTables();
         String[] copy = (String[])_languages.clone();
         return copy;
     }

     /**
      * Returns the language code of this locale: either the empty string
      * or a lowercase ISO 639 code.
      * @see #getDisplayLanguage()
      * @see #getDisplayLanguage(ULocale)
      * @stable ICU 3.0
      */
     public String getLanguage() {
         return ULocale.getLanguage(this.localeID);
     }

     /**
      * Returns the language code of the given locale ID: either the empty
      * string or a lowercase ISO 639 code.
      * @param localeID the locale ID as a string
      * @see #getDisplayLanguage()
      * @see #getDisplayLanguage(ULocale)
      * @stable ICU 3.0
      */
     public static String getLanguage(String localeID) {
         IDParser parser = new IDParser(localeID);
         return parser.getLanguage();
     }

     /**
      * Returns the script code of this locale; it may be the empty string.
      * @see #getDisplayScript()
      * @see #getDisplayScript(ULocale)
      * @stable ICU 3.0
      */
     public String getScript() {
         return ULocale.getScript(this.localeID);
     }

     /**
      * Returns the script code of the given locale ID; it may be the empty string.
      * @param localeID the locale ID as a string
      * @see #getDisplayScript()
      * @see #getDisplayScript(ULocale)
      * @stable ICU 3.0
      */
     public static String getScript(String localeID) {
         IDParser parser = new IDParser(localeID);
         return parser.getScript();
     }

     /**
      * Returns the country/region code of this locale: either the empty
      * string or an uppercase ISO 3166 2-letter code.
      * @see #getDisplayCountry()
      * @see #getDisplayCountry(ULocale)
      * @stable ICU 3.0
      */
     public String getCountry() {
         return ULocale.getCountry(this.localeID);
     }

     /**
      * Returns the country/region code of the given locale ID: either the
      * empty string or an uppercase ISO 3166 2-letter code.
      * @param localeID the locale ID as a string
      * @see #getDisplayCountry()
      * @see #getDisplayCountry(ULocale)
      * @stable ICU 3.0
      */
     public static String getCountry(String localeID) {
         IDParser parser = new IDParser(localeID);
         return parser.getCountry();
     }

     /**
      * Returns the variant code of this locale; it may be the empty string.
      * @see #getDisplayVariant()
      * @see #getDisplayVariant(ULocale)
      * @stable ICU 3.0
      */
     public String getVariant() {
         return ULocale.getVariant(this.localeID);
     }

     /**
      * Returns the variant code of the given locale ID; it may be the empty string.
      * @param localeID the locale ID as a string
      * @see #getDisplayVariant()
      * @see #getDisplayVariant(ULocale)
      * @stable ICU 3.0
      */
     public static String getVariant(String localeID) {
         IDParser parser = new IDParser(localeID);
         return parser.getVariant();
     }

     /**
      * Returns the fallback locale ID for the given locale ID; the result
      * might be the empty string.  The ID is normalized before its last
      * part is removed.
      * @param localeID the locale ID as a string
      * @stable ICU 3.2
      */
     public static String getFallback(String localeID) {
         String normalizedID = getName(localeID);
         return getFallbackString(normalizedID);
     }

     /**
      * Returns the fallback locale for this locale.  A locale whose ID is
      * empty or starts with '@' is treated as root and has no fallback, so
      * null is returned for it.
      * @stable ICU 3.2
      */
     public ULocale getFallback() {
         boolean isRoot = localeID.length() == 0 || localeID.charAt(0) == '@';
         if (isRoot) {
             return null;
         }
         String parentID = getFallbackString(localeID);
         return new ULocale(parentID, (Locale)null);
     }

     /**
      * Return the given (canonical) locale id minus the last part before the tags.
      * Everything from '@' onward (the keyword list) is preserved unchanged.
      * When removing the last part would leave an empty segment behind (for
      * example "en__POSIX", where the country is empty), the dangling
      * underscores are removed as well, so the result is "en" rather than "en_".
      *
      * @param fallback the locale id to shorten
      * @return the id without its last underscore-separated part; the part
      * before the keywords is empty when the id has only one part
      */
     private static String getFallbackString(String fallback) {
         int limit = fallback.indexOf('@');
         if (limit == -1) {
             limit = fallback.length();
         }
         int start = fallback.lastIndexOf('_', limit);
         if (start == -1) {
             start = 0;
         } else {
             // truncate empty segments so no trailing underscore is left behind
             while (start > 0 && fallback.charAt(start - 1) == '_') {
                 start--;
             }
         }
         return fallback.substring(0, start) + fallback.substring(limit);
     }

     /**
      * Returns the (normalized) base name of this locale.
      * @return the base name as a String.
      * @stable ICU 3.0
      */
     public String getBaseName() {
         return ULocale.getBaseName(this.localeID);
     }

     /**
      * Returns the (normalized) base name for the specified locale.
      * An ID that contains no '@' is returned exactly as given; otherwise
      * the ID is parsed and the parser's base name is returned.
      * @param localeID the locale ID as a string
      * @return the base name as a String.
      * @stable ICU 3.0
      */
     public static String getBaseName(String localeID){
         boolean hasKeywords = localeID.indexOf('@') != -1;
         if (!hasKeywords) {
             return localeID;
         }
         IDParser parser = new IDParser(localeID);
         return parser.getBaseName();
     }

     /**
      * Returns the (normalized) full name of this locale, which is the
      * locale ID held by this object.
      *
      * @return String the full name of the localeID
      * @stable ICU 3.0
      */
     public String getName() {
         return this.localeID; // always normalized
     }

     /**
      * Returns the (normalized) full name for the specified locale.
      * Results are remembered in a cache keyed by the given ID, so an ID is
      * parsed only when it is not found there.
      *
      * @param localeID the localeID as a string
      * @return String the full name of the localeID
      * @stable ICU 3.0
      */
     public static String getName(String localeID){
         String cached = (String)nameCache.get(localeID);
         if (cached != null) {
             return cached;
         }
         String normalized = new IDParser(localeID).getName();
         nameCache.put(localeID, normalized);
         return normalized;
     }

     /**
      * Returns a string representation of this object, which is its locale ID.
      * @stable ICU 3.0
      */
     public String toString() {
         return this.localeID;
     }

     /**
      * Returns an iterator over the keywords of this locale, or null when
      * the locale has no keywords.
      * @return iterator over keywords, or null if there are no keywords.
      * @stable ICU 3.0
      */
     public Iterator getKeywords() {
         return ULocale.getKeywords(this.localeID);
     }

     /**
      * Returns an iterator over the keywords of the specified locale, or
      * null when it has no keywords.
      * @param localeID the locale ID as a string
      * @return an iterator over the keywords in the specified locale, or null
      * if there are no keywords.
      * @stable ICU 3.0
      */
     public static Iterator getKeywords(String localeID){
         IDParser parser = new IDParser(localeID);
         return parser.getKeywords();
     }

     /**
      * Returns the value of a keyword in this locale, or null if the keyword
      * is not defined.
      * @param keywordName name of the keyword whose value is desired. Case insensitive.
      * @return the value of the keyword, or null.
      * @stable ICU 3.0
      */
     public String getKeywordValue(String keywordName){
         return ULocale.getKeywordValue(this.localeID, keywordName);
     }

     /**
      * Returns the value of a keyword in the specified locale, or null if
      * the keyword is not defined.  The locale name does not need to be
      * normalized.
      * @param localeID the locale ID as a string
      * @param keywordName name of the keyword whose value is desired. Case insensitive.
      * @return String the value of the keyword as a string
      * @stable ICU 3.0
      */
     public static String getKeywordValue(String localeID, String keywordName) {
         IDParser parser = new IDParser(localeID);
         return parser.getKeywordValue(keywordName);
     }

     /**
      * Utility class to parse and normalize locale ids (including POSIX style)
      */
     private static final class IDParser {
         // characters of the locale id being parsed
         private char[] id;
         // current read position in id
         private int index;
         // output buffer that the parsed/normalized text is appended to
         private char[] buffer;
         // number of characters currently in use in buffer
         private int blen;
         // POSIX ids are not handled unless this flag was requested at construction.
         private boolean canonicalize;
         private boolean hadCountry;

         // used when canonicalizing
         Map keywords;
         String baseName;

         /**
          * Parsing constants.
          */
         private static final char KEYWORD_SEPARATOR     = '@';
         private static final char HYPHEN                = '-';
         private static final char KEYWORD_ASSIGN        = '=';
         private static final char COMMA                 = ',';
         private static final char ITEM_SEPARATOR        = ';';
         private static final char DOT                   = '.';

         /**
          * Creates a parser for the given locale id with canonicalization
          * turned off.
          */
         private IDParser(String localeID) {
             this(localeID, false);
         }

         /**
          * Creates a parser for the given locale id.  The output buffer is
          * sized five characters larger than the id, and both the read
          * position and the buffer length start at zero.
          */
         private IDParser(String localeID, boolean canonicalize) {
             this.canonicalize = canonicalize;
             this.id = localeID.toCharArray();
             this.buffer = new char[this.id.length + 5];
             this.index = 0;
             this.blen = 0;
         }

         /**
          * Rewinds the parser: the read position and the buffer length are
          * both set back to zero.
          */
         private void reset() {
             blen = 0;
             index = 0;
         }

         // utilities for working on text in the buffer

         /**
          * Append c to the buffer, doubling the buffer first when it is full.
          * A buffer that is already longer than 512 characters is never grown;
          * running out of room in that case is treated as an error.
          *
          * @throws ArrayIndexOutOfBoundsException if the buffer is full and is
          * already longer than 512 characters
          */
         private void append(char c) {
             if (blen >= buffer.length) {
                 if (buffer.length > 512) {
                     // something is seriously wrong, let this go
                     throw new ArrayIndexOutOfBoundsException(blen);
                 }
                 char[] nbuffer = new char[buffer.length * 2];
                 System.arraycopy(buffer, 0, nbuffer, 0, buffer.length);
                 buffer = nbuffer;
             }
             buffer[blen] = c;
             ++blen;
         }

         /**
          * Append the field separator (underscore) to the buffer.
          */
         private void addSeparator() {
             this.append(UNDERSCORE);
         }

         /**
          * Returns the buffer contents from start up to blen as a String;
          * the shared empty string is returned when start equals blen.
          */
         private String getString(int start) {
             return start == blen
                 ? EMPTY_STRING
                 : new String(buffer, start, blen - start);
         }

         /**
          * Truncate or extend the buffer length to pos, then append the
          * characters of s from there.  pos is not validated.
          */
         private void set(int pos, String s) {
             blen = pos; // no safety
             final int count = s.length();
             for (int k = 0; k < count; ++k) {
                 append(s.charAt(k));
             }
         }

         /**
          * Append every character of the string to the buffer, in order.
          */
         private void append(String s) {
             char[] chars = s.toCharArray();
             for (int k = 0; k < chars.length; ++k) {
                 append(chars[k]);
             }
         }

         // utilities for parsing text out of the id

         /**
          * Character to indicate no more text is available in the id.
          * It is what next() returns once the end of the id has been reached.
          */
         private static final char DONE = '\uffff';

         /**
          * Returns the character at the current read position of the id and
          * moves the position forward by one.  When the position is exactly at
          * the end of the id, DONE is returned instead.  The position is
          * advanced in either case, so decrementing it always 'ungets' the
          * character that was just returned.
          */
         private char next() {
             final int pos = index++;
             return pos == id.length ? DONE : id[pos];
         }

         /**
          * Move the read position forward to the next terminator or id
          * separator and leave it pointing at that character.
          */
         private void skipUntilTerminatorOrIDSeparator() {
             char c;
             do {
                 c = next();
             } while (!isTerminatorOrIDSeparator(c));
             --index; // unget the terminator/separator
         }

         /**
          * Returns true if the read position is at or past the end of the id,
          * or if the character at the read position is a terminator.
          */
         private boolean atTerminator() {
             if (index >= id.length) {
                 return true;
             }
             return isTerminator(id[index]);
         }

         /*
          * Returns true if the character is an id separator (underscore or hyphen).
          */
 /*        private boolean isIDSeparator(char c) {
             return c == UNDERSCORE || c == HYPHEN;
         }*/

         /**
          * Returns true if the character is a terminator: the keyword
          * separator, a dot, or DONE.  Dot counts as a terminator because in
          * the POSIX form a dot precedes the codepage.
          */
         private boolean isTerminator(char c) {
             // always terminate at DOT, even if not handling POSIX.  It's an error...
             switch (c) {
             case KEYWORD_SEPARATOR:
             case DONE:
             case DOT:
                 return true;
             default:
                 return false;
             }
         }

         /**
          * Returns true if the character is a terminator (keyword separator,
          * dot, or DONE) or an id separator (underscore or hyphen).
          */
         private boolean isTerminatorOrIDSeparator(char c) {
             return isTerminator(c) || c == UNDERSCORE || c == HYPHEN;
         }

         /**
          * Returns true if the id starts with an experimental or private
          * language prefix, i.e. it is longer than two characters and matches
          * the pattern '[ixIX][-_].'.
          */
         private boolean haveExperimentalLanguagePrefix() {
             if (id.length <= 2) {
                 return false;
             }
             final char separator = id[1];
             if (separator != HYPHEN && separator != UNDERSCORE) {
                 return false;
             }
             switch (id[0]) {
             case 'x':
             case 'X':
             case 'i':
             case 'I':
                 return true;
             default:
                 return false;
             }
         }

         /**
          * Returns true if a value separator occurs at or after index.
          */
         private boolean haveKeywordAssign() {
             // Scan forward from the current cursor without moving it.
             int pos = index;
             while (pos < id.length) {
                 if (id[pos] == KEYWORD_ASSIGN) {
                     return true;
                 }
                 ++pos;
             }
             return false;
         }

         /**
          * Advance index past language, and accumulate normalized language code in buffer.
          * Index must be at 0 when this is called.  Index is left at a terminator or id
          * separator.  Returns the start of the language code in the buffer.
          */
         private int parseLanguage() {
             // An "x"/"i" prefix is emitted as lower case letter + hyphen, and the
             // cursor jumps past the prefix and its separator.
             if (haveExperimentalLanguagePrefix()) {
                 append(Character.toLowerCase(id[0]));
                 append(HYPHEN);
                 index = 2;
             }

             // Copy the language subtag in lower case up to the next terminator or separator.
             for (char ch = next(); !isTerminatorOrIDSeparator(ch); ch = next()) {
                 append(Character.toLowerCase(ch));
             }
             --index; // unget the stopping character

             // Only a buffer of exactly three characters is a candidate for
             // 3-letter to 2-letter conversion.
             if (blen != 3) {
                 return 0;
             }

             initLanguageTables();

             final String code3 = getString(0);
             String[] replacements = _languages;
             int pos = findIndex(_languages3, code3);
             if (pos < 0) {
                 // not a current code; try the obsolete table
                 replacements = _obsoleteLanguages;
                 pos = findIndex(_obsoleteLanguages3, code3);
             }
             if (pos >= 0) {
                 set(0, replacements[pos]);
             }

             return 0;
         }

         /**
          * Advance index past language.  Index must be at 0 when this is called.  Index
          * is left at a terminator or id separator.
          */
         private void skipLanguage() {
             // The experimental/private prefix and its separator belong to the language
             // subtag, so start scanning after them.
             final boolean prefixed = haveExperimentalLanguagePrefix();
             if (prefixed) {
                 index = 2;
             }
             skipUntilTerminatorOrIDSeparator();
         }

         /**
          * Advance index past script, and accumulate normalized script in buffer.
          * Index must be immediately after the language.
          * If the item at this position is not a script (is not four characters
          * long) leave index and buffer unchanged.  Otherwise index is left at
          * a terminator or id separator.  Returns the start of the script code
          * in the buffer (this may be equal to the buffer length, if there is no
          * script).
          */
         private int parseScript() {
             if (atTerminator()) {
                 return blen; // nothing follows the language
             }

             final int savedIndex = index; // cursor to restore if this is not a script
             final int savedBlen = blen;   // buffer length to restore if this is not a script
             ++index;                      // step over the separator

             // Title-case the candidate: first character upper, the rest lower.
             for (char ch = next(); !isTerminatorOrIDSeparator(ch); ch = next()) {
                 if (blen == savedBlen) {
                     // nothing appended yet: emit the separator before the first character
                     addSeparator();
                     append(Character.toUpperCase(ch));
                 } else {
                     append(Character.toLowerCase(ch));
                 }
             }
             --index; // unget

             // A script is exactly four characters; the extra one is the separator.
             if (index - savedIndex == 5) {
                 // start of the script text lies just past the separator in the buffer
                 return savedBlen + 1;
             }

             // Not a script: undo both the cursor movement and the buffer changes.
             index = savedIndex;
             blen = savedBlen;
             return savedBlen;
         }

         /**
          * Advance index past script.
          * Index must be immediately after the language and IDSeparator.
          * If the item at this position is not a script (is not four characters
          * long) leave index.  Otherwise index is left at a terminator or
          * id separator.
          */
         private void skipScript() {
             if (atTerminator()) {
                 return;
             }

             final int savedIndex = index;
             ++index; // step over the separator

             skipUntilTerminatorOrIDSeparator();

             // separator + four characters == 5; anything else is not a script, so rewind
             final boolean isScript = (index - savedIndex == 5);
             if (!isScript) {
                 index = savedIndex;
             }
         }

         /**
          * Advance index past country, and accumulate normalized country in buffer.
          * Index must be immediately after the script (if there is one, else language)
          * and IDSeparator.  Return the start of the country code in the buffer.
          */
         private int parseCountry() {
             if (!atTerminator()) {
                 int oldIndex = index; // cursor to restore if the candidate is rejected
                 ++index; // step over the separator in front of the candidate

                 int oldBlen = blen; // buffer length before anything is appended
                 char c;
                 while (!isTerminatorOrIDSeparator(c = next())) {
                     if (oldBlen == blen) { // first character: emit the separator first
                         hadCountry = true; // we have a country, let variant parsing know
                         addSeparator();
                         ++oldBlen; // increment past the separator so oldBlen marks the country text
                     }
                     append(Character.toUpperCase(c));
                 }
                 --index; // unget

                 // characters copied into the buffer, not counting the separator
                 int charsAppended = blen - oldBlen;

                 if (charsAppended == 0) {
                     // Do nothing.  The candidate was empty, so the buffer is untouched
                     // and the cursor stays one position past the separator.
                 }
                 else if (charsAppended < 2 || charsAppended > 3) {
                     // It's not a country, so return index and blen to
                     // their previous values.
                     index = oldIndex;
                     --oldBlen; // undo the "past the separator" adjustment made in the loop
                     blen = oldBlen;
                     hadCountry = false;
                 }
                 else if (charsAppended == 3) {
                     initCountryTables();

                     /* convert 3 character code to 2 character code if possible *CWB*/
                     int offset = findIndex(_countries3, getString(oldBlen));
                     if (offset >= 0) {
                         set(oldBlen, _countries[offset]);
                     } else {
                         // not a current code; try the obsolete table
                         offset = findIndex(_obsoleteCountries3, getString(oldBlen));
                         if (offset >= 0) {
                             set(oldBlen, _obsoleteCountries[offset]);
                         }
                     }
                 }

                 // start of the country text in the buffer (equals blen when none was kept)
                 return oldBlen;
             }

             // already at a terminator: there is no country
             return blen;
         }

         /**
          * Advance index past country.
          * Index must be immediately after the script (if there is one, else language)
          * and IDSeparator.
          */
         private void skipCountry() {
             if (atTerminator()) {
                 return;
             }

             // Step over the separator.  A rejected candidate rewinds to this position
             // (not to the separator itself), since the format requires two separators
             // when the country is absent.
             final int afterSeparator = ++index;

             skipUntilTerminatorOrIDSeparator();

             final int length = index - afterSeparator;
             final boolean looksLikeCountry = (length == 2 || length == 3);
             if (!looksLikeCountry) {
                 index = afterSeparator;
             }
         }

         /**
          * Advance index past variant, and accumulate normalized variant in buffer.  This ignores
          * the codepage information from POSIX ids.  Index must be immediately after the country
          * or script.  Index is left at the keyword separator or at the end of the text.  Return
          * the start of the variant code in the buffer.
          *
          * In standard form, we can have the following forms:
          * ll__VVVV
          * ll_CC_VVVV
          * ll_Ssss_VVVV
          * ll_Ssss_CC_VVVV
          *
          * This also handles POSIX ids, which can have the following forms (pppp is code page id):
          * ll_CC.pppp          --> ll_CC
          * ll_CC.pppp@VVVV     --> ll_CC_VVVV
          * ll_CC@VVVV          --> ll_CC_VVVV
          *
          * We identify this use of '@' in POSIX ids by looking for an '=' following
          * the '@'.  If there is one, we consider '@' to start a keyword list, instead of
          * being part of a POSIX id.
          *
          * Note:  since it was decided that we want an option to not handle POSIX ids, this
          * becomes a bit more complex.
          */
         private int parseVariant() {
             int oldBlen = blen; // becomes the start of the variant text once separators are emitted

             boolean start = true;         // true until the first ordinary character has been consumed
             boolean needSeparator = true; // a separator must be emitted before the next appended character
             boolean skipping = false;     // true while inside a '.'-introduced section that is dropped
             char c;
             while ((c = next()) != DONE) {
                 if (c == DOT) {
                     // start dropping characters (the POSIX codepage) until a keyword separator shows up
                     start = false;
                     skipping = true;
                 } else if (c == KEYWORD_SEPARATOR) {
                     if (haveKeywordAssign()) {
                         // an assignment follows, so this begins a keyword list and the variant ends here
                         break;
                     }
                     // no assignment follows: treat the rest as more variant text (POSIX '@' form)
                     skipping = false;
                     start = false;
                     needSeparator = true; // add another underscore if we have more text
                 } else if (start) {
                     // the very first ordinary character is consumed without being copied
                     // (presumably the id separator in front of the variant -- confirm against callers)
                     start = false;
                 } else if (!skipping) {
                     if (needSeparator) {
                         boolean incOldBlen = blen == oldBlen; // need to skip separators
                         needSeparator = false;
                         if (incOldBlen && !hadCountry) { // no country, we'll need two
                             addSeparator();
                             ++oldBlen; // for sure
                         }
                         addSeparator();
                         if (incOldBlen) { // only for the first separator
                             ++oldBlen;
                         }
                     }
                     // normalize: upper case, with hyphen and comma mapped to underscore
                     c = Character.toUpperCase(c);
                     if (c == HYPHEN || c == COMMA) {
                         c = UNDERSCORE;
                     }
                     append(c);
                 }
             }
             --index; // unget

             return oldBlen;
         }

         // no need for skipvariant, to get the keywords we'll just scan directly for
         // the keyword separator

         /**
          * Returns the normalized language id, or the empty string.
          */
         public String getLanguage() {
             reset();
             final int start = parseLanguage();
             return getString(start);
         }

         /**
          * Returns the normalized script id, or the empty string.
          */
         public String getScript() {
             reset();
             // move the cursor past the language without copying it
             skipLanguage();
             final int start = parseScript();
             return getString(start);
         }

         /**
          * return the normalized country id, or the empty string.
          */
         public String getCountry() {
             reset();
             // move the cursor past language and script without copying them
             skipLanguage();
             skipScript();
             final int start = parseCountry();
             return getString(start);
         }

         /**
          * Returns the normalized variant id, or the empty string.
          */
         public String getVariant() {
             reset();
             // move the cursor past language, script and country without copying them
             skipLanguage();
             skipScript();
             skipCountry();
             final int start = parseVariant();
             return getString(start);
         }

         /**
          * Returns the language, script, country, and variant as separate strings.
          */
         public String[] getLanguageScriptCountryVariant() {
             reset();
             // The four parses must run in this order: each one continues from where
             // the previous one left the cursor and the buffer.
             final String[] parts = new String[4];
             parts[0] = getString(parseLanguage());
             parts[1] = getString(parseScript());
             parts[2] = getString(parseCountry());
             parts[3] = getString(parseVariant());
             return parts;
         }

         /**
          * Overrides the base name.  While the stored base name is non-null,
          * parseBaseName() and getBaseName() use it instead of parsing the id.
          */
         public void setBaseName(String baseName) {
             this.baseName = baseName;
         }

         /**
          * Fills the buffer with the base name: either the explicitly set base name,
          * or the language, script, country and variant parsed from the id.
          */
         public void parseBaseName() {
             if (baseName != null) {
                 // an explicit base name wins over whatever the id contains
                 set(0, baseName);
                 return;
             }

             reset();
             parseLanguage();
             parseScript();
             parseCountry();
             parseVariant();

             // catch unwanted trailing underscore after country if there was no variant
             final boolean trailingUnderscore = blen > 1 && buffer[blen-1] == UNDERSCORE;
             if (trailingUnderscore) {
                 --blen;
             }
         }

         /**
          * Returns the normalized base form of the locale id.  The base
          * form does not include keywords.
          */
         public String getBaseName() {
             if (baseName == null) {
                 // nothing set explicitly: derive the base name from the id
                 parseBaseName();
                 return getString(0);
             }
             return baseName;
         }

         /**
          * Returns the normalized full form of the locale id.  The full
          * form includes keywords if they are present.
          */
         public String getName() {
             // base name first, then the keyword list is appended to the same buffer
             parseBaseName();
             parseKeywords();
             final String fullName = getString(0);
             return fullName;
         }

         // keyword utilities

         /**
          * If we have keywords, advance index to the start of the keywords and return true,
          * otherwise return false.
          */
         private boolean setToKeywordStart() {
             // Locate the first keyword separator at or after the cursor.
             int separatorPos = -1;
             for (int pos = index; pos < id.length; ++pos) {
                 if (id[pos] == KEYWORD_SEPARATOR) {
                     separatorPos = pos;
                     break;
                 }
             }
             if (separatorPos < 0) {
                 return false;
             }

             final int keywordStart = separatorPos + 1;

             if (canonicalize) {
                 // When canonicalizing, the text after the separator only counts as a
                 // keyword list if an assignment appears somewhere in it.
                 for (int pos = keywordStart; pos < id.length; ++pos) {
                     if (id[pos] == KEYWORD_ASSIGN) {
                         index = keywordStart;
                         return true;
                     }
                 }
                 return false;
             }

             // Otherwise any text at all after the separator is enough.
             if (keywordStart < id.length) {
                 index = keywordStart;
                 return true;
             }
             return false;
         }

         /**
          * Returns true if the character is DONE or the keyword assignment character.
          */
         private static boolean isDoneOrKeywordAssign(char c) {
             if (c == KEYWORD_ASSIGN) {
                 return true;
             }
             return c == DONE;
         }

         /**
          * Returns true if the character is DONE or the keyword item separator.
          */
         private static boolean isDoneOrItemSeparator(char c) {
             if (c == ITEM_SEPARATOR) {
                 return true;
             }
             return c == DONE;
         }

         /**
          * Reads from the cursor up to the next keyword assignment or the end of the id,
          * leaves the cursor on that stopping point, and returns the text trimmed and
          * lower-cased.
          */
         private String getKeyword() {
             final int begin = index;
             char c;
             do {
                 c = next();
             } while (!isDoneOrKeywordAssign(c));
             --index; // unget the stopping character
             final String raw = new String(id, begin, index - begin);
             return AsciiUtil.toLowerString(raw.trim());
         }

         /**
          * Reads from the cursor up to the next item separator or the end of the id,
          * leaves the cursor on that stopping point, and returns the text trimmed but
          * with its case untouched.
          */
         private String getValue() {
             final int begin = index;
             char c;
             do {
                 c = next();
             } while (!isDoneOrItemSeparator(c));
             --index; // unget the stopping character
             final String raw = new String(id, begin, index - begin);
             return raw.trim(); // leave case alone
         }

         /**
          * Returns a comparator that orders keyword names by String.compareTo.
          */
         private Comparator getKeyComparator() {
             return new Comparator() {
                 public int compare(Object lhs, Object rhs) {
                     final String left = (String)lhs;
                     final String right = (String)rhs;
                     return left.compareTo(right);
                 }
             };
         }

         /**
          * Returns a map of the keywords and values, or an empty map if there are none.
          */
         private Map getKeywordMap() {
             // The map is built at most once and then cached in 'keywords'.
             if (keywords == null) {
                 TreeMap m = null; // created lazily, on the first valid key/value pair
                 if (setToKeywordStart()) {
                     // Keys are trimmed and lower-cased (getKeyword); values are trimmed
                     // but keep their case (getValue).
                     do {
                         String key = getKeyword();
                         if (key.length() == 0) {
                             break;
                         }
                         // consume the character getKeyword() stopped on
                         char c = next();
                         if (c != KEYWORD_ASSIGN) {
                             // Key without a value: silently ignored rather than rejected.
                             // throw new IllegalArgumentException("key '" + key + "' missing a value.");
                             if (c == DONE) {
                                 break;
                             } else {
                                 continue;
                             }
                         }
                         String value = getValue();
                         if (value.length() == 0) {
                             // Empty value: the pair is skipped rather than rejected.
                             // throw new IllegalArgumentException("key '" + key + "' missing a value.");
                             continue;
                         }
                         if (m == null) {
                             m = new TreeMap(getKeyComparator());
                         } else if (m.containsKey(key)) {
                             // Duplicate key: the first value wins.
                             // throw new IllegalArgumentException("key '" + key + "' already has a value.");
                             continue;
                         }
                         m.put(key, value);
                     } while (next() == ITEM_SEPARATOR); // 'continue' also lands on this test, which consumes one character
                 }
                 // never cache null: an id without keywords gets the shared empty map
                 keywords = m != null ? m : Collections.EMPTY_MAP;
             }

             return keywords;
         }


         /**
          * Parse the keywords and return start of the string in the buffer.
          */
         private int parseKeywords() {
             final int startLen = blen;
             final Map map = getKeywordMap();
             if (map.isEmpty()) {
                 return startLen;
             }

             // Emit "@key=value;key=value...": the keyword separator before the first
             // entry, the item separator before each later one.
             boolean first = true;
             for (Iterator it = map.entrySet().iterator(); it.hasNext(); ) {
                 append(first ? KEYWORD_SEPARATOR : ITEM_SEPARATOR);
                 first = false;
                 final Map.Entry entry = (Map.Entry)it.next();
                 append((String)entry.getKey());
                 append(KEYWORD_ASSIGN);
                 append((String)entry.getValue());
             }

             // If anything was written, the keyword text starts just past the leading separator.
             return (blen != startLen) ? startLen + 1 : startLen;
         }

         /**
          * Returns an iterator over the keywords, or null if we have an empty map.
          */
         public Iterator getKeywords() {
             final Map map = getKeywordMap();
             if (map.isEmpty()) {
                 return null;
             }
             return map.keySet().iterator();
         }

         /**
          * Returns the value for the named keyword, or null if the keyword is not
          * present.
          */
         public String getKeywordValue(String keywordName) {
             final Map map = getKeywordMap();
             if (map.isEmpty()) {
                 return null;
             }
             // keys are stored trimmed and lower-cased, so normalize the lookup name the same way
             final String key = AsciiUtil.toLowerString(keywordName.trim());
             return (String)map.get(key);
         }

         /**
          * Set the keyword value only if it is not already set to something else.
          */
         public void defaultKeywordValue(String keywordName, String value) {
             // reset == false: a keyword that already has a value is left untouched
             setKeywordValue(keywordName, value, false);
         }

         /**
          * Set the value for the named keyword, or unset it if value is null.  If
          * keywordName itself is null, unset all keywords.  Neither keywordName nor
          * value may be empty (after trimming).
          */
         public void setKeywordValue(String keywordName, String value) {
             // reset == true: any existing value for the keyword is replaced or removed
             setKeywordValue(keywordName, value, true);
         }

         /**
          * Set the value for the named keyword, or unset it if value is null.  If
          * keywordName itself is null, unset all keywords.  Neither keywordName nor
          * value may be empty (after trimming).  If reset is true, ignore any previous
          * value for the keyword, otherwise do not change a keyword that already has a
          * value (and do not remove all keywords when keywordName is null).
          */
         private void setKeywordValue(String keywordName, String value, boolean reset) {
             // A null keyword name addresses the whole keyword list.
             if (keywordName == null) {
                 if (reset) {
                     // force new map, ignore value
                     keywords = Collections.EMPTY_MAP;
                 }
                 return;
             }

             // Normalize and validate the arguments before touching the map.
             keywordName = AsciiUtil.toLowerString(keywordName.trim());
             if (keywordName.length() == 0) {
                 throw new IllegalArgumentException("keyword must not be empty");
             }
             if (value != null) {
                 value = value.trim();
                 if (value.length() == 0) {
                     throw new IllegalArgumentException("value must not be empty");
                 }
             }

             final Map current = getKeywordMap();

             if (current.isEmpty()) { // it is EMPTY_MAP
                 // Nothing to remove; a set needs a fresh map in place of the empty one.
                 if (value != null) {
                     keywords = new TreeMap(getKeyComparator());
                     keywords.put(keywordName, value); // value was already trimmed above
                 }
                 return;
             }

             // Without reset, a keyword that already has a value is left alone.
             if (!reset && current.containsKey(keywordName)) {
                 return;
             }

             if (value != null) {
                 current.put(keywordName, value);
                 return;
             }

             current.remove(keywordName);
             if (current.isEmpty()) {
                 // force new map
                 keywords = Collections.EMPTY_MAP;
             }
         }
     }

     /**
      * linear search of the string array. the arrays are unfortunately ordered by the
      * two-letter target code, not the three-letter search code, which seems backwards.
      */
     private static int findIndex(String[] array, String target){
         // Plain front-to-back scan; the first match wins.
         int pos = 0;
         while (pos < array.length) {
             if (target.equals(array[pos])) {
                 return pos;
             }
             pos++;
         }
         return -1;
     }

     /**
      * Returns the canonical name for the specified locale ID.  This is used to convert POSIX
      * and other grandfathered IDs to standard ICU form.
      * @param localeID the locale id
      * @return the canonicalized id
      * @stable ICU 3.0
      */
     public static String canonicalize(String localeID){
         final IDParser idParser = new IDParser(localeID, true);
         String base = idParser.getBaseName();

         // Only a completely empty id is returned as-is.  Formerly an empty base name
         // was mapped to "en_US_POSIX"; requiring the entire id to be empty lets
         // "@foo=bar" pass through unchanged, and {dlf} prefers to keep "" unchanged.
         if (localeID.equals("")) {
             return "";
         }

         // we have an ID in the form xx_Yyyy_ZZ_KKKKK

         initCANONICALIZE_MAP();

         boolean matched = false;

         /* convert the variants to appropriate ID */
         for (int i = 0; i < variantsToKeywords.length; i++) {
             final String[] entry = variantsToKeywords[i];
             final int cut = base.lastIndexOf("_" + entry[0]);
             if (cut < 0) {
                 continue;
             }
             matched = true;

             // drop the variant, plus one more trailing underscore if one is left behind
             base = base.substring(0, cut);
             if (base.endsWith("_")) {
                 base = base.substring(0, cut - 1);
             }
             idParser.setBaseName(base);
             idParser.defaultKeywordValue(entry[1], entry[2]);
             break;
         }

         /* See if this is an already known locale */
         for (int i = 0; i < CANONICALIZE_MAP.length; i++) {
             final String[] row = CANONICALIZE_MAP[i];
             if (!row[0].equals(base)) {
                 continue;
             }
             matched = true;

             idParser.setBaseName(row[1]);
             if (row[2] != null) {
                 idParser.defaultKeywordValue(row[2], row[3]);
             }
             break;
         }

         /* total mondo hack for Norwegian, fortunately the main NY case is handled earlier */
         if (!matched
                 && idParser.getLanguage().equals("nb")
                 && idParser.getVariant().equals("NY")) {
             idParser.setBaseName(lscvToID("nn", idParser.getScript(), idParser.getCountry(), null));
         }

         return idParser.getName();
     }

     /**
      * Given a keyword and a value, return a new locale with an updated
      * keyword and value.  If keyword is null, this removes all keywords from the locale id.
      * Otherwise, if the value is null, this removes the value for this keyword from the
      * locale id.  Otherwise, this adds/replaces the value for this keyword in the locale id.
      * The keyword and value must not be empty.
      * @param keyword the keyword to add/remove, or null to remove all keywords.
      * @param value the value to add/set, or null to remove this particular keyword.
      * @return the updated locale
      * @stable ICU 3.2
      */
     public ULocale setKeywordValue(String keyword, String value) {
         // Rewrite this locale's id with the static overload and wrap the result in a
         // new ULocale; this instance is not modified.
         return new ULocale(setKeywordValue(localeID, keyword, value), (Locale)null);
     }

     /**
      * Given a locale id, a keyword, and a value, return a new locale id with an updated
      * keyword and value.  If keyword is null, this removes all keywords from the locale id.
      * Otherwise, if the value is null, this removes the value for this keyword from the
      * locale id.  Otherwise, this adds/replaces the value for this keyword in the locale id.
      * The keyword and value must not be empty.
      * @param localeID the locale id to modify
      * @param keyword the keyword to add/remove, or null to remove all keywords.
      * @param value the value to add/set, or null to remove this particular keyword.
      * @return the updated locale id
      * @stable ICU 3.2
      */
     public static String setKeywordValue(String localeID, String keyword, String value) {
         IDParser parser = new IDParser(localeID);
         // update the parser's keyword map, then regenerate the full id from it
         parser.setKeywordValue(keyword, value);
         return parser.getName();
     }

     /*
      * Given a locale id, a keyword, and a value, return a new locale id with an updated
      * keyword and value, if the keyword does not already have a value.  The keyword and
      * value must not be null or empty.
      * @param localeID the locale id to modify
      * @param keyword the keyword to add, if not already present
      * @param value the value to add, if not already present
      * @return the updated locale id
      * @internal
      */
 /*    private static String defaultKeywordValue(String localeID, String keyword, String value) {
         IDParser parser = new IDParser(localeID);
         parser.defaultKeywordValue(keyword, value);
         return parser.getName();
     }*/

     /**
      * Returns a three-letter abbreviation for this locale's language.  If the locale
      * doesn't specify a language, returns the empty string.  Otherwise, returns
      * a lowercase ISO 639-2/T language code.
      * The ISO 639-2 language codes can be found on-line at
      *   <a href="ftp://dkuug.dk/i18n/iso-639-2.txt"><code>ftp://dkuug.dk/i18n/iso-639-2.txt</code></a>
      * @exception MissingResourceException Throws MissingResourceException if the
      * three-letter language abbreviation is not available for this locale.
      * @stable ICU 3.0
      */
     public String getISO3Language(){
         // delegate to the static overload using this locale's id
         return getISO3Language(localeID);
     }

     /**
      * Returns a three-letter abbreviation for this locale's language.  If the locale
      * doesn't specify a language, returns the empty string.  Otherwise, returns
      * a lowercase ISO 639-2/T language code.
      * The ISO 639-2 language codes can be found on-line at
      *   <a href="ftp://dkuug.dk/i18n/iso-639-2.txt"><code>ftp://dkuug.dk/i18n/iso-639-2.txt</code></a>
      * @exception MissingResourceException Throws MissingResourceException if the
      * three-letter language abbreviation is not available for this locale.
      * @stable ICU 3.0
      */
     public static String getISO3Language(String localeID){
         initLanguageTables();

         final String language = getLanguage(localeID);

         // current codes first
         int pos = findIndex(_languages, language);
         if (pos >= 0) {
             return _languages3[pos];
         }

         // then obsolete codes; anything else has no three-letter form here
         pos = findIndex(_obsoleteLanguages, language);
         return (pos >= 0) ? _obsoleteLanguages3[pos] : EMPTY_STRING;
     }

     /**
      * Returns a three-letter abbreviation for this locale's country/region.  If the locale
      * doesn't specify a country, returns the empty string.  Otherwise, returns
      * an uppercase ISO 3166 3-letter country code.
      * @exception MissingResourceException Throws MissingResourceException if the
      * three-letter country abbreviation is not available for this locale.
      * @stable ICU 3.0
      */
     public String getISO3Country(){
         // delegate to the static overload using this locale's id
         return getISO3Country(localeID);
     }
     /**
      * Returns a three-letter abbreviation for this locale's country/region.  If the locale
      * doesn't specify a country, returns the empty string.  Otherwise, returns
      * an uppercase ISO 3166 3-letter country code.
      * @exception MissingResourceException Throws MissingResourceException if the
      * three-letter country abbreviation is not available for this locale.
      * @stable ICU 3.0
      */
     public static String getISO3Country(String localeID){
         initCountryTables();

         final String country = getCountry(localeID);

         // current codes first
         int pos = findIndex(_countries, country);
         if (pos >= 0) {
             return _countries3[pos];
         }

         // then obsolete codes; anything else has no three-letter form here
         pos = findIndex(_obsoleteCountries, country);
         return (pos >= 0) ? _obsoleteCountries3[pos] : EMPTY_STRING;
     }

     // display names

     /**
      * Utility to fetch locale display data from resource bundle tables.
      */
     private static String getTableString(String tableName, String subtableName, String item, String displayLocaleID) {
         // Nothing to look up for an empty item.
         if (item.length() == 0) {
             return item;
         }
         try {
             final ICUResourceBundle bundle = (ICUResourceBundle)UResourceBundle.
               getBundleInstance(ICUResourceBundle.ICU_BASE_NAME, displayLocaleID);
             return getTableString(tableName, subtableName, item, bundle);
         } catch (Exception ignored) {
             // Best effort: any failure to load or query the bundle yields the raw item.
             return item;
         }
     }

     /**
      * Utility to fetch locale display data from resource bundle tables.
      */
     private static String getTableString(String tableName, String subtableName, String item, ICUResourceBundle bundle) {
         // Looks up the display string for 'item' in bundle[tableName] (or in
         // bundle[tableName][subtableName] when a subtable is given).  On a miss it
         // retries with the current id of a deprecated country/language code, then
         // follows the table's "Fallback" locale.  Any failure returns 'item' itself.
         try {
             for (;;) {
                 // special case currency
                 if ("currency".equals(subtableName)) {
                     ICUResourceBundle table = bundle.getWithFallback("Currencies");
                     table = table.getWithFallback(item);
                     return table.getString(1);
                 } else {
                     ICUResourceBundle table = bundle.getWithFallback(tableName);
                     try {
                         if (subtableName != null) {
                             table = table.getWithFallback(subtableName);
                         }
                         return table.getStringWithFallback(item);
                     }
                     catch (MissingResourceException e) {

                         if(subtableName==null){
                             try{
                                 // may be a deprecated code
                                 String currentName = null;
                                 if(tableName.equals("Countries")){
                                     currentName = getCurrentCountryID(item);
                                 }else if(tableName.equals("Languages")){
                                     currentName = getCurrentLanguageID(item);
                                 }
                                 // Only countries and languages have a deprecated-code
                                 // mapping.  For every other table currentName stays null,
                                 // and a lookup with a null key must not be attempted: a
                                 // failure other than MissingResourceException would jump
                                 // to the outer handler and skip the fallback-locale
                                 // search below.
                                 if (currentName != null) {
                                     return table.getStringWithFallback(currentName);
                                 }
                             }catch (MissingResourceException ex){/* fall through*/}
                         }

                         // still can't figure out ?.. try the fallback mechanism
                         String fallbackLocale = table.getWithFallback("Fallback").getString();
                         if (fallbackLocale.length() == 0) {
                             fallbackLocale = "root";
                         }
                         // The fallback points back at the table's own locale: give up
                         // instead of looping forever.
                         if(fallbackLocale.equals(table.getULocale().localeID)){
                             return item;
                         }
                         bundle = (ICUResourceBundle)UResourceBundle.getBundleInstance(ICUResourceBundle.ICU_BASE_NAME,
                                                                                       fallbackLocale);
                     }
                 }
             }
         }
         catch (Exception e) {
             // Best effort: any resource failure (missing table, missing "Fallback"
             // entry, unloadable bundle, ...) yields the raw item.
         }
         return item;
     }

     /**
      * Returns this locale's language localized for display in the default locale.
      * @return the localized language name.
      * @stable ICU 3.0
      */
     public String getDisplayLanguage() {
         // Display in the current default locale.
         final String defaultDisplayID = getDefault().localeID;
         return getDisplayLanguageInternal(this.localeID, defaultDisplayID);
     }

     /**
      * Returns this locale's language localized for display in the provided locale.
      * @param displayLocale the locale in which to display the name.
      * @return the localized language name.
      * @stable ICU 3.0
      */
     public String getDisplayLanguage(ULocale displayLocale) {
         // The ID held by a ULocale is passed to the helper as-is.
         final String displayID = displayLocale.localeID;
         return getDisplayLanguageInternal(this.localeID, displayID);
     }

     /**
      * Returns a locale's language localized for display in the provided locale.
      * This is a cover for the ICU4C API.
      * @param localeID the id of the locale whose language will be displayed
      * @param displayLocaleID the id of the locale in which to display the name.
      * @return the localized language name.
      * @stable ICU 3.0
      */
     public static String getDisplayLanguage(String localeID, String displayLocaleID) {
         // The internal helper expects a canonical display ID, so the raw
         // string is run through getName() first.
         final String canonicalDisplayID = getName(displayLocaleID);
         return getDisplayLanguageInternal(localeID, canonicalDisplayID);
     }

     /**
      * Returns a locale's language localized for display in the provided locale.
      * This is a cover for the ICU4C API.
      * @param localeID the id of the locale whose language will be displayed.
      * @param displayLocale the locale in which to display the name.
      * @return the localized language name.
      * @stable ICU 3.0
      */
     public static String getDisplayLanguage(String localeID, ULocale displayLocale) {
         // The ID held by a ULocale is passed to the helper as-is.
         final String displayID = displayLocale.localeID;
         return getDisplayLanguageInternal(localeID, displayID);
     }

     static String getCurrentCountryID(String oldID){
         // Maps a deprecated country code to its replacement; codes that are
         // not in the deprecated table are returned unchanged.
         initCountryTables();
         final int index = findIndex(_deprecatedCountries, oldID);
         return (index < 0) ? oldID : _replacementCountries[index];
     }
     static String getCurrentLanguageID(String oldID){
         // Maps an obsolete language code to its replacement; codes that are
         // not in the obsolete table are returned unchanged.
         initLanguageTables();
         final int index = findIndex(_obsoleteLanguages, oldID);
         return (index < 0) ? oldID : _replacementLanguages[index];
     }


     // displayLocaleID is canonical, localeID need not be since parsing will fix this.
     private static String getDisplayLanguageInternal(String localeID, String displayLocaleID) {
         // Pull the language field out of the ID, then localize it.
         final String language = new IDParser(localeID).getLanguage();
         return getTableString("Languages", null, language, displayLocaleID);
     }

     /**
      * Returns this locale's script localized for display in the default locale.
      * @return the localized script name.
      * @stable ICU 3.0
      */
     public String getDisplayScript() {
         // Display in the current default locale.
         final String defaultDisplayID = getDefault().localeID;
         return getDisplayScriptInternal(this.localeID, defaultDisplayID);
     }

     /**
      * Returns this locale's script localized for display in the provided locale.
      * @param displayLocale the locale in which to display the name.
      * @return the localized script name.
      * @stable ICU 3.0
      */
     public String getDisplayScript(ULocale displayLocale) {
         // The ID held by a ULocale is passed to the helper as-is.
         final String displayID = displayLocale.localeID;
         return getDisplayScriptInternal(this.localeID, displayID);
     }

     /**
      * Returns a locale's script localized for display in the provided locale.
      * This is a cover for the ICU4C API.
      * @param localeID the id of the locale whose script will be displayed
      * @param displayLocaleID the id of the locale in which to display the name.
      * @return the localized script name.
      * @stable ICU 3.0
      */
     public static String getDisplayScript(String localeID, String displayLocaleID) {
         // The internal helper expects a canonical display ID, so the raw
         // string is run through getName() first.
         final String canonicalDisplayID = getName(displayLocaleID);
         return getDisplayScriptInternal(localeID, canonicalDisplayID);
     }

     /**
      * Returns a locale's script localized for display in the provided locale.
      * @param localeID the id of the locale whose script will be displayed.
      * @param displayLocale the locale in which to display the name.
      * @return the localized script name.
      * @stable ICU 3.0
      */
     public static String getDisplayScript(String localeID, ULocale displayLocale) {
         // The ID held by a ULocale is passed to the helper as-is.
         final String displayID = displayLocale.localeID;
         return getDisplayScriptInternal(localeID, displayID);
     }

     // displayLocaleID is canonical, localeID need not be since parsing will fix this.
     private static String getDisplayScriptInternal(String localeID, String displayLocaleID) {
         // Pull the script field out of the ID, then localize it.
         final String script = new IDParser(localeID).getScript();
         return getTableString("Scripts", null, script, displayLocaleID);
     }

     /**
      * Returns this locale's country localized for display in the default locale.
      * @return the localized country name.
      * @stable ICU 3.0
      */
     public String getDisplayCountry() {
         // Display in the current default locale.
         final String defaultDisplayID = getDefault().localeID;
         return getDisplayCountryInternal(this.localeID, defaultDisplayID);
     }

     /**
      * Returns this locale's country localized for display in the provided locale.
      * @param displayLocale the locale in which to display the name.
      * @return the localized country name.
      * @stable ICU 3.0
      */
     public String getDisplayCountry(ULocale displayLocale){
         // The ID held by a ULocale is passed to the helper as-is.
         final String displayID = displayLocale.localeID;
         return getDisplayCountryInternal(this.localeID, displayID);
     }

     /**
      * Returns a locale's country localized for display in the provided locale.
      * This is a cover for the ICU4C API.
      * @param localeID the id of the locale whose country will be displayed
      * @param displayLocaleID the id of the locale in which to display the name.
      * @return the localized country name.
      * @stable ICU 3.0
      */
     public static String getDisplayCountry(String localeID, String displayLocaleID) {
         // The internal helper expects a canonical display ID, so the raw
         // string is run through getName() first.
         final String canonicalDisplayID = getName(displayLocaleID);
         return getDisplayCountryInternal(localeID, canonicalDisplayID);
     }

     /**
      * Returns a locale's country localized for display in the provided locale.
      * This is a cover for the ICU4C API.
      * @param localeID the id of the locale whose country will be displayed.
      * @param displayLocale the locale in which to display the name.
      * @return the localized country name.
      * @stable ICU 3.0
      */
     public static String getDisplayCountry(String localeID, ULocale displayLocale) {
         // The ID held by a ULocale is passed to the helper as-is.
         final String displayID = displayLocale.localeID;
         return getDisplayCountryInternal(localeID, displayID);
     }

     // displayLocaleID is canonical, localeID need not be since parsing will fix this.
     private static String getDisplayCountryInternal(String localeID, String displayLocaleID) {
         // Pull the country field out of the ID, then localize it.
         final String country = new IDParser(localeID).getCountry();
         return getTableString("Countries", null, country, displayLocaleID);
     }

     /**
      * Returns this locale's variant localized for display in the default locale.
      * @return the localized variant name.
      * @stable ICU 3.0
      */
     public String getDisplayVariant() {
         // Display in the current default locale.
         final String defaultDisplayID = getDefault().localeID;
         return getDisplayVariantInternal(this.localeID, defaultDisplayID);
     }

     /**
      * Returns this locale's variant localized for display in the provided locale.
      * @param displayLocale the locale in which to display the name.
      * @return the localized variant name.
      * @stable ICU 3.0
      */
     public String getDisplayVariant(ULocale displayLocale) {
         // The ID held by a ULocale is passed to the helper as-is.
         final String displayID = displayLocale.localeID;
         return getDisplayVariantInternal(this.localeID, displayID);
     }

     /**
      * Returns a locale's variant localized for display in the provided locale.
      * This is a cover for the ICU4C API.
      * @param localeID the id of the locale whose variant will be displayed
      * @param displayLocaleID the id of the locale in which to display the name.
      * @return the localized variant name.
      * @stable ICU 3.0
      */
     public static String getDisplayVariant(String localeID, String displayLocaleID){
         // The internal helper expects a canonical display ID, so the raw
         // string is run through getName() first.
         final String canonicalDisplayID = getName(displayLocaleID);
         return getDisplayVariantInternal(localeID, canonicalDisplayID);
     }

     /**
      * Returns a locale's variant localized for display in the provided locale.
      * This is a cover for the ICU4C API.
      * @param localeID the id of the locale whose variant will be displayed.
      * @param displayLocale the locale in which to display the name.
      * @return the localized variant name.
      * @stable ICU 3.0
      */
     public static String getDisplayVariant(String localeID, ULocale displayLocale) {
         // The ID held by a ULocale is passed to the helper as-is.
         final String displayID = displayLocale.localeID;
         return getDisplayVariantInternal(localeID, displayID);
     }

     // displayLocaleID is canonical, localeID need not be since parsing will fix this.
     private static String getDisplayVariantInternal(String localeID, String displayLocaleID) {
         // Pull the variant field out of the ID, then localize it.
         final String variant = new IDParser(localeID).getVariant();
         return getTableString("Variants", null, variant, displayLocaleID);
     }

     /**
      * Returns a keyword localized for display in the default locale.
      * @param keyword the keyword to be displayed.
      * @return the localized keyword name.
      * @see #getKeywords()
      * @stable ICU 3.0
      */
     public static String getDisplayKeyword(String keyword) {
         // Display in the current default locale.
         final String defaultDisplayID = getDefault().localeID;
         return getDisplayKeywordInternal(keyword, defaultDisplayID);
     }

     /**
      * Returns a keyword localized for display in the specified locale.
      * @param keyword the keyword to be displayed.
      * @param displayLocaleID the id of the locale in which to display the keyword.
      * @return the localized keyword name.
      * @see #getKeywords(String)
      * @stable ICU 3.0
      */
     public static String getDisplayKeyword(String keyword, String displayLocaleID) {
         // The internal helper expects a canonical display ID, so the raw
         // string is run through getName() first.
         final String canonicalDisplayID = getName(displayLocaleID);
         return getDisplayKeywordInternal(keyword, canonicalDisplayID);
     }

     /**
      * Returns a keyword localized for display in the specified locale.
      * @param keyword the keyword to be displayed.
      * @param displayLocale the locale in which to display the keyword.
      * @return the localized keyword name.
      * @see #getKeywords(String)
      * @stable ICU 3.0
      */
     public static String getDisplayKeyword(String keyword, ULocale displayLocale) {
         // The ID held by a ULocale is passed to the helper as-is.
         final String displayID = displayLocale.localeID;
         return getDisplayKeywordInternal(keyword, displayID);
     }

     // displayLocaleID is canonical; the keyword is trimmed and lower-cased before lookup.
     private static String getDisplayKeywordInternal(String keyword, String displayLocaleID) {
         // The keyword is trimmed and lower-cased before the "Keys" lookup.
         final String normalizedKey = AsciiUtil.toLowerString(keyword.trim());
         return getTableString("Keys", null, normalizedKey, displayLocaleID);
     }

     /**
      * Returns a keyword value localized for display in the default locale.
      * @param keyword the keyword whose value is to be displayed.
      * @return the localized value name.
      * @stable ICU 3.0
      */
     public String getDisplayKeywordValue(String keyword) {
         // Display in the current default locale.
         final String defaultDisplayID = getDefault().localeID;
         return getDisplayKeywordValueInternal(this.localeID, keyword, defaultDisplayID);
     }

     /**
      * Returns a keyword value localized for display in the specified locale.
      * @param keyword the keyword whose value is to be displayed.
      * @param displayLocale the locale in which to display the value.
      * @return the localized value name.
      * @stable ICU 3.0
      */
     public String getDisplayKeywordValue(String keyword, ULocale displayLocale) {
         // The ID held by a ULocale is passed to the helper as-is.
         final String displayID = displayLocale.localeID;
         return getDisplayKeywordValueInternal(this.localeID, keyword, displayID);
     }

     /**
      * Returns a keyword value localized for display in the specified locale.
      * This is a cover for the ICU4C API.
      * @param localeID the id of the locale whose keyword value is to be displayed.
      * @param keyword the keyword whose value is to be displayed.
      * @param displayLocaleID the id of the locale in which to display the value.
      * @return the localized value name.
      * @stable ICU 3.0
      */
     public static String getDisplayKeywordValue(String localeID, String keyword, String displayLocaleID) {
         // The internal helper expects a canonical display ID, so the raw
         // string is run through getName() first.
         final String canonicalDisplayID = getName(displayLocaleID);
         return getDisplayKeywordValueInternal(localeID, keyword, canonicalDisplayID);
     }

     /**
      * Returns a keyword value localized for display in the specified locale.
      * This is a cover for the ICU4C API.
      * @param localeID the id of the locale whose keyword value is to be displayed.
      * @param keyword the keyword whose value is to be displayed.
      * @param displayLocale the locale in which to display the value.
      * @return the localized value name.
      * @stable ICU 3.0
      */
     public static String getDisplayKeywordValue(String localeID, String keyword, ULocale displayLocale) {
         // The ID held by a ULocale is passed to the helper as-is.
         final String displayID = displayLocale.localeID;
         return getDisplayKeywordValueInternal(localeID, keyword, displayID);
     }

     // displayLocaleID is canonical, localeID need not be since parsing will fix this.
     private static String getDisplayKeywordValueInternal(String localeID, String keyword, String displayLocaleID) {
         // The same trimmed, lower-cased key is used both to read the value
         // from the locale ID and to select the "Types" subtable.
         final String normalizedKey = AsciiUtil.toLowerString(keyword.trim());
         // NOTE(review): if getKeywordValue() can return null for a keyword the
         // locale does not carry, getTableString() will dereference it - confirm.
         final String rawValue = new IDParser(localeID).getKeywordValue(normalizedKey);
         return getTableString("Types", normalizedKey, rawValue, displayLocaleID);
     }

     /**
      * Returns this locale name localized for display in the default locale.
      * @return the localized locale name.
      * @stable ICU 3.0
      */
     public String getDisplayName() {
         // Display in the current default locale.
         final String defaultDisplayID = getDefault().localeID;
         return getDisplayNameInternal(this.localeID, defaultDisplayID);
     }

     /**
      * Returns this locale name localized for display in the provided locale.
      * @param displayLocale the locale in which to display the locale name.
      * @return the localized locale name.
      * @stable ICU 3.0
      */
     public String getDisplayName(ULocale displayLocale) {
         // The ID held by a ULocale is passed to the helper as-is.
         final String displayID = displayLocale.localeID;
         return getDisplayNameInternal(this.localeID, displayID);
     }

     /**
      * Returns the locale ID localized for display in the provided locale.
      * This is a cover for the ICU4C API.
      * @param localeID the locale whose name is to be displayed.
      * @param displayLocaleID the id of the locale in which to display the locale name.
      * @return the localized locale name.
      * @stable ICU 3.0
      */
     public static String getDisplayName(String localeID, String displayLocaleID) {
         // The internal helper expects a canonical display ID, so the raw
         // string is run through getName() first.
         final String canonicalDisplayID = getName(displayLocaleID);
         return getDisplayNameInternal(localeID, canonicalDisplayID);
     }

     /**
      * Returns the locale ID localized for display in the provided locale.
      * This is a cover for the ICU4C API.
      * @param localeID the locale whose name is to be displayed.
      * @param displayLocale the locale in which to display the locale name.
      * @return the localized locale name.
      * @stable ICU 3.0
      */
     public static String getDisplayName(String localeID, ULocale displayLocale) {
         // The ID held by a ULocale is passed to the helper as-is.
         final String displayID = displayLocale.localeID;
         return getDisplayNameInternal(localeID, displayID);
     }

     // displayLocaleID is canonical, localeID need not be since parsing will fix this.
     private static String getDisplayNameInternal(String localeID, String displayLocaleID) {
         // Possible output shapes:
         //   lang
         //   lang (script, country, variant, keyword=value, ...)
         //   script, country, variant, keyword=value, ...

         ICUResourceBundle displayBundle = (ICUResourceBundle)UResourceBundle.getBundleInstance(
                 ICUResourceBundle.ICU_BASE_NAME, displayLocaleID);

         IDParser idParser = new IDParser(localeID);
         String[] fields = idParser.getLanguageScriptCountryVariant();
         // Display table for each field, in the same order as the fields array.
         final String[] fieldTables = { "Languages", "Scripts", "Countries", "Variants" };

         // A parenthesis is opened only when a language leads the name; without
         // one, every part is simply comma-separated.
         final boolean startsWithLanguage = fields[0].length() > 0;
         boolean parenOpened = false;
         StringBuffer result = new StringBuffer();

         for (int f = 0; f < fields.length; ++f) {
             if (fields[f].length() == 0) {
                 continue; // field absent from the ID
             }
             String display = getTableString(fieldTables[f], null, fields[f], displayBundle);
             if (result.length() > 0) { // need a separator
                 if (startsWithLanguage && !parenOpened) {
                     result.append(" (");
                     parenOpened = true;
                 } else {
                     result.append(", ");
                 }
             }
             result.append(display);
         }

         // Keywords follow the fields as localized "key=value" pairs.
         Map keywords = idParser.getKeywordMap();
         for (Iterator it = keywords.entrySet().iterator(); it.hasNext();) {
             if (result.length() > 0) {
                 if (startsWithLanguage && !parenOpened) {
                     result.append(" (");
                     parenOpened = true;
                 } else {
                     result.append(", ");
                 }
             }
             Map.Entry entry = (Map.Entry)it.next();
             String key = (String)entry.getKey();
             String value = (String)entry.getValue();
             result.append(getTableString("Keys", null, key, displayBundle));
             result.append("=");
             result.append(getTableString("Types", key, value, displayBundle));
         }

         if (parenOpened) {
             result.append(")");
         }

         return result.toString();
     }

     /**
      * Returns this locale's layout orientation for characters.  The possible
      * values are "left-to-right", "right-to-left", "top-to-bottom" or
      * "bottom-to-top".
      * @return The locale's layout orientation for characters.
      * @stable ICU 4.0
      */
     public String getCharacterOrientation() {
         // Reads the "characters" entry of this locale's own "layout" table.
         final String ownName = getName();
         return getTableString("layout", null, "characters", ownName);
     }

     /**
      * Returns this locale's layout orientation for lines.  The possible
      * values are "left-to-right", "right-to-left", "top-to-bottom" or
      * "bottom-to-top".
      * @return The locale's layout orientation for lines.
      * @stable ICU 4.0
      */
     public String getLineOrientation() {
         // Reads the "lines" entry of this locale's own "layout" table.
         final String ownName = getName();
         return getTableString("layout", null, "lines", ownName);
     }

     /**
      * Selector for <tt>getLocale()</tt> indicating the locale of the
      * resource containing the data.  This is always at or above the
      * valid locale.  If the valid locale does not contain the
      * specific data being requested, then the actual locale will be
      * above the valid locale.  If the object was not constructed from
      * locale data, then the actual locale is <i>null</i>.
      *
      * @draft ICU 2.8 (retain)
      * @provisional This API might change or be removed in a future release.
      */
     public static Type ACTUAL_LOCALE = new Type(); // NOTE(review): not final, so outside code could reassign this selector - confirm intended

     /**
      * Selector for <tt>getLocale()</tt> indicating the most specific
      * locale for which any data exists.  This is always at or above
      * the requested locale, and at or below the actual locale.  If
      * the requested locale does not correspond to any resource data,
      * then the valid locale will be above the requested locale.  If
      * the object was not constructed from locale data, then the
      * valid locale is <i>null</i>.
      *
      * <p>Note: The valid locale will be returned correctly in ICU
      * 3.0 or later.  In ICU 2.8, it is not returned correctly.
      * @draft ICU 2.8 (retain)
      * @provisional This API might change or be removed in a future release.
      */
     public static Type VALID_LOCALE = new Type(); // NOTE(review): not final, so outside code could reassign this selector - confirm intended

     /**
      * Opaque selector enum for <tt>getLocale()</tt>.
      * @see com.ibm.icu.util.ULocale
      * @see com.ibm.icu.util.ULocale#ACTUAL_LOCALE
      * @see com.ibm.icu.util.ULocale#VALID_LOCALE
      * @draft ICU 2.8 (retainAll)
      * @provisional This API might change or be removed in a future release.
      */
     public static final class Type {
         // The private constructor keeps code outside the enclosing class from
         // creating instances.  A Type carries no state, so instances can only
         // be told apart by reference.
         private Type() {
         }
     }

   /**
     * Based on a HTTP formatted list of acceptable locales, determine an available locale for the user.
     * NullPointerException is thrown if acceptLanguageList or availableLocales is
     * null.  If fallback is non-null, it will contain true if a fallback locale (one
     * not in the acceptLanguageList) was returned.  The value on entry is ignored.
     * ULocale will be one of the locales in availableLocales, or the ROOT ULocale
     * if a ROOT locale was used as a fallback (because nothing else in
     * availableLocales matched).  No ULocale array element should be null; behavior
     * is undefined if this is the case.
     * @param acceptLanguageList list in HTTP "Accept-Language:" format of acceptable locales
     * @param availableLocales list of available locales. One of these will be returned.
     * @param fallback if non-null, a 1-element array containing a boolean to be set with the fallback status
     * @return one of the locales from the availableLocales list, or null if none match
     * @stable ICU 3.4
     */

     public static ULocale acceptLanguage(String acceptLanguageList, ULocale[] availableLocales,
                                          boolean[] fallback) {
         if (acceptLanguageList == null) {
             throw new NullPointerException();
         }
         // Parse leniently; a header that still fails to parse means no match.
         final ULocale[] requested;
         try {
             requested = parseAcceptLanguage(acceptLanguageList, true);
         } catch (ParseException malformed) {
             return null;
         }
         if (requested == null) {
             return null;
         }
         // Hand the parsed array to the array-based overload.
         return acceptLanguage(requested, availableLocales, fallback);
     }

     /**
     * Based on a list of acceptable locales, determine an available locale for the user.
     * NullPointerException is thrown if acceptLanguageList or availableLocales is
     * null.  If fallback is non-null, it will contain true if a fallback locale (one
     * not in the acceptLanguageList) was returned.  The value on entry is ignored.
     * ULocale will be one of the locales in availableLocales, or the ROOT ULocale
     * if a ROOT locale was used as a fallback (because nothing else in
     * availableLocales matched).  No ULocale array element should be null; behavior
     * is undefined if this is the case.
     * @param acceptLanguageList list of acceptable locales
     * @param availableLocales list of available locales. One of these will be returned.
     * @param fallback if non-null, a 1-element array containing a boolean to be set with the fallback status
     * @return one of the locales from the availableLocales list, or null if none match
     * @stable ICU 3.4
     */

     public static ULocale acceptLanguage(ULocale[] acceptLanguageList, ULocale[] availableLocales,
                                          boolean[] fallback) {
         // Assume a fallback until an exact, as-requested match proves otherwise.
         if (fallback != null) {
             fallback[0] = true;
         }
         for (int a = 0; a < acceptLanguageList.length; a++) {
             ULocale candidate = acceptLanguageList[a];
             // True only while 'candidate' is the locale exactly as requested,
             // i.e. before walking up to any parent.
             boolean asRequested = true;
             do {
                 for (int k = 0; k < availableLocales.length; k++) {
                     ULocale available = availableLocales[k];
                     if (available.equals(candidate)) {
                         if (asRequested && fallback != null) {
                             fallback[0] = false; // first time with this locale - not a fallback.
                         }
                         return available;
                     }
                 }
                 // No match at this level: retry with the parent locale, if any.
                 Locale parent = LocaleUtility.fallback(candidate.toLocale());
                 candidate = (parent == null) ? null : new ULocale(parent);
                 asRequested = false; // later matches are fallbacks
             } while (candidate != null);
         }
         return null;
     }

    /**
     * Based on a HTTP formatted list of acceptable locales, determine an available locale for the user.
     * NullPointerException is thrown if acceptLanguageList or availableLocales is
     * null.  If fallback is non-null, it will contain true if a fallback locale (one
     * not in the acceptLanguageList) was returned.  The value on entry is ignored.
     * ULocale will be one of the locales in availableLocales, or the ROOT ULocale
     * if a ROOT locale was used as a fallback (because nothing else in
     * availableLocales matched).  No ULocale array element should be null; behavior
     * is undefined if this is the case.
     * This function will choose a locale from the ULocale.getAvailableLocales() list as available.
     * @param acceptLanguageList list in HTTP "Accept-Language:" format of acceptable locales
     * @param fallback if non-null, a 1-element array containing a boolean to be set with the fallback status
     * @return one of the locales from the ULocale.getAvailableLocales() list, or null if none match
     * @stable ICU 3.4
     */

     public static ULocale acceptLanguage(String acceptLanguageList, boolean[] fallback) {
         // Match against everything ULocale.getAvailableLocales() reports.
         final ULocale[] available = ULocale.getAvailableLocales();
         return acceptLanguage(acceptLanguageList, available, fallback);
     }

    /**
     * Based on an ordered array of acceptable locales, determine an available locale for the user.
     * NullPointerException is thrown if acceptLanguageList or availableLocales is
     * null.  If fallback is non-null, it will contain true if a fallback locale (one
     * not in the acceptLanguageList) was returned.  The value on entry is ignored.
     * ULocale will be one of the locales in availableLocales, or the ROOT ULocale
     * if a ROOT locale was used as a fallback (because nothing else in
     * availableLocales matched).  No ULocale array element should be null; behavior
     * is undefined if this is the case.
     * This function will choose a locale from the ULocale.getAvailableLocales() list as available.
     * @param acceptLanguageList ordered array of acceptable locales (preferred are listed first)
     * @param fallback if non-null, a 1-element array containing a boolean to be set with the fallback status
     * @return one of the locales from the ULocale.getAvailableLocales() list, or null if none match
     * @stable ICU 3.4
     */

     public static ULocale acceptLanguage(ULocale[] acceptLanguageList, boolean[] fallback) {
         // Match against everything ULocale.getAvailableLocales() reports.
         final ULocale[] available = ULocale.getAvailableLocales();
         return acceptLanguage(acceptLanguageList, available, fallback);
     }

     /**
      * Package local method used for parsing Accept-Language string
      * @internal ICU 3.8
      */
     static ULocale[] parseAcceptLanguage(String acceptLanguage, boolean isLenient) throws ParseException {
         /**
          * @internal ICU 3.4
          */
         class ULocaleAcceptLanguageQ implements Comparable {
             private double q;
             private double serial;
             public ULocaleAcceptLanguageQ(double theq, int theserial) {
                 q = theq;
                 serial = theserial;
             }
             public int compareTo(Object o) {
                 ULocaleAcceptLanguageQ other = (ULocaleAcceptLanguageQ) o;
                 if (q > other.q) { // reverse - to sort in descending order
                     return -1;
                 } else if (q < other.q) {
                     return 1;
                 }
                 if (serial < other.serial) {
                     return -1;
                 } else if (serial > other.serial) {
                     return 1;
                 } else {
                     return 0; // same object
                 }
             }
         }

         // parse out the acceptLanguage into an array
         TreeMap map = new TreeMap();
         StringBuffer languageRangeBuf = new StringBuffer();
         StringBuffer qvalBuf = new StringBuffer();
         int state = 0;
         acceptLanguage += ","; // append comma to simplify the parsing code
         int n;
         boolean subTag = false;
         boolean q1 = false;
         for (n = 0; n < acceptLanguage.length(); n++) {
             boolean gotLanguageQ = false;
             char c = acceptLanguage.charAt(n);
             switch (state) {
             case 0: // before language-range start
                 if (('A' <= c && c <= 'Z') || ('a' <= c && c <= 'z')) {
                     // in language-range
                     languageRangeBuf.append(c);
                     state = 1;
                     subTag = false;
                 } else if (c == '*') {
                     languageRangeBuf.append(c);
                     state = 2;
                 } else if (c != ' ' && c != '\t') {
                     // invalid character
                     state = -1;
                 }
                 break;
             case 1: // in language-range
                 if (('A' <= c && c <= 'Z') || ('a' <= c && c <= 'z')) {
                     languageRangeBuf.append(c);
                 } else if (c == '-') {
                     subTag = true;
                     languageRangeBuf.append(c);
                 } else if (c == '_') {
                     if (isLenient) {
                         subTag = true;
                         languageRangeBuf.append(c);
                     } else {
                         state = -1;
                     }
                 } else if ('0' <= c && c <= '9') {
                     if (subTag) {
                         languageRangeBuf.append(c);
                     } else {
                         // DIGIT is allowed only in language sub tag
                         state = -1;
                     }
                 } else if (c == ',') {
                     // language-q end
                     gotLanguageQ = true;
                 } else if (c == ' ' || c == '\t') {
                     // language-range end
                     state = 3;
                 } else if (c == ';') {
                     // before q
                     state = 4;
                 } else {
                     // invalid character for language-range
                     state = -1;
                 }
                 break;
             case 2: // saw wild card range
                 if (c == ',') {
                     // language-q end
                     gotLanguageQ = true;
                 } else if (c == ' ' || c == '\t') {
                     // language-range end
                     state = 3;
                 } else if (c == ';') {
                     // before q
                     state = 4;
                 } else {
                     // invalid
                     state = -1;
                 }
                 break;
             case 3: // language-range end
                 if (c == ',') {
                     // language-q end
                     gotLanguageQ = true;
                 } else if (c == ';') {
                     // before q
                     state =4;
                 } else if (c != ' ' && c != '\t') {
                     // invalid
                     state = -1;
                 }
                 break;
             case 4: // before q
                 if (c == 'q') {
                     // before equal
                     state = 5;
                 } else if (c != ' ' && c != '\t') {
                     // invalid
                     state = -1;
                 }
                 break;
             case 5: // before equal
                 if (c == '=') {
                     // before q value
                     state = 6;
                 } else if (c != ' ' && c != '\t') {
                     // invalid
                     state = -1;
                 }
                 break;
             case 6: // before q value
                 if (c == '0') {
                     // q value start with 0
                     q1 = false;
                     qvalBuf.append(c);
                     state = 7;
                 } else if (c == '1') {
                     // q value start with 1
                     qvalBuf.append(c);
                     state = 7;
                 } else if (c == '.') {
                     if (isLenient) {
                         qvalBuf.append(c);
                         state = 8;
                     } else {
                         state = -1;
                     }
                 } else if (c != ' ' && c != '\t') {
                     // invalid
                     state = -1;
                 }
                 break;
             case 7: // q value start
                 if (c == '.') {
                     // before q value fraction part
                     qvalBuf.append(c);
                     state = 8;
                 } else if (c == ',') {
                     // language-q end
                     gotLanguageQ = true;
                 } else if (c == ' ' || c == '\t') {
                     // after q value
                     state = 10;
                 } else {
                     // invalid
                     state = -1;
                 }
                 break;
             case 8: // before q value fraction part
                 if ('0' <= c || c <= '9') {
                     if (q1 && c != '0' && !isLenient) {
                         // if q value starts with 1, the fraction part must be 0
                         state = -1;
                     } else {
                         // in q value fraction part
                         qvalBuf.append(c);
                         state = 9;
                     }
                 } else {
                     // invalid
                     state = -1;
                 }
                 break;
             case 9: // in q value fraction part
                 if ('0' <= c && c <= '9') {
                     if (q1 && c != '0') {
                         // if q value starts with 1, the fraction part must be 0
                         state = -1;
                     } else {
                         qvalBuf.append(c);
                     }
                 } else if (c == ',') {
                     // language-q end
                     gotLanguageQ = true;
                 } else if (c == ' ' || c == '\t') {
                     // after q value
                     state = 10;
                 } else {
                     // invalid
                     state = -1;
                 }
                 break;
             case 10: // after q value
                 if (c == ',') {
                     // language-q end
                     gotLanguageQ = true;
                 } else if (c != ' ' && c != '\t') {
                     // invalid
                     state = -1;
                 }
                 break;
             }
             if (state == -1) {
                 // error state
                 throw new ParseException("Invalid Accept-Language", n);
             }
             if (gotLanguageQ) {
                 double q = 1.0;
                 if (qvalBuf.length() != 0) {
                     try {
                         q = Double.parseDouble(qvalBuf.toString());
                     } catch (NumberFormatException nfe) {
                         // Already validated, so it should never happen
                         q = 1.0;
                     }
                     if (q > 1.0) {
                         q = 1.0;
                     }
                 }
                 if (languageRangeBuf.charAt(0) != '*') {
                     int serial = map.size();
                     ULocaleAcceptLanguageQ entry = new ULocaleAcceptLanguageQ(q, serial);
                     map.put(entry, new ULocale(canonicalize(languageRangeBuf.toString()))); // sort in reverse order..   1.0, 0.9, 0.8 .. etc
                 }

                 // reset buffer and parse state
                 languageRangeBuf.setLength(0);
                 qvalBuf.setLength(0);
                 state = 0;
             }
         }
         if (state != 0) {
             // Well, the parser should handle all cases.  So just in case.
             throw new ParseException("Invalid AcceptlLanguage", n);
         }

         // pull out the map
         ULocale acceptList[] = (ULocale[])map.values().toArray(new ULocale[map.size()]);
         return acceptList;
     }

     // Placeholder subtags for "unknown" values.  parseTagString() and
     // createTagString() substitute UNDEFINED_LANGUAGE when no language is
     // available; parseTagString() maps UNDEFINED_SCRIPT and UNDEFINED_REGION
     // to the empty string.
     private static final String UNDEFINED_LANGUAGE = "und";
     private static final String UNDEFINED_SCRIPT = "Zzzz";
     private static final String UNDEFINED_REGION = "ZZ";

     /**
      * Add the likely subtags for a provided locale ID, per the algorithm described
      * in the following CLDR technical report:
      *
      *   http://www.unicode.org/reports/tr35/#Likely_Subtags
      *
      * If the provided ULocale instance is already in the maximal form, or there is no
      * data available for maximization, it will be returned.  For example,
      * "und-Zzzz" cannot be maximized, since there is no reasonable maximization.
      * Otherwise, a new ULocale instance with the maximal form is returned.
      *
      * Examples:
      *
      * "en" maximizes to "en_Latn_US"
      *
      * "de" maximizes to "de_Latn_DE"
      *
      * "sr" maximizes to "sr_Cyrl_RS"
      *
      * "sh" maximizes to "sr_Latn_RS" (Note this will not reverse.)
      *
      * "zh_Hani" maximizes to "zh_Hans_CN" (Note this will not reverse.)
      *
      * @param loc The ULocale to maximize
      * @return The maximized ULocale instance.
      * @stable ICU 4.0
      */
     public static ULocale
     addLikelySubtags(ULocale loc)
     {
         final String id = loc.localeID;

         // Split the ID into { language, script, region }.  The returned value
         // is the number of chars consumed, i.e. where the remainder starts.
         final String[] subtags = new String[3];
         final int restStart = parseTagString(id, subtags);

         // Whatever follows the region is carried over to the result.
         final String rest = restStart < id.length() ? id.substring(restStart) : null;

         final String maximized =
             createLikelySubtagsString(subtags[0], subtags[1], subtags[2], rest);

         // A null result means no likely-subtags entry matched, so the
         // caller gets the input instance back.
         if (maximized == null) {
             return loc;
         }
         return new ULocale(maximized);
     }

     /**
      * Minimize the subtags for a provided locale ID, per the algorithm described
      * in the following CLDR technical report:
      *
      *   http://www.unicode.org/reports/tr35/#Likely_Subtags
      *
      * If the provided ULocale instance is already in the minimal form, or there
      * is no data available for minimization, it will be returned.  Since the
      * minimization algorithm relies on proper maximization, see the comments
      * for addLikelySubtags for reasons why there might not be any data.
      *
      * Examples:
      *
      * "en_Latn_US" minimizes to "en"
      *
      * "de_Latn_DE" minimizes to "de"
      *
      * "sr_Cyrl_RS" minimizes to "sr"
      *
      * "zh_Hant_TW" minimizes to "zh_TW" (The region is preferred to the
      * script, and minimizing to "zh" would imply "zh_Hans_CN".)
      *
      * @param loc The ULocale to minimize
      * @return The minimized ULocale instance.
      * @stable ICU 4.0
      */
     public static ULocale
     minimizeSubtags(ULocale loc)
     {
         String[] tags = new String[3];

         int trailingIndex = parseTagString(loc.localeID, tags);

         String originalLang = tags[0];
         String originalScript = tags[1];
         String originalRegion = tags[2];
         String originalTrailing = null;

         if (trailingIndex < loc.localeID.length()) {
             // Everything after the language, script, and region.
             originalTrailing = loc.localeID.substring(trailingIndex);
         }

         // First get the maximization by adding any likely subtags.  The
         // trailing part is left out so that only the three subtags are compared.
         String maximizedLocaleID =
             createLikelySubtagsString(
                 originalLang,
                 originalScript,
                 originalRegion,
                 null);

         // If maximization fails, there's nothing we can do.
         if (isEmptyString(maximizedLocaleID)) {
             return loc;
         }

         // From here on maximizedLocaleID is non-null.  Each candidate below
         // may be null (createLikelySubtagsString returns null when no entry
         // matches), so the comparison is always made from the maximized side.

         // Start with just the language.
         String candidate =
             createLikelySubtagsString(
                 originalLang,
                 null,
                 null,
                 null);

         if (maximizedLocaleID.equals(candidate)) {
             return new ULocale(
                 createTagString(
                     originalLang,
                     null,
                     null,
                     originalTrailing));
         }

         // Next, try the language and region.
         if (originalRegion.length() != 0) {
             candidate =
                 createLikelySubtagsString(
                     originalLang,
                     null,
                     originalRegion,
                     null);

             if (maximizedLocaleID.equals(candidate)) {
                 return new ULocale(
                     createTagString(
                         originalLang,
                         null,
                         originalRegion,
                         originalTrailing));
             }
         }

         // Finally, try the language and script.  This is our last chance,
         // since trying with all three subtags would only yield the maximal
         // version that we already have.  Without a region, language + script
         // is just the original set of subtags, so that case is skipped.
         if (originalRegion.length() != 0 &&
             originalScript.length() != 0) {

             candidate =
                 createLikelySubtagsString(
                     originalLang,
                     originalScript,
                     null,
                     null);

             if (maximizedLocaleID.equals(candidate)) {
                 return new ULocale(
                     createTagString(
                         originalLang,
                         originalScript,
                         null,
                         originalTrailing));
             }
         }

         return loc;
     }

     /**
      * A trivial utility function that checks for a null
      * reference or checks the length of the supplied String.
      *
      *   @param string The string to check
      *
      *   @return true if the String is empty, or if the reference is null.
      */
     private static boolean isEmptyString(String string) {
         // A null reference counts as empty.
         if (string == null) {
             return true;
         }
         return string.length() == 0;
     }

     /**
      * Append a tag to a StringBuffer, adding the separator if necessary.  The tag must
      * not be a zero-length string.
      *
      * @param tag The tag to add.
      * @param buffer The output buffer.
      **/
     private static void
     appendTag(
         String tag,
         StringBuffer buffer) {

         // The first tag written to the buffer takes no leading separator.
         final boolean needsSeparator = buffer.length() > 0;
         if (needsSeparator) {
             buffer.append(UNDERSCORE);
         }
         buffer.append(tag);
     }

     /**
      * Create a tag string from the supplied parameters.  The lang, script and region
      * parameters may be null references.
      *
      * If any of the language, script or region parameters are empty, and the alternateTags
      * parameter is not null, it will be parsed for potential language, script and region tags
      * to be used when constructing the new tag.  If the alternateTags parameter is null, or
      * it contains no language tag, the default tag for the unknown language is used.
      *
      * @param lang The language tag to use.
      * @param script The script tag to use.
      * @param region The region tag to use.
      * @param trailing Any trailing data to append to the new tag.
      * @param alternateTags A string containing any alternate tags.
      * @return The new tag string.
      **/
     private static String
     createTagString(
         String lang,
         String script,
         String region,
         String trailing,
         String alternateTags) {

         // Created lazily, the first time a subtag has to be taken
         // from alternateTags.
         IDParser parser = null;
         boolean regionAppended = false;

         StringBuffer tag = new StringBuffer();

         // Language: explicit value, else the one in alternateTags, else "und".
         if (!isEmptyString(lang)) {
             appendTag(
                 lang,
                 tag);
         }
         else if (isEmptyString(alternateTags)) {
             /*
              * Append the value for an unknown language, if
              * we found no language.
              */
             appendTag(
                 UNDEFINED_LANGUAGE,
                 tag);
         }
         else {
             parser = new IDParser(alternateTags);

             String alternateLang = parser.getLanguage();

             /*
              * Append the value for an unknown language, if
              * we found no language.
              */
             appendTag(
                 !isEmptyString(alternateLang) ? alternateLang : UNDEFINED_LANGUAGE,
                 tag);
         }

         // Script: explicit value, else the one in alternateTags, else omitted.
         if (!isEmptyString(script)) {
             appendTag(
                 script,
                 tag);
         }
         else if (!isEmptyString(alternateTags)) {
             /*
              * Parse the alternateTags string for the script.
              */
             if (parser == null) {
                 parser = new IDParser(alternateTags);
             }

             String alternateScript = parser.getScript();

             if (!isEmptyString(alternateScript)) {
                 appendTag(
                     alternateScript,
                     tag);
             }
         }

         // Region: explicit value, else the one in alternateTags, else omitted.
         if (!isEmptyString(region)) {
             appendTag(
                 region,
                 tag);

             regionAppended = true;
         }
         else if (!isEmptyString(alternateTags)) {
             /*
              * Parse the alternateTags string for the region.
              */
             if (parser == null) {
                 parser = new IDParser(alternateTags);
             }

             String alternateRegion = parser.getCountry();

             if (!isEmptyString(alternateRegion)) {
                 appendTag(
                     alternateRegion,
                     tag);

                 regionAppended = true;
             }
         }

         if (trailing != null && trailing.length() > 1) {
             /*
              * The current ICU format expects two underscores
              * will separate the variant from the preceding
              * parts of the tag, if there is no region.
              *
              * Count the underscores that trailing starts with (0, 1 or 2).
              * Trailing data that starts with anything else, such as the
              * '@' that introduces keywords, has no separator to adjust
              * and is appended unchanged.
              */
             int separators = 0;

             if (trailing.charAt(0) == UNDERSCORE) {
                 separators = (trailing.charAt(1) == UNDERSCORE) ? 2 : 1;
             }

             if (regionAppended) {
                 /*
                  * If we appended a region, we may need to strip
                  * the extra separator from the variant portion.
                  */
                 if (separators == 2) {
                     tag.append(trailing.substring(1));
                 }
                 else {
                     tag.append(trailing);
                 }
             }
             else {
                 /*
                  * If we did not append a region, we may need to add
                  * an extra separator to the variant portion.
                  */
                 if (separators == 1) {
                     tag.append(UNDERSCORE);
                 }
                 tag.append(trailing);
             }
         }

         return tag.toString();
     }

     /**
      * Create a tag string from the supplied parameters.  The lang, script and region
      * parameters may be null references.  If the lang parameter is an empty string, the
      * default value for an unknown language is written to the output buffer.
      *
      * @param lang The language tag to use.
      * @param script The script tag to use.
      * @param region The region tag to use.
      * @param trailing Any trailing data to append to the new tag.
      * @return The new String.
      **/
     static String
     createTagString(
             String lang,
             String script,
             String region,
             String trailing) {

         // Delegate to the five-argument form with no alternate tags.
         final String noAlternateTags = null;
         return createTagString(lang, script, region, trailing, noAlternateTags);
     }

     /**
      * Parse the language, script, and region subtags from a tag string, and return the results.
      *
      * This function does not return the canonical strings for the unknown script and region.
      *
      * @param localeID The locale ID to parse.
      * @param tags An array of three String references to return the subtag strings.
      * @return The number of chars of the localeID parameter consumed.
      **/
     private static int
     parseTagString(
         String localeID,
         String tags[])
     {
         final IDParser idParser = new IDParser(localeID);

         final String parsedLang = idParser.getLanguage();
         final String parsedScript = idParser.getScript();
         final String parsedRegion = idParser.getCountry();

         // An empty language is reported as the undefined language; the
         // undefined script and region are reported as empty strings.
         tags[0] = isEmptyString(parsedLang) ? UNDEFINED_LANGUAGE : parsedLang;
         tags[1] = parsedScript.equals(UNDEFINED_SCRIPT) ? "" : parsedScript;
         tags[2] = parsedRegion.equals(UNDEFINED_REGION) ? "" : parsedRegion;

         final String parsedVariant = idParser.getVariant();

         if (isEmptyString(parsedVariant)) {
             // No variant: the consumed part ends at the keyword delimiter,
             // or at the end of the string when there are no keywords.
             final int keywordStart = localeID.indexOf('@');

             return keywordStart == -1 ? localeID.length() : keywordStart;
         }

         /*
          * There is a variant: return the index of the separator that
          * precedes it.
          *
          * $TODO(dbertoni) we need to take into account that we might
          * find a part of the language as the variant, since it can
          * have a variant portion that is long enough to contain
          * the same characters as the variant.
          */
         final int variantStart = localeID.indexOf(parsedVariant);

         return variantStart > 0 ? variantStart - 1 : variantStart;
     }

     private static String
     lookupLikelySubtags(String localeId) {
         final UResourceBundle likelySubtags =
             UResourceBundle.getBundleInstance(
                     ICUResourceBundle.ICU_BASE_NAME, "likelySubtags");

         String maximized;
         try {
             maximized = likelySubtags.getString(localeId);
         }
         catch (MissingResourceException missing) {
             // The bundle has no entry for this ID; report that as null.
             maximized = null;
         }
         return maximized;
     }

     private static String
     createLikelySubtagsString(
         String lang,
         String script,
         String region,
         String variants) {

         final boolean hasScript = !isEmptyString(script);
         final boolean hasRegion = !isEmptyString(region);

         // Lookups run from the most specific key to the least specific one.
         // On a hit, the language always comes from the matched entry, since
         // it may be more specific than the one provided; a script or region
         // that was not part of the lookup key is kept from the caller's
         // arguments, and createTagString() fills any empty one from the entry.
         String match;

         // 1. Language with script and region.
         if (hasScript && hasRegion) {
             match = lookupLikelySubtags(createTagString(lang, script, region, null));
             if (match != null) {
                 return createTagString(null, null, null, variants, match);
             }
         }

         // 2. Language with just the script.
         if (hasScript) {
             match = lookupLikelySubtags(createTagString(lang, script, null, null));
             if (match != null) {
                 return createTagString(null, null, region, variants, match);
             }
         }

         // 3. Language with just the region.
         if (hasRegion) {
             match = lookupLikelySubtags(createTagString(lang, null, region, null));
             if (match != null) {
                 return createTagString(null, script, null, variants, match);
             }
         }

         // 4. Just the language.
         match = lookupLikelySubtags(createTagString(lang, null, null, null));
         if (match != null) {
             return createTagString(null, script, region, variants, match);
         }

         // Nothing matched.
         return null;
     }

     // --------------------------------
     //      BCP47/OpenJDK APIs
     // --------------------------------

     /**
      * The key for private use locale extension.
      * @see #getExtension(char)
      * @see Builder#setExtension(char, String)
      *
      * @draft ICU 4.2
      * @provisional This API might change or be removed in a future release.
      */
     public static final char PRIVATE_USE_EXTENSION = 'x';

     /**
      * The key for LDML extension.
      * @see #getExtension(char)
      * @see Builder#setExtension(char, String)
      *
      * @draft ICU 4.2
      * @provisional This API might change or be removed in a future release.
      */
     public static final char LDML_EXTENSION = 'u';

     /**
      * Returns the extension associated with the specified extension key, or
      * null if there is no extension associated with the key.  The key must
      * be one of <code>[0-9A-Za-z]</code>.
      * <BR><STRONG>Note:</STRONG> Extension keys 'x' and 'X' are reserved for BCP47
      * private use.  To get the private use value, use <code>PRIVATE_USE_EXTENSION</code>.
      * <p>
      * @param key the extension key
      * @return the extension, or null if this locale
      * defines no extension for the specified key.
      * @throws IllegalArgumentException if the key is not valid.
      * @see #PRIVATE_USE_EXTENSION
      *
      * @draft ICU 4.2
      * @provisional This API might change or be removed in a future release.
      */
     public String getExtension(char key) {
         if (LocaleExtensions.isValidExtensionKey(key)) {
             return extensions().getExtensionValue(key);
         }
         // Keys rejected by the validity check are reported to the caller.
         throw new IllegalArgumentException("Invalid extension key: " + key);
     }

     /**
      * Returns the set of extension keys associated with this locale, or null
      * if it has no extensions.  The returned set is immutable.
      * @return the set of extension keys, or null if this locale has
      * no extensions.
      *
      * @draft ICU 4.2
      * @provisional This API might change or be removed in a future release.
      */
     public Set getExtensionKeys() {
         // Delegates to this locale's extensions object.
         Set extensionKeys = extensions().getExtensionKeys();
         return extensionKeys;
     }

     /**
      * Returns the LDML keyword value ('type') associated with
      * the specified LDML key for this locale.  LDML keywords are specified
      * by the 'u' extension and consist of key/type pairs.  The key must be
      * two alphanumeric characters in length, or an IllegalArgumentException
      * is thrown.
      * @param key the LDML key
      * @return the value ('type') associated with the key, or null if the
      * locale does not define a value for the key.
      * @throws IllegalArgumentException if the key is not valid.
      *
      * @draft ICU 4.2
      * @provisional This API might change or be removed in a future release.
      */
     public String getLDMLExtensionValue(String key) {
         if (LocaleExtensions.isValidLDMLKey(key)) {
             return extensions().getLDMLKeywordType(key);
         }
         // Keys rejected by the validity check are reported to the caller.
         throw new IllegalArgumentException("Invalid LDML key: " + key);
     }

     /**
      * Returns the set of keys for LDML keywords defined by this locale, or
      * null if this locale has no locale extension.  The returned set is
      * immutable.
      * @return The set of the LDML keys, or null
      *
      * @draft ICU 4.2
      * @provisional This API might change or be removed in a future release.
      */
     public Set getLDMLExtensionKeys() {
         // Delegates to this locale's extensions object.
         Set ldmlKeys = extensions().getLDMLKeywordKeys();
         return ldmlKeys;
     }

     /**
      * Returns a well-formed language tag representing this locale.
      * <p>
      * <b>Note</b>: If the language, country, or variant fields do
      * not satisfy BCP47 language tag syntax requirements, they are
      * omitted from the result.  For example, using the constructor it
      * is possible to create a Locale instance with digits in the
      * language field, or only two characters in the variant field.
      * Since these are not well-formed BCP47 language tag syntax, they
      * cannot be expressed in BCP47.  Since such 'legacy' locales lose
      * information when converting to BCP47, it is
      * recommended that clients switch to conforming locales.
      * <p>
      * <b>Note</b>: Underscores in the variant tag are normalized to
      * hyphen, and all fields, keys, and values are normalized to
      * lower case.
      * @return a BCP47 language tag representing the locale.
      *
      * @draft ICU 4.2
      * @provisional This API might change or be removed in a future release.
      */
     public String toLanguageTag() {
         // The tag is built from this locale's base fields and its extensions.
         String languageTag = LanguageTag.toLanguageTag(base(), extensions());
         return languageTag;
     }

     /**
      * Returns a locale for the specified language tag string.  If the
      * specified language tag contains any ill-formed subtags, the first
      * such subtag and all following subtags are ignored.
      * <p>
      * This implements the 'Language-Tag' production of BCP47, and so supports
      * grandfathered (regular and irregular) as well as private use language
      * tags.  Private use tags are represented as 'und-x-whatever', and
      * grandfathered tags are converted to their canonical replacements where
      * they exist.  Note that a few grandfathered tags have no modern replacement,
      * these will be converted using the fallback described in the first paragraph,
      * so some information might be lost.
      * <p>
      * For a list of grandfathered tags, see
      * <a href="http://www.ietf.org/internet-drafts/draft-ietf-ltru-4646bis-21.txt">
      * RFC4646</a>
      * (<span style="background-color: #00ccff; font-weight: bold">Currently Draft,
      * remove or reference final version before release.</span>)
      * @param langtag the language tag
      * @return the locale that best represents the language tag
      *
      * @draft ICU 4.2
      * @provisional This API might change or be removed in a future release.
      */
     public static ULocale forLanguageTag(String langtag) {
         // The candidate shrinks by one trailing subtag after every failed attempt.
         String candidate = langtag;

         for (;;) {
             try {
                 LanguageTag parsed = LanguageTag.parse(candidate);

                 Builder builder = new Builder();

                 // The language code "und" is not passed on to the builder.
                 String language = parsed.getLanguage();
                 if (!language.equals("und")) {
                     builder.setLanguage(language);
                 }

                 builder.setScript(parsed.getScript())
                     .setRegion(parsed.getRegion())
                     .setVariant(parsed.getVariant());

                 // setExtension may throw an exception if
                 // it contains malformed LDML keys.
                 Set extensionSet = parsed.getExtensions();
                 if (extensionSet != null) {
                     for (Iterator it = extensionSet.iterator(); it.hasNext();) {
                         Extension ext = (Extension)it.next();
                         builder.setExtension(ext.getSingleton(), ext.getValue());
                     }
                 }
                 builder.setExtension(PRIVATE_USE_EXTENSION, parsed.getPrivateUse());

                 return builder.create();
             } catch (LocaleSyntaxException e) {
                 // thrown by LanguageTag#parse - retry with a shorter tag below
             } catch (IllformedLocaleException e) {
                 // thrown by setExtension for malformed LDML keys -
                 // retry with a shorter tag below
             }

             // Remove the last subtag and try again.
             int lastHyphen = candidate.lastIndexOf('-');
             if (lastHyphen == -1) {
                 // No more subtags to drop: fall back to the root locale.
                 return ULocale.ROOT;
             }
             candidate = candidate.substring(0, lastHyphen);
         }
     }


     /**
      * Builder is used to build instances of ULocale from values
      * configured by the setters.
      * <p>
      * Builder supports the 'langtag' production of RFC 4646.
      * Language tags consist of the ASCII digits, upper and lower case
      * letters, and hyphen (which appears only as a field separator).
      * As a convenience, underscores are accepted and normalized to
      * hyphens.  Values with any other character are ill-formed.  Since
      * language tags are case-insensitive, they are normalized
      * to lower case; case distinctions are <b>not</b>
      * preserved by the builder.
      * <p>
      * Note that since this implements 'langtag' and not 'Language-Tag',
      * grandfathered language tags are not supported by the builder.
      * Clients should use {@link #forLanguageTag} instead.
      * <p>
      * Builders can be reused; <code>clear()</code> resets all fields
      * to their default values.
      * @see Builder#create
      * @see Builder#clear
      *
      * @draft ICU 4.2
      * @provisional This API might change or be removed in a future release.
      */
     public static final class Builder {

         // All state lives in the internal builder; this class only adapts
         // its LocaleSyntaxException to the public IllformedLocaleException.
         private final InternalLocaleBuilder _locbld = new InternalLocaleBuilder();

         /**
          * Constructs an empty Builder.
          * The default values of all fields, extensions, and private
          * use information are empty, the language is undefined.
          *
          * @draft ICU 4.2
          * @provisional This API might change or be removed in a future release.
          */
         public Builder() {
         }

         /**
          * Resets the builder to match the provided locale.  The previous state
          * of the builder is discarded.  Fields that do not
          * conform to BCP47 syntax are ill-formed.
          * @param loc the locale
          * @return this builder
          * @throws IllformedLocaleException if <code>loc</code> has any ill-formed
          * fields.
          *
          * @draft ICU 4.2
          * @provisional This API might change or be removed in a future release.
          */
         public Builder setLocale(ULocale loc) {
             clear();
             setLanguage(loc.getLanguage())
                 .setScript(loc.getScript())
                 .setRegion(loc.getCountry())
                 .setVariant(loc.getVariant());

             Set extKeys = loc.getExtensionKeys();
             if (extKeys != null) {
                 Iterator itr = extKeys.iterator();
                 while (itr.hasNext()) {
                     char key = ((Character)itr.next()).charValue();
                     String value = loc.getExtension(key);
                     // an empty value would remove the extension, so skip it
                     if (value != null && value.length() > 0) {
                         setExtension(key, value);
                     }
                 }
             }
             return this;
         }

         /**
          * Resets the builder to match the provided language tag.  The previous state
          * of the builder is discarded.  A language subtag of "und" leaves the
          * language field empty, as {@link ULocale#forLanguageTag(String)} does.
          * <p>
          * If <code>langtag</code> cannot be parsed, the builder is left unchanged.
          * If the tag parses but one of its fields is rejected afterwards (for
          * example an extension with malformed LDML keys), the builder may be
          * left partially populated.
          * @param langtag the language tag
          * @return this builder
          * @throws IllformedLocaleException if <code>langtag</code> is ill-formed.
          * @see #forLanguageTag(String)
          *
          * @draft ICU 4.2
          * @provisional This API might change or be removed in a future release.
          */
         public Builder setLanguageTag(String langtag) {
             // Parse first: a syntactically ill-formed tag must not wipe the
             // state the caller has already configured.
             LanguageTag tag = null;
             try {
                 tag = LanguageTag.parse(langtag);
             } catch (LocaleSyntaxException e) {
                 throw new IllformedLocaleException(e.getMessage(), e.getErrorIndex());
             }
             clear();

             // base locale fields - do nothing with language code "und",
             // consistent with forLanguageTag
             String language = tag.getLanguage();
             if (!language.equals("und")) {
                 setLanguage(language);
             }
             setScript(tag.getScript())
                 .setRegion(tag.getRegion()).setVariant(tag.getVariant());

             // extensions
             Set exts = tag.getExtensions();
             if (exts != null) {
                 Iterator itr = exts.iterator();
                 while (itr.hasNext()) {
                     Extension e = (Extension)itr.next();
                     setExtension(e.getSingleton(), e.getValue());
                     //TODO: setExtension may throw an IllformedLocaleException.
                     //      In this case, error index must be recalculated.
                 }
             }
             // private use
             setExtension(PRIVATE_USE_EXTENSION, tag.getPrivateUse());
             return this;
         }

         /**
          * Sets the language.  If language is the empty string,
          * the language is defaulted.  Language should be a two or
          * three-letter language code as defined in ISO639.
          * Well-formed values are any string of two to eight ASCII letters.
          * @param language the language
          * @return this builder
          * @throws IllformedLocaleException if <code>language</code> is ill-formed
          *
          * @draft ICU 4.2
          * @provisional This API might change or be removed in a future release.
          */
         public Builder setLanguage(String language) {
             try {
                 _locbld.setLanguage(language);
             } catch (LocaleSyntaxException e) {
                 throw new IllformedLocaleException(e.getMessage(), e.getErrorIndex());
             }
             return this;
         }

         /**
          * Sets the script.  If script is
          * the empty string, the script is defaulted.  Scripts should
          * be a four-letter script code as defined in ISO 15924.
          * Well-formed values are any string of four ASCII letters.
          * @param script the script
          * @return this builder
          * @throws IllformedLocaleException if <code>script</code> is ill-formed
          *
          * @draft ICU 4.2
          * @provisional This API might change or be removed in a future release.
          */
         public Builder setScript(String script) {
             try {
                 _locbld.setScript(script);
             } catch (LocaleSyntaxException e) {
                 throw new IllformedLocaleException(e.getMessage(), e.getErrorIndex());
             }
             return this;
         }

         /**
          * Sets the region.  If region is
          * the empty string, the region is defaulted.  Regions should
          * be a two-letter ISO 3166 code or a three-digit M. 49 code.
          * Well-formed values are any two-letter or three-digit
          * string.
          * @param region the region
          * @return this builder
          * @throws IllformedLocaleException if <code>region</code> is ill-formed
          *
          * @draft ICU 4.2
          * @provisional This API might change or be removed in a future release.
          */
         public Builder setRegion(String region) {
             try {
                 _locbld.setRegion(region);
             } catch (LocaleSyntaxException e) {
                 throw new IllformedLocaleException(e.getMessage(), e.getErrorIndex());
             }
             return this;
         }

         /**
          * Sets the variant.  If variant is
          * the empty string, the variant is defaulted.  Variants
          * should be registered variants (see
          * <a href="http://www.iana.org/assignments/language-subtag-registry">
          * IANA Language Subtag Registry</a>) for the prefix.  Well-formed
          * variants are any series of fields of either four characters
          * starting with a digit, or five to eight alphanumeric
          * characters, separated by hyphen or underscore.
          * @param variant the variant
          * @return this builder
          * @throws IllformedLocaleException if <code>variant</code> is ill-formed
          *
          * @draft ICU 4.2
          * @provisional This API might change or be removed in a future release.
          */
         public Builder setVariant(String variant) {
             try {
                 _locbld.setVariant(variant);
             } catch (LocaleSyntaxException e) {
                 throw new IllformedLocaleException(e.getMessage(), e.getErrorIndex());
             }
             return this;
         }

         /**
          * Sets the extension for the given key.  If the value is
          * the empty string, the extension is removed.  Legal
          * keys are the characters <code>[0-9A-WY-Za-wy-z]</code>.  Well-formed
          * values are any series of fields of two to eight
          * alphanumeric characters, separated by hyphen or underscore.
          * <p>
          * <b>Note</b>: The extension 'u' is used for LDML Keywords.
          * Setting the 'u' extension replaces any existing LDML
          * keywords with those defined in the extension.  To be
          * well-formed, a value for the 'u' extension must meet the
          * additional constraint that the number of fields be even
          * (fields represent key value pairs, where the value is
          * mandatory), and that the keys and values be legal locale
          * extension keys and values.
          * @param key the extension key
          * @param value the extension value
          * @return this builder
          * @throws IllformedLocaleException if <code>key</code> is illegal
          * or <code>value</code> is ill-formed
          * @see #setLDMLExtensionValue
          *
          * @draft ICU 4.2
          * @provisional This API might change or be removed in a future release.
          */
         public Builder setExtension(char key, String value) {
             try {
                 _locbld.setExtension(key, value);
             } catch (LocaleSyntaxException e) {
                 throw new IllformedLocaleException(e.getMessage(), e.getErrorIndex());
             }
             return this;
         }

         /**
          * Sets the LDML keyword value ('type') for the given key.  If the
          * value is the empty string, the LDML keyword is removed.
          * Well-formed keys are strings of two alphanumeric characters. Well-formed
          * values are strings of three to eight alphanumeric characters.
          * <p>
          * <b>Note</b>: Setting the 'u' extension replaces all LDML
          * keywords with those defined in the extension.
          * @param key the LDML extension key
          * @param value the LDML extension value
          * @return this builder
          * @throws IllformedLocaleException if <code>key</code> or <code>value</code>
          * is ill-formed
          * @see #setExtension(char, String)
          *
          * @draft ICU 4.2
          * @provisional This API might change or be removed in a future release.
          */
         public Builder setLDMLExtensionValue(String key, String value) {
             try {
                 _locbld.setLDMLExtensionValue(key, value);
             } catch (LocaleSyntaxException e) {
                 throw new IllformedLocaleException(e.getMessage(), e.getErrorIndex());
             }
             return this;
         }

         /**
          * Resets the builder to its initial, default state.
          * @return this builder
          *
          * @draft ICU 4.2
          * @provisional This API might change or be removed in a future release.
          */
         public Builder clear() {
             _locbld.clear();
             return this;
         }

         /**
          * Resets the extensions to their initial, default state.
          * Language, script, region and variant are unchanged.
          * @return this builder
          * @see #setExtension(char, String)
          *
          * @draft ICU 4.2
          * @provisional This API might change or be removed in a future release.
          */
         public Builder clearExtensions() {
             _locbld.removeLocaleExtensions();
             return this;
         }

         /**
          * Returns an instance of locale created from the fields set
          * on this builder.
          * @return a new locale
          *
          * @draft ICU 4.2
          * @provisional This API might change or be removed in a future release.
          */
         public ULocale create() {
             return getInstance(_locbld.getBaseLocale(), _locbld.getLocaleExtensions());
         }
     }

     /**
      * Builds a ULocale from a base locale and a set of extensions by
      * assembling a legacy locale ID string: the base ID followed, when there
      * is at least one keyword, by "@key=value;key=value...".
      */
     private static ULocale getInstance(BaseLocale base, LocaleExtensions ext) {
         StringBuffer localeID = new StringBuffer(base.getID());

         Set extensionKeys = ext.getExtensionKeys();
         if (extensionKeys == null) {
             // no extensions at all - the base ID is the whole locale ID
             return new ULocale(localeID.toString());
         }

         // The legacy locale ID puts LDML keywords and the other extensions
         // at the same level, e.g.
         // @a=ext-for-aa;calendar=japanese;m=ext-for-mm;x=priv-use
         // A TreeMap keeps the keywords sorted by key.
         TreeMap keywords = new TreeMap();

         // pass 1: every extension except 'u' becomes a one-letter keyword
         boolean sawLDMLExtension = false;
         for (Iterator it = extensionKeys.iterator(); it.hasNext();) {
             Character singleton = (Character)it.next();
             if (singleton.charValue() == 'u') {
                 // LDML keywords are expanded individually in pass 2
                 sawLDMLExtension = true;
             } else {
                 String extValue = ext.getExtensionValue(singleton.charValue());
                 keywords.put(String.valueOf(singleton), extValue);
             }
         }

         // pass 2: LDML keywords, converted from BCP47 to legacy key/type
         if (sawLDMLExtension) {
             Set ldmlKeys = ext.getLDMLKeywordKeys();
             if (ldmlKeys != null) {
                 for (Iterator it = ldmlKeys.iterator(); it.hasNext();) {
                     String bcpKey = (String)it.next();
                     String bcpType = ext.getLDMLKeywordType(bcpKey);
                     String legacyKey = bcp47ToLDMLKey(bcpKey);
                     String legacyType = bcp47ToLDMLType(legacyKey, bcpType);
                     keywords.put(legacyKey, legacyType);
                 }
             }
         }

         // append "@k=v" for the first keyword and ";k=v" for the others
         if (!keywords.isEmpty()) {
             char separator = '@';
             for (Iterator it = keywords.entrySet().iterator(); it.hasNext();) {
                 Map.Entry keyword = (Map.Entry)it.next();
                 localeID.append(separator);
                 localeID.append(keyword.getKey());
                 localeID.append('=');
                 localeID.append(keyword.getValue());
                 separator = ';';
             }
         }

         return new ULocale(localeID.toString());
     }

     /**
      * Returns the BaseLocale made of this locale's language, script, country
      * and variant.  The root locale is given an empty language.
      */
     private BaseLocale base() {
         final String ownLanguage = getLanguage();
         final String language = equals(ULocale.ROOT) ? "" : ownLanguage;
         final String script = getScript();
         final String region = getCountry();
         final String variant = getVariant();
         return BaseLocale.getInstance(language, script, region, variant);
     }

     /**
      * Converts this locale's keywords into a LocaleExtensions object.
      * One-letter keywords are kept as extensions as they are; all other
      * keywords are treated as LDML keywords, mapped to their BCP47 key and
      * type, and additionally combined into the 'u' extension string.
      */
     private LocaleExtensions extensions() {
         Iterator keywordIter = getKeywords();
         if (keywordIter == null) {
             return LocaleExtensions.EMPTY_EXTENSIONS;
         }

         // both maps are created lazily and stay null when they have no entries
         TreeMap singletonExts = null;
         TreeMap ldmlKeywords = null;

         while (keywordIter.hasNext()) {
             String legacyKey = (String)keywordIter.next();
             String legacyValue = getKeywordValue(legacyKey);

             if (legacyKey.length() != 1) {
                 // LDML keyword - store under its BCP47 key and type
                 String bcpKey = ldmlKeyToBCP47(legacyKey);
                 String bcpType = ldmlTypeToBCP47(legacyKey, legacyValue);
                 if (ldmlKeywords == null) {
                     ldmlKeywords = new TreeMap();
                 }
                 ldmlKeywords.put(bcpKey.intern(), bcpType.intern());
                 continue;
             }

             // single letter: non LDML extension or private use
             if (singletonExts == null) {
                 singletonExts = new TreeMap();
             }
             singletonExts.put(new Character(legacyKey.charAt(0)), legacyValue.intern());
         }

         if (ldmlKeywords != null) {
             // serialize the LDML keywords as the value of the 'u' extension
             StringBuffer ldmlExtension = new StringBuffer();
             LocaleExtensions.keywordsToString(ldmlKeywords, ldmlExtension);
             if (singletonExts == null) {
                 singletonExts = new TreeMap();
             }
             singletonExts.put(new Character('u'), ldmlExtension.toString().intern());
         }

         return LocaleExtensions.getInstance(singletonExts, ldmlKeywords);
     }

     //
     // LDML legacy/BCP47 key and type mapping functions
     //
     /**
      * Maps a legacy LDML keyword key to its BCP47 key using the
      * "bcp47KeywordMappings"/"key" table of the supplementalData bundle.
      * The key is lowercased first.  A key with no mapping is returned
      * lowercased if it is exactly two characters long; otherwise an
      * IllegalArgumentException is thrown.
      */
     private static String ldmlKeyToBCP47(String key) {
         UResourceBundle keyMaps = UResourceBundle.getBundleInstance(
                     ICUResourceBundle.ICU_BASE_NAME,
                     "supplementalData",
                     ICUResourceBundle.ICU_DATA_CLASS_LOADER)
                 .get("bcp47KeywordMappings")
                 .get("key");

         // lookups are done on the lowercase form of the key
         String lowerKey = AsciiUtil.toLowerString(key);

         try {
             String mapped = keyMaps.getString(lowerKey);
             if (mapped != null) {
                 return mapped;
             }
         } catch (MissingResourceException mre) {
             // no mapping for this key - handled below
         }

         // an unmapped two-character key is passed through unchanged
         if (lowerKey.length() == 2) {
             return lowerKey;
         }
         throw new IllegalArgumentException("Unknown LDML key name: " + lowerKey);
     }

     /**
      * Maps a BCP47 keyword key back to its legacy LDML key by searching the
      * "bcp47KeywordMappings"/"key" table of the supplementalData bundle for
      * an entry whose value equals the lowercased BCP47 key.  When there is
      * no such entry, the lowercased BCP47 key itself is returned.
      */
     private static String bcp47ToLDMLKey(String bcpKey) {
         UResourceBundle keyMaps = UResourceBundle.getBundleInstance(
                     ICUResourceBundle.ICU_BASE_NAME,
                     "supplementalData",
                     ICUResourceBundle.ICU_DATA_CLASS_LOADER)
                 .get("bcp47KeywordMappings")
                 .get("key");

         // comparisons are done on the lowercase form of the BCP47 key
         String wanted = AsciiUtil.toLowerString(bcpKey);

         // the table is keyed by legacy key, so the reverse lookup is a scan
         for (int idx = 0; idx < keyMaps.getSize(); idx++) {
             UResourceBundle entry = keyMaps.get(idx);
             if (wanted.equals(entry.getString())) {
                 String legacyKey = entry.getKey();
                 return (legacyKey == null) ? wanted : legacyKey;
             }
         }
         return wanted;
     }

     /**
      * Maps a legacy LDML keyword type to its BCP47 type using the table
      * named after the (lowercased) key under "bcp47KeywordMappings" in the
      * supplementalData bundle.  For the "timezone" key, every "/" in the
      * type is replaced by ":" before the lookup.
      *
      * @param key the legacy LDML keyword key
      * @param type the legacy LDML keyword type
      * @return the mapped BCP47 type, or the lowercased <code>type</code>
      * itself when no mapping exists and it is three to eight characters long
      * @throws IllegalArgumentException if no mapping exists and the
      * lowercased type is shorter than three or longer than eight characters
      */
     private static String ldmlTypeToBCP47(String key, String type) {
         UResourceBundle supplemental = UResourceBundle.getBundleInstance(
                                             ICUResourceBundle.ICU_BASE_NAME,
                                             "supplementalData",
                                             ICUResourceBundle.ICU_DATA_CLASS_LOADER);
         UResourceBundle bcp47Mappings = supplemental.get("bcp47KeywordMappings");

         // normalize key/type to lowercase
         key = AsciiUtil.toLowerString(key);
         type = AsciiUtil.toLowerString(type);
         String bcpType = null;
         try {
             UResourceBundle typeMaps = bcp47Mappings.get(key);
             // time zone IDs are looked up with ':' in place of '/'
             String tmp = key.equals("timezone") ? Utility.replaceAll(type, "/", ":") : type;
             bcpType = typeMaps.getString(tmp);
         } catch (MissingResourceException mre) {
             // no table for this key, or no entry for this type - fall through
         }

         if (bcpType == null) {
             // an unmapped type is passed through if its length is 3 to 8
             int typeLen = type.length();
             if (typeLen >= 3 && typeLen <= 8) {
                 return type;
             }
             // report the offending type (the original message printed the key)
             throw new IllegalArgumentException("Unknown LDML type name: " + type);
         }
         return bcpType;
     }

     /**
      * Maps a BCP47 keyword type back to its legacy LDML type by searching
      * the table named after the (lowercased) key under
      * "bcp47KeywordMappings" in the supplementalData bundle for an entry
      * whose value equals the lowercased BCP47 type.  For the "timezone" key,
      * every ":" in the legacy type found is replaced by "/".  When the key
      * has no table or no entry matches, the lowercased BCP47 type itself is
      * returned.
      */
     private static String bcp47ToLDMLType(String key, String bcpType) {
         UResourceBundle bcp47Mappings = UResourceBundle.getBundleInstance(
                     ICUResourceBundle.ICU_BASE_NAME,
                     "supplementalData",
                     ICUResourceBundle.ICU_DATA_CLASS_LOADER)
                 .get("bcp47KeywordMappings");

         // lookups are done on the lowercase forms of key and type
         String lowerKey = AsciiUtil.toLowerString(key);
         String lowerType = AsciiUtil.toLowerString(bcpType);

         try {
             UResourceBundle typeMaps = bcp47Mappings.get(lowerKey);

             // Note:    Linear search for time zone ID might be too slow.
             //          ICU services do not use timezone keywords for now.
             //          In future, we may need to build the optimized inverse
             //          lookup table.

             for (int idx = 0; idx < typeMaps.getSize(); idx++) {
                 UResourceBundle entry = typeMaps.get(idx);
                 if (!lowerType.equals(entry.getString())) {
                     continue;
                 }
                 String legacyType = entry.getKey();
                 if (lowerKey.equals("timezone")) {
                     legacyType = Utility.replaceAll(legacyType, ":", "/");
                 }
                 return (legacyType == null) ? lowerType : legacyType;
             }
         } catch (MissingResourceException mre) {
             // no table for this key - handled below
         }

         // nothing matched: the BCP47 type is returned as the legacy type
         return lowerType;
     }
 }