// data/root.txt - external/github.com/unicode-org/icu - Git at Google

 // *******************************************************************************
 // *
 // *   Copyright (C) 1997-2001, International Business Machines
 // *   Corporation and others.  All Rights Reserved.
 // *
 // *******************************************************************************
 //  Date        Name        Description
 //  11/17/99    aliu        Added support for transliterators.

 // Please search for 'DUP FIXME' - duplicate lang/country names commented out


 root {
     // version string carried by this root resource data
     Version { "3.1.1" }

     // each variant name that occurs in locales should be listed with %% and a display string
     "%%EURO" { "Euro" }         // Euro variant display name
     "%%B"    { "Bokm\u00e5l" }  // Norwegian variant display name (escape is U+00E5, a with ring)
     "%%NY"   { "Nynorsk" }      // Norwegian variant display name
     "%%AL"   { "\u00C5land" }   // Aland variant display name (escape is U+00C5, A with ring)

     "%%POSIX" { "POSIX" }       // POSIX variant display name

     // variants for collation (traditional may also be used for traditional chinese)
     "%%PHONEBOOK" { "Phonebook Order" }
     "%%PINYIN" { "Pinyin Order" }
     "%%TRADITIONAL" { "Traditional" }
     "%%STROKE" { "Stroke Order" }
     "%%DIRECT" { "Direct Order" }

     // this is a special tag that makes genrb include UCARules.txt for collation;
     // unlike the entries above, its value is a file name rather than a display string
     "%%UCARULES" { "UCARules.txt"} // UCARules

     // no collation elements any more
     // CollationElements {
     //	    Version { "1.0" }
     //		Override { "FALSE" }
     //		Sequence { "" }
     // }
     // Formats for the display name of a locale, for a list of
     // items, and for composing two items in a list into one item.
     // The list patterns are used in the variant name and in the
     // full display name.
     //
     // This is the language-neutral form of this resource.
     //
     // The resource holds a single unnamed array of three patterns, in this
     // order: display name, list, list composition.  In the first two,
     // argument {0} drives a choice: 0 selects the empty string, 1 selects
     // {1} alone, and higher values select the forms that add {2} (and {3}).
     LocaleNamePatterns {
          {
             "{0,choice,0#|1#{1}|2#{1} ({2})}", // Display name: "{1}" or "{1} ({2})"
             "{0,choice,0#|1#{1}|2#{1},{2}|3#{1},{2},{3}}", // List: up to three comma-separated items
             "{0},{1}" // List composition: joins two items with a comma
          }
     }

     //------------------------------------------------------------
     // BEGIN Transliterator support
     //------------------------------------------------------------

     // See also icu/data/translit/index.txt

     TransliteratorNamePattern {
         // Format for the display name of a Transliterator.
         // This is the language-neutral form of this resource.
         // Argument {0} drives a choice: 0 selects the empty string,
         // 1 selects "{1}", and 2 selects "{1}-{2}".
         "{0,choice,0#|1#{1}|2#{1}-{2}}" // Display name
     }

     //------------------------------------------------------------
     // END Transliterator support
     //------------------------------------------------------------

     //------------------------------------------------------------
     // BEGIN BreakIterator support
     //------------------------------------------------------------

     // default rules for finding character boundaries
     CharacterBreakRules {
         // ignore non-spacing marks and enclosing marks (since we never
         // put a break before ignore characters, this keeps combining
         // accents with the base characters they modify)
         "$ignore=[[:Mn:][:Me:]];"

         // other category definitions: the three ranges of conjoining
         // Hangul jamo, and the high and low surrogate ranges
         "choseong=[\u1100-\u115f];"
         "jungseong=[\u1160-\u11a7];"
         "jongseong=[\u11a8-\u11ff];"
         "surr-hi=[\ud800-\udbff];"
         "surr-lo=[\udc00-\udfff];"

         // break after every character, except as follows:
         ".;"

         // keep CRLF sequences together
         "\r\n;"

         // keep surrogate pairs together
         "{surr-hi}{surr-lo};"

         // keep Hangul syllables spelled out using conjoining jamo together
         "{choseong}*{jungseong}*{jongseong}*;"

         // various additions for Hindi support
         "nukta=[\u093c];"
         "danda=[\u0964\u0965];"
         "virama=[\u094d];"
         "devVowelSign=[\u093e-\u094c\u0962\u0963];"
         "devConsonant=[\u0915-\u0939];"
         "devNuktaConsonant=[\u0958-\u095f];"
         "devCharEnd=[\u0902\u0903\u0951-\u0954];"
         "zwj=[\u200d];"

         // a consonant with an optional nukta
         "devCAMN=({devConsonant}{nukta}?);"
         // either a precomposed nukta consonant or a consonant-plus-nukta sequence
         "devConsonant1=({devNuktaConsonant}|{devCAMN});"
         // a consonant, optionally preceded by one consonant + virama (+ optional ZWJ)
         "devConjunct=(({devConsonant1}{virama}{zwj}?)?{devConsonant1});"

         // keep a conjunct together with its optional vowel sign and optional
         // character-end mark
         "{devConjunct}{devVowelSign}?{devCharEnd}?;"
         // keep a danda together with a following nukta
         "{danda}{nukta};"
     }

     // default rules for finding word boundaries
     WordBreakRules {
         // ignore non-spacing marks, enclosing marks, and format characters,
         // all of which should not influence the algorithm
         "$ignore=[[:Mn:][:Me:][:Cf:]];"

         // Hindi phrase separator, kanji, katakana, hiragana, CJK diacriticals,
         // other letters, and digits
         "danda=[\u0964\u0965];"
         "kanji=[\u3005\u4e00-\u9fa5\uf900-\ufa2d];"
         "kata=[\u3099-\u309c\u30a1-\u30fe];"
         "hira=[\u3041-\u309e\u30fc];"
         "let=[[[:L:][:Mc:]]-[{kanji}{kata}{hira}]];"
         "dgt=[:N:];"

         // punctuation that can occur in the middle of a word: currently
         // dashes, the soft hyphen (U+00AD), the hyphenation point (U+2027),
         // apostrophes, quotation marks, and periods
         "mid-word=[[:Pd:]\u00ad\u2027\\\"\\\'\\.];"

         // punctuation that can occur in the middle of a number: currently
         // apostrophes, quotation marks, periods, commas, and the Arabic
         // decimal point
         "mid-num=[\\\"\\\'\\,\u066b\\.];"

         // punctuation that can occur at the beginning of a number: currently
         // the period, the number sign, and all currency symbols except the cents sign
         "pre-num=[[[:Sc:]-[\u00a2]]\\#\\.];"

         // punctuation that can occur at the end of a number: currently
         // the percent, per-thousand, per-ten-thousand, and Arabic percent
         // signs, the cents sign, and the ampersand
         "post-num=[\\%\\&\u00a2\u066a\u2030\u2031];"

         // line separators: currently LF, FF, PS, and LS
         "ls=[\n\u000c\u2028\u2029];"

         // whitespace: all space separators and the tab character
         "ws=[[:Zs:]\t];"

         // a word is a sequence of letters that may contain internal
         // punctuation, as long as it begins and ends with a letter and
         // never contains two punctuation marks in a row
         // (a single trailing danda is also allowed)
         "word=({let}+({mid-word}{let}+)*{danda}?);"

         // a number is a sequence of digits that may contain internal
         // punctuation, as long as it begins and ends with a digit and
         // never contains two punctuation marks in a row.
         "number=({dgt}+({mid-num}{dgt}+)*);"

         // break after every character, with the following exceptions
         // (this will cause punctuation marks that aren't considered
         // part of words or numbers to be treated as words unto themselves)
         ".;"

         // keep together any sequence of contiguous words and numbers
         // (including just one of either), plus an optional trailing
         // number-suffix character
         "{word}?({number}{word})*({number}{post-num}?)?;"

         // keep together any sequence of contiguous words and numbers
         // that starts with a number-prefix character and a number,
         // and may end with a number-suffix character
         "{pre-num}({number}{word})*({number}{post-num}?)?;"

         // keep together runs of whitespace (optionally with a single trailing
         // line separator or CRLF sequence)
         "{ws}*\r?{ls}?;"

         // keep together runs of Katakana
         "{kata}*;"

         // keep together runs of Hiragana
         "{hira}*;"

         // keep together runs of Kanji
         "{kanji}*;"
     }

     // default rules for determining legal line-breaking positions
     LineBreakRules {
         // ignore non-spacing marks, enclosing marks, and format characters
         "$ignore=[[:Mn:][:Me:][:Cf:]];"

         // Hindi phrase separators
         "danda=[\u0964\u0965];"

         // characters that always cause a break: ETX, tab, LF, FF, LS, and PS
         "break=[\u0003\t\n\f\u2028\u2029];"

         // characters that always prevent a break: the non-breaking space
         // and similar characters
         "nbsp=[\u00a0\u2007\u2011\ufeff];"

         // whitespace: space separators and control characters, except for
         // CR and the other characters mentioned above
         "space=[[[:Zs:][:Cc:]]-[{nbsp}{break}\r]];"

         // dashes: dash punctuation and the discretionary hyphen, except for
         // non-breaking hyphens
         "dash=[[[:Pd:]\u00ad]-[{nbsp}]];"

         // characters that stick to a word if they precede it: currency symbols
         // (except the cents sign), starting punctuation, and the quote marks
         "pre-word=[[[:Sc:]-[\u00a2]][:Ps:]\\\"\\\'];"

         // characters that stick to a word if they follow it: ending punctuation,
         // other punctuation that usually occurs at the end of a sentence,
         // small Kana characters, some CJK diacritics, etc.
         // (the definition is one string split across several adjacent literals)
         "post-word=[[:Pe:]\\!\\\"\\\'\\%\\.\\,\\:\\;\\?\u00a2\u00b0\u066a\u2030-\u2034"
                 "\u2103\u2105\u2109\u3001\u3002\u3005\u3041\u3043\u3045\u3047\u3049\u3063"
                 "\u3083\u3085\u3087\u308e\u3099-\u309e\u30a1\u30a3\u30a5\u30a7\u30a9"
                 "\u30c3\u30e3\u30e5\u30e7\u30ee\u30f5\u30f6\u30fc-\u30fe\uff01\uff0c"
                 "\uff0e\uff1f];"

         // Kanji: actually includes both Kanji and Kana, except for small Kana and
         // CJK diacritics
         "kanji=[[\u4e00-\u9fa5\uf900-\ufa2d\u3041-\u3094\u30a1-\u30fa]-[{post-word}{$ignore}]];"

         // digits
         "digit=[[:Nd:][:No:]];"

         // punctuation that can occur in the middle of a number: periods and commas
         "mid-num=[\\.\\,];"

         // everything not mentioned above, plus the quote marks (which are all of
         // <pre-word>, <post-word>, and <char>)
         // NOTE(review): the quote marks appear inside the negated set below, which
         // reads as excluding them from <char> -- confirm against the rule parser
         "char=[^{break}{space}{dash}{kanji}{nbsp}{$ignore}{pre-word}{post-word}{mid-num}{danda}\r\\\"\\\'];"

         // a "number" is a run of prefix characters and dashes, followed by one or
         // more digits with isolated number-punctuation characters interspersed
         "number=([{pre-word}{dash}]*{digit}+({mid-num}{digit}+)*);"

         // the basic core of a word can be either a "number" as defined above, a single
         // "Kanji" character, or a run of any number of not-explicitly-mentioned
         // characters (this includes Latin letters)
         "word-core=([{pre-word}{char}]*|{kanji}|{number});"

         // a word may end with an optional suffix that can be either a run of one or
         // more dashes or a run of word-suffix characters, followed by an optional
         // run of whitespace
         "word-suffix=(({dash}+|{post-word}*){space}*);"

         // a word, thus, is an optional run of word-prefix characters, followed by
         // a word core and a word suffix (the syntax of <word-core> and <word-suffix>
         // actually allows either of them to match the empty string, putting a break
         // between things like ")(" or "aaa(aaa")
         "word=({pre-word}*{word-core}{word-suffix});"

         // finally, the rule that does the work: Keep together any run of words that
         // are joined by runs of one or more non-breaking characters (<nbsp>).  Also
         // keep a trailing line-break character or CRLF combination with the word.
         // (line separators "win" over nbsp's)
         "{word}({nbsp}+{word})*\r?{break}?;"
     }

     // default rules for finding sentence boundaries
     SentenceBreakRules {
         // ignore non-spacing marks, enclosing marks, and format characters
         "$ignore=[[:Mn:][:Me:][:Cf:]];"

         // lowercase letters
         "lc=[:Ll:];"

         // uppercase Latin letters
         "ucLatin=[A-Z];"

         // whitespace (line separators are treated as whitespace)
         "space=[\t\r\f\n\u2028[:Zs:]];"

         // punctuation which may occur at the beginning of a sentence: "starting
         // punctuation" and quotation marks
         "start=[[:Ps:]\\\"\\\'];"

         // punctuation which may occur at the end of a sentence: "ending punctuation"
         // and quotation marks
         "end=[[:Pe:]\\\"\\\'];"

         // digits
         "digit=[:N:];"

         // characters that unambiguously signal the end of a sentence
         "term=[\\!\\?\u3002\uff01\uff1f];"

         // periods, which MAY signal the end of a sentence
         "period=[\\.\uff0e];"

         // characters that may occur at the beginning of a sentence: basically anything
         // not mentioned above (lowercase letters and digits are specifically excluded)
         "sent-start=[^{lc}{ucLatin}{space}{start}{end}{digit}{term}{period}\u2029{$ignore}];"

         // Hindi phrase separator
         "danda=[\u0964\u0965];"

         // always break sentences after paragraph separators
         ".*?\u2029?;"

         // always break after a danda, if it's followed by whitespace
         // NOTE(review): the rule uses {space}*, so the whitespace is optional --
         // confirm which of the comment and the rule is intended
         ".*?{danda}{space}*;"

         // if you see a period, skip over additional periods and ending punctuation
         // and if the next character is a paragraph separator, break after the
         // paragraph separator
         ".*?{period}[{period}{end}]*{space}*\u2029;"

         // if you see a period, skip over additional periods and ending punctuation,
         // followed by optional whitespace, followed by optional starting punctuation,
         // and if the next character is something that can start a sentence
         // (basically, a capital letter), then put the sentence break between the
         // whitespace and the opening punctuation
         ".*?{period}[{period}{end}]*{space}*/({start}*{sent-start}|{start}+{ucLatin});"

         // same as above, except that there's a sentence break before a Latin capital
         // letter only if there's at least one space after the period
         ".*?{period}[{period}{end}]*{space}+/{ucLatin};"

         // if you see a sentence-terminating character, skip over any additional
         // terminators, periods, or ending punctuation, followed by any whitespace,
         // followed by a SINGLE optional paragraph separator, and put the break there
         ".*?{term}[{term}{period}{end}]*{space}*\u2029?;"

         // The following rules are here to aid in backwards iteration.  The automatically
         // generated backwards state table will rewind to the beginning of the
         // paragraph all the time (or all the way to the beginning of the document
         // if the document doesn't use the Unicode PS character) because the only
         // unambiguous character pairs are those involving paragraph separators.
         // These specify a few more unambiguous breaking situations.

         // if you see a sentence-starting character, followed by starting punctuation
         // (remember, we're iterating backwards), followed by an optional run of
         // whitespace, followed by an optional run of ending punctuation, followed
         // by a period, this is a safe place to turn around
         // NOTE(review): the rule uses {space}+, i.e. at least one whitespace
         // character, not an optional run -- confirm which is intended
         "![{sent-start}{ucLatin}]{start}*{space}+{end}*{period};"

         // if you see a letter or a digit, followed by an optional run of
         // starting punctuation, followed by an optional run of whitespace,
         // followed by an optional run of ending punctuation, followed by
         // a sentence terminator, this is a safe place to turn around
         "![{sent-start}{lc}{digit}]{start}*{space}*{end}*{term};"
     }

     //------------------------------------------------------------
     // END BreakIterator support
     //------------------------------------------------------------

     // two-element array of day-period markers, "AM" first and "PM" second
     AmPmMarkers {
             "AM",
             "PM",
     }
     // Display names for countries and territories, keyed by two-letter code.
     // Entries are ordered roughly by display name rather than by code.
     Countries {
         AF { "Afghanistan" }
         AL { "Albania" }
         DZ { "Algeria" }
         AS { "American Samoa" }
         AD { "Andorra" }
         AO { "Angola" }
         AI { "Anguilla" }
         AR { "Argentina" }
         AM { "Armenia" }
         AW { "Aruba" }
         AU { "Australia" }
         AT { "Austria" }
         AZ { "Azerbaijan" }
         BS { "Bahamas" }
         BH { "Bahrain" }
         BD { "Bangladesh" }
         BB { "Barbados" }
         BY { "Belarus" }
         BE { "Belgium" }
         BZ { "Belize" }
         BJ { "Benin" }
         BM { "Bermuda" }
         BT { "Bhutan" }
         BO { "Bolivia" }
         BA { "Bosnia and Herzegovina" }
         BW { "Botswana" }
         BR { "Brazil" }
         BN { "Brunei" }
         BG { "Bulgaria" }
         BF { "Burkina Faso" }
         BI { "Burundi" }
         KH { "Cambodia" }
         CM { "Cameroon" }
         CA { "Canada" }
         CV { "Cape Verde" }
         CF { "Central African Republic" }
         TD { "Chad" }
         CL { "Chile" }
         CN { "China" }
         CO { "Colombia" }
         KM { "Comoros" }
         CG { "Congo" }
         CR { "Costa Rica" }
         CI { "C\u00F4te d'Ivoire" }
         HR { "Croatia" }
         CU { "Cuba" }
         CY { "Cyprus" }
         CZ { "Czech Republic" }
         DK { "Denmark" }
         DJ { "Djibouti" }
         DM { "Dominica" }
         DO { "Dominican Republic" }
         TP { "East Timor" }
         EC { "Ecuador" }
         EG { "Egypt" }
         SV { "El Salvador" }
         GQ { "Equatorial Guinea" }
         ER { "Eritrea" }
         EE { "Estonia" }
         ET { "Ethiopia" }
         FJ { "Fiji" }
         FI { "Finland" }
         FO { "Faroe Islands" } // http://www.din.de/gremien/nas/nabd/iso3166ma/codlstp1/en_listp1.html
         FR { "France" }
         GF { "French Guiana" }
         GL { "Greenland" } // http://www.din.de/gremien/nas/nabd/iso3166ma/codlstp1/en_listp1.html
         PF { "French Polynesia" }
         TF { "French Southern Territories" }
         GA { "Gabon" }
         GM { "Gambia" }
         GE { "Georgia" }
         DE { "Germany" }
         GH { "Ghana" }
         GR { "Greece" }
         GP { "Guadeloupe" }
         GU { "Guam" }
         GT { "Guatemala" }
         GN { "Guinea" }
         GW { "Guinea-Bissau" }
         GY { "Guyana" }
         HT { "Haiti" }
         HN { "Honduras" }
         HK { "Hong Kong S.A.R., China" }
         HU { "Hungary" }
         IS { "Iceland" }
         IN { "India" }
         ID { "Indonesia" }
         IR { "Iran" }
         IQ { "Iraq" }
         IE { "Ireland" }
         IL { "Israel" }
         IT { "Italy" }
         JM { "Jamaica" }
         JP { "Japan" }
         JO { "Jordan" }
         KZ { "Kazakhstan" }
         KE { "Kenya" }
         KI { "Kiribati" }
         KP { "North Korea" }
         KR { "South Korea" }
         KW { "Kuwait" }
         KG { "Kyrgyzstan" }
         LA { "Laos" }
         LV { "Latvia" }
         LB { "Lebanon" }
         LS { "Lesotho" }
         LR { "Liberia" }
         LY { "Libya" }
         LI { "Liechtenstein" }
         LT { "Lithuania" }
         LU { "Luxembourg" }
         MK { "Macedonia" }
         MG { "Madagascar" }
         MY { "Malaysia" }
         ML { "Mali" }
         MT { "Malta" }
         MP { "Northern Mariana Islands"}
         MH { "Marshall Islands"}
         MQ { "Martinique" }
         MR { "Mauritania" }
         MU { "Mauritius" }
         YT { "Mayotte" }
         MX { "Mexico" }
         FM { "Micronesia" }
         MD { "Moldova" }
         MC { "Monaco" }
         MN { "Mongolia" }
         MS { "Montserrat" }
         MA { "Morocco" }
         MZ { "Mozambique" }
         MM { "Myanmar" }
         NA { "Namibia" }
         NP { "Nepal" }
         NL { "Netherlands" }
         AN { "Netherlands Antilles" }
         NC { "New Caledonia" }
         NZ { "New Zealand" }
         NI { "Nicaragua" }
         NE { "Niger" }
         NG { "Nigeria" }
         NU { "Niue" }
         NO { "Norway" }
         OM { "Oman" }
         PK { "Pakistan" }
         PA { "Panama" }
         PG { "Papua New Guinea" }
         PY { "Paraguay" }
         PE { "Peru" }
         PH { "Philippines" }
         PL { "Poland" }
         PT { "Portugal" }
         PR { "Puerto Rico" }
         QA { "Qatar" }
         RO { "Romania" }
         RU { "Russia" }
         RW { "Rwanda" }
         SA { "Saudi Arabia" }
         SN { "Senegal" }
         // NOTE(review): SP does not look like an assigned ISO 3166 code --
         // confirm which locale IDs rely on this key before changing it
         SP { "Serbia" }
         SC { "Seychelles" }
         SL { "Sierra Leone" }
         SG { "Singapore" }
         SK { "Slovakia" }
         SI { "Slovenia" }
         SO { "Somalia" }
         ZA { "South Africa" }
         ES { "Spain" }
         LK { "Sri Lanka" }
         SD { "Sudan" }
         SR { "Suriname" }
         SZ { "Swaziland" }
         SE { "Sweden" }
         CH { "Switzerland" }
         SY { "Syria" }
         TW { "Taiwan" }
         TJ { "Tajikistan" }
         TZ { "Tanzania" }
         TH { "Thailand" }
         TG { "Togo" }
         TK { "Tokelau" }
         TO { "Tonga" }
         TT { "Trinidad and Tobago" }
         TN { "Tunisia" }
         TR { "Turkey" }
         TM { "Turkmenistan" }
         UG { "Uganda" }
         UA { "Ukraine" }
         AE { "United Arab Emirates" }
         GB { "United Kingdom" }
         US { "United States" }
         UY { "Uruguay" }
         UZ { "Uzbekistan" }
         VU { "Vanuatu" }
         VA { "Vatican" }
         VE { "Venezuela" }
         VN { "Vietnam" }
         VG { "British Virgin Islands" }
         VI { "U.S. Virgin Islands" }
         EH { "Western Sahara" }
         YE { "Yemen" }
         YU { "Yugoslavia" }
         ZR { "Zaire" }
         ZM { "Zambia" }
         ZW { "Zimbabwe" }
     }
     // three-element array of language-neutral currency strings
     // NOTE(review): slots are presumably symbol, international code, and a
     // monetary-separator override -- confirm against the consumer
     CurrencyElements {
             "\u00A4",   // U+00A4, the generic currency sign
             "XXX",
             "",         // intentionally empty
     }
     // two-element array of numeric strings, both "1"
     // NOTE(review): presumably first day of week and minimal days in the
     // first week -- confirm against the consumer
     DateTimeElements {
             "1",
             "1",
     }
     // nine-element array: four time patterns, four date patterns, then one
     // pattern that combines two arguments.  Consumers index by position, so
     // the order must not change.
     // NOTE(review): the four entries in each group are presumably the
     // full/long/medium/short styles -- confirm against the consumer
     DateTimePatterns {
             "h:mm:ss a z",          // time (identical to the next entry)
             "h:mm:ss a z",          // time
             "h:mm:ss a",            // time
             "h:mm a",               // time
             "EEEE, MMMM d, yyyy",   // date
             "MMMM d, yyyy",         // date
             "MMM d, yyyy",          // date
             "M/d/yy",               // date
             "{1} {0}",              // combination: argument 1, a space, argument 0
     }
     // seven abbreviated day names, starting with Sunday; same order as DayNames
     DayAbbreviations {
             "Sun",
             "Mon",
             "Tue",
             "Wed",
             "Thu",
             "Fri",
             "Sat",
     }
     // seven full day names, starting with Sunday; same order as DayAbbreviations
     DayNames {
             "Sunday",
             "Monday",
             "Tuesday",
             "Wednesday",
             "Thursday",
             "Friday",
             "Saturday",
     }
     // two-element array of era names, "BC" first and "AD" second
     Eras {
             "BC",
             "AD",
     }
     Languages {
         aa  { "Afar" }
         ab  { "Abkhazian" }
         ace { "Achinese" }
         ach { "Acoli" }
         ada { "Adangme" }
         ae  { "Avestan" }
         af  { "Afrikaans" }
         afa { "Afro-Asiatic (Other)" }
         afh { "Afrihili" }
         aka { "Akan" }
         akk { "Akkadian" }
         ale { "Aleut" }
         alg {  "Algonquian Languages" }
         am  { "Amharic" }
         ang { "English, Old (ca.450-1100)" }
         apa { "Apache Languages"}
         ar  { "Arabic" }
         arc { "Aramaic" }
         arn { "Araucanian" }
         arp { "Arapaho" }
         art { "Artificial (Other)" }
         arw { "Arawak" }
         as  { "Assamese" }
         ath { "Athapaskan Languages" }
         aus { "Australian Languages" }
         ava { "Avaric" }
         awa { "Awadhi" }
         ay  { "Aymara" }
         az  { "Azerbaijani" }
         ba  { "Bashkir" }
         bad { "Banda" }
         bai { "Bamileke Languages" }
         bal { "Baluchi" }
         bam { "Bambara" }
         ban { "Balinese" }
         bas { "Basa" }
         bat { "Baltic (Other)" }
         be  { "Belarusian" }
         bej { "Beja" }
         bem { "Bemba" }
         ber { "Berber" }
         bg  { "Bulgarian" }
         bh  { "Bihari" }
         bho { "Bhojpuri" }
         bi  { "Bislama" }
         bik { "Bikol" }
         bin { "Bini" }
         bla { "Siksika" }
         bn  { "Bengali" }
         bnt { "Bantu" }
         bo  { "Tibetan" }
         br  { "Breton" }
         bra { "Braj" }
         bs  { "Bosnian"}
         btk { "Batak" }
         bua { "Buriat" }
         bug { "Buginese" }
         ca  { "Catalan" }
         cad { "Caddo" }
         cai { "Central American Indian (Other)" }
         car { "Carib" }
         cau { "Caucasian (Other)" }
         ce  { "Chechen" }
         ceb { "Cebuano" }
         cel { "Celtic (Other)" }
         ch  { "Chamorro" }
         chb { "Chibcha" }
         chg { "Chagatai" }
         chk { "Chuukese" }
         chm { "Mari" }
         chn { "Chinook Jargon" }
         cho { "Choctaw" }
         chp { "Chipewyan" }
         chr { "Cherokee" }
         chy { "Cheyenne" }
         cmc { "Chamic Languages" }
         co  { "Corsican" }
         cop { "Coptic" }
         cpe { "Creoles and Pidgins, English-based (Other)" }
         cpf { "Creoles and Pidgins, French-based (Other)" }
         cre { "Cree" }
         crp { "Creoles and Pidgins (Other)" }
         cs  { "Czech" }
         cu  { "Church Slavic" }
         cus { "Cushitic (Other)" }
         cv  { "Chuvash" }
         cy  { "Welsh" }
         da  { "Danish" }
         dak { "Dakota" }
         day { "Dayak" }
         de  { "German" }
         del { "Delaware" }
         den { "Slave" }
         dgr { "Dogrib" }
         din { "Dinka" }
         div { "Divehi" }
         doi { "Dogri" }
         dra { "Dravidian (Other)" }
         dua { "Duala" }
         dum { "Dutch, Middle (ca. 1050-1350)" }
         dyu { "Dyula" }
         dz  { "Bhutani" }
         dzo { "Dzongkha" }
         efi { "Efik" }
         egy { "Egyptian (Ancient)" }
         eka { "Ekajuk" }
         el  { "Greek" } //  Modern (1453-)
         elx { "Elamite" }
         en  { "English" }
         enm { "English, Middle (1100-1500)" }
         eo  { "Esperanto" }
         es  { "Spanish" }
         et  { "Estonian" }
         eu  { "Basque" }
         ewe { "Ewe" }
         ewo { "Ewondo" }
         fa  { "Persian" }
         fan { "Fang" }
         fat { "Fanti" }
         fi  { "Finnish" }
         fiu { "Finno-Ugrian" }
         fj  { "Fiji" }
         fo  { "Faeroese" }
         fon { "Fon" }
         fr  { "French" }
         frm { "French, Middle (ca.1400-1600)" }
         fro { "French, Old (842-ca.1400)" }
         ful { "Fulah" }
         fur { "Friulian" }
         fy  { "Frisian" }
         ga  { "Irish" }
         gaa { "Ga" }
         gay { "Gayo" }
         gba {"Gbaya" }
         gd  { "Scots Gaelic" }
         gem { "Germanic (Other)" }
         gil { "Gilbertese" }
 		gl  { "Gallegan" }
         gla { "Gaelic (Scots)" }
         gmh { "German, Middle High (ca.1050-1500)" }
         gn  { "Guarani" }
         goh { "German, Old High (ca.750-1050)" }
         gon { "Gondi" }
         gor { "Gorontalo" }
         got { "Gothic" }
         grb { "Grebo" }
         grc { "Greek, Ancient (to 1453)" }
         gu  { "Gujarati" }
         gv  { "Manx" }
         gwi { "Gwich'in" }
         hai { "Haida" }
         hau { "Hausa" }
         haw { "Hawaiian" }
         he  { "Hebrew" }
         hi  { "Hindi" }
         him { "Himachali" }
         hit { "Hittite" }
         hmn { "Hmong" }
         ho  { "Hiri Motu" }
         hr  { "Croatian" }
         hu  { "Hungarian" }
         hup { "Hupa" }
         hy  { "Armenian" }
         hz  { "Herero" }
         ia  { "Interlingua" }
         iba { "Iban" }
         ibo { "Igbo" }
         id  { "Indonesian" }
         ie  { "Interlingue" }
         ijo { "Ijo" }
         ik  { "Inupiak" }
         ilo { "Iloko" }
         inc { "Indic (Other)" }
         ine { "Indo-European" }
         ira { "Iranian" }
         iro { "Iroquoian Languages" }
         is  { "Icelandic" }
         it  { "Italian" }
         iu  { "Inuktitut" }
         iw  { "Hebrew" }
         ja  { "Japanese" }
         jpr { "Judeo-Persian" }
         jrb { "Judeo-Arabic" }
         jw  { "Javanese" }
         ka  { "Georgian" }
         kaa { "Kara-Kalpak" }
         kab { "Kabyle" }
         kac { "Kachin" }
         kam { "Kamba" }
         kar { "Karen" }
         kau { "Kanuri" }
         kaw { "Kawi" }
         kha { "Khasi" }
         khi { "Khoisan" }
         kho { "Khotanese" }
         ki  { "Kikuyu" }
         kk  { "Kazakh" }
         kl  { "Kalaallisut" }
         km  { "Khmer" }
         kmb { "Kimbundu" }
         kn  { "Kannada" }
         ko  { "Korean" }
         kok { "Konkani" }
         kon { "Kongo" }
         kos { "Kosrean" }
         kpe { "Kpelle" }
         kro { "Kru" }
         kru { "Kurukh" }
         ks  { "Kashmiri" }
         ku  { "Kurdish" }
         kum { "Kumyk" }
         kut { "Kutenai" }
         kv  { "Komi" }
         kw  { "Cornish" }
         ky  { "Kirghiz" }
         la  { "Latin" }
         lad { "Ladino" }
         lah { "Lahnda" }
         lam { "Lamba" }
         lb  { "Letzeburgesch" }
         lez { "Lezghian" }
         lin { "Lingala" }
         lit { "Lithuanian" }
         ln  { "Lingala" }
         lo  { "Lao" }
         lol { "Mongo" }
         loz { "Lozi" }
         lt  { "Lithuanian" }
         lua { "Luba-Lulua" }
         lub { "Luba-Katanga" }
         lug { "Ganda" }
         lui { "Luiseno" }
         lun { "Lunda" }
         luo { "Luo" }
         lus { "Lushai" }
         lv  { "Latvian (Lettish)" }
         mad { "Madurese" }
         mag { "Magahi" }
         mai { "Maithili" }
         mak { "Makasar" }
         man { "Mandingo" }
         map { "Austronesian" }
         mas { "Masai" }
         mdr { "Mandar" }
         men { "Mende" }
         mg  { "Malagasy" }
         mga { "Irish, Middle (900-1200)" }
         mh  { "Marshall"}
         mi  { "Maori" }
         mic { "Mic-Mac" }
         min { "Minangkabau" }
         mis { "Miscellaneous Languages" }
         mk  { "Macedonian" }
         mkh { "Mon-Khmer (Other)" }
         ml  { "Malayalam" }
         mn  { "Mongolian" }
         mnc { "Manchu" }
         mni { "Manipuri" }
         mno { "Manobo Languages" }
         mo  { "Moldavian" }
         moh { "Mohawk" }
         mos { "Mossi" }
         mr  { "Marathi" }
         ms  { "Malay" }
         mt  { "Maltese" }
         mul { "Multiple Languages" }
         mun { "Munda Languages" }
         mus { "Creek" }
         mwr { "Marwari" }
         my  { "Burmese" }
         myn { "Mayan" }
         na  { "Nauru" }
         nah { "Nahuatl" }
         nai { "North American Indian (Other)" }
         nb  { "Norwegian Bokm\u00e5l" }
         nd  { "Ndebele, North" }
         nds { "Low German; Low Saxon" }
         ne  { "Nepali" }
         new { "Newari" }
         ng  { "Ndonga" }
         nia { "Nias" }
         nic { "Niger-Kordofanian" }
         niu { "Niuean" }
         nl  { "Dutch" }
         nn  { "Norwegian Nynorsk" }
         no  { "Norwegian" }
         non { "Norse, Old" }
         nr  { "Ndebele, South" }
         nso { "Sotho, Northern" }
         nub { "Nubian Languages" }
         nv  {"Navajo"}
         ny  { "Chichewa; Nyanja" }
         nym { "Nyamwezi" }
         nyo { "Nyoro" }
         nzi { "Nzima" }
         oc  { "Proven\u00E7al; Occitan (post 1500)"}
         oji { "Ojibwa" }
         om  { "Oromo (Afan)" }
         or  { "Oriya" }
         os  { "Ossetic" }
         osa { "Osage" }
         ota { "Turkish (Ottoman Empire)" }
         oto { "Otomian Languages" }
         pa  { "Punjabi" }
         paa { "Papuan (Other)" }
         pag { "Pangasinan" }
         pal { "Pahlavi" }
         pam { "Pampanga" }
         pap { "Papiamento" }
         pau { "Palauan" }
         peo { "Persian, Old (ca.600-400 B.C.)" }
         phi { "Philippine (Other)" }
         phn { "Phoenician" }
         pi  { "Pali" }
         pl  { "Polish" }
         pon { "Pohnpeian" }
         pra { "Prakrit Languages" }
         pro { "Proven\u00E7al, Old (to 1500)" }
         ps  { "Pashto (Pushto)" }
         pt  { "Portuguese" }
         qu  { "Quechua" }
         raj { "Rajasthani" }
         rap { "Rapanui" }
         rar { "Rarotongan" }
         rm  { "Rhaeto-Romance" }
         rn  { "Rundi" }
         ro  { "Romanian" }
         roa { "Romance (Other)" }
         rom { "Romany" }
         ru  { "Russian" }
         rw  { "Kinyarwanda" }
         sa  { "Sanskrit" }
         sad { "Sandawe" }
         sah { "Yakut" }
         sai { "South American Indian (Other)" }
         sal { "Salishan" }
         sam { "Samaritan Aramaic" }
         sas { "Sasak" }
         sat { "Santali" }
         sc  { "Sardinian" }
         sco { "Scots" }
         sd  { "Sindhi" }
         se  { "Northern Sami" }
 // http://lcweb.loc.gov/standards/iso639-2/englangn.html
 // should provide the correct language code soon
 //        se { "Sami Languages" }        // DUP FIXME
         sel { "Selkup" }
         sem { "Semitic" }
         sg  { "Sango" }
         sga { "Irish, Old (to 900)" }
         sgn { "Sign Languages" }
         sh  { "Serbo-Croatian" }
         shn { "Shan" }
         si  { "Sinhalese" }
         sid { "Sidamo" }
         sio { "Siouan Languages" }
         sit { "Sino-Tibetan (Other)" }
         sk  { "Slovak" }
         sl  { "Slovenian" }
         sm  { "Samoan" }
         sn  { "Shona" }
         snk { "Soninke" }
         so  { "Somali" }
         sog { "Sogdian" }
         son { "Songhai" }
         sq  { "Albanian" }
         sr  { "Serbian" }
         srr { "Serer" }
         ss  { "Swati" }
         ssa { "Nilo-Saharan (Other)" }
         st  { "Sotho, Southern" }
         su  { "Sundanese" }
         suk { "Sukuma" }
         sus { "Susu" }
         sux { "Sumerian"}
         sv  { "Swedish" }
         sw  { "Swahili" }
         syr { "Syriac" }
         ta  { "Tamil" }
         tai { "Tai (Other)" }
         te  { "Telugu" }
         tem { "Timne" }
         ter { "Tereno" }
         tet { "Tetum" }
         tg  { "Tajik" }
         th  { "Thai" }
         tig { "Tigre" }
         tir { "Tigrinya" }
         tiv { "Tiv" }
         tk  { "Turkmen" }
         tl  { "Tagalog" }
         tli { "Tlingit" }
         tmh { "Tamashek" }
         tn  { "Tswana" }
         tog { "Tonga (Nyasa)" }
         ton { "Tongan (Tonga Islands)" }
         tr  { "Turkish" }
         ts  { "Tsonga" }
         tsi { "Tsimshian" }
         tt  { "Tatar" }
         tum { "Tumbuka" }
         tur { "Turkish" }
         tut { "Altaic (Other)" }
         tvl { "Tuvalu" }
         tw  { "Twi" }
         ty  { "Tahitian" }
         tyv { "Tuvinian" }
         ug  { "Uighur" }
         uga { "Ugaritic" }
         uk  { "Ukrainian" }
         umb { "Umbundu" }
         und { "Undetermined" }
         ur  { "Urdu" }
         uz  { "Uzbek" }
         vai { "Vai" }
         ven { "Venda" }
         vi  { "Vietnamese" }
         vo  { "Volap\u00FCk" }
         vot  { "Votic" }
         wak { "Wakashan Languages" }
         wal { "Walamo" }
         war { "Waray" }
         was { "Washo" }
         wen { "Sorbian Languages" }
         wo  { "Wolof" }
         xh  { "Xhosa" }
         yao { "Yao" }
         yap { "Yapese" }
         yi  { "Yiddish" }
         yor  { "Yoruba" }
         ypk { "Yupik Languages" }
         za  { "Zhuang" }
         zap { "Zapotec" }
         zen { "Zenaga" }
         zh  { "Chinese" }
         znd { "Zande" }
         zu  { "Zulu" }
         zun { "Zuni" }
     }
     // Identifier entries for this bundle: a four-character ID string and a
     // locale name string.
     // NOTE(review): LocaleString is "en" although this is the root bundle --
     // confirm that is intended.
     LocaleID { "0000" }
     LocaleString { "en" }
     // Three-letter English month abbreviations, January first.
     // The array has thirteen elements; the last one is an empty string
     // (NOTE(review): presumably a slot for a 13th month -- confirm).
     MonthAbbreviations {
             "Jan", "Feb", "Mar", "Apr",
             "May", "Jun", "Jul", "Aug",
             "Sep", "Oct", "Nov", "Dec",
             "",
     }
     // Full English month names, January first.
     // The array has thirteen elements; the last one is an empty string
     // (NOTE(review): presumably a slot for a 13th month -- confirm).
     MonthNames {
             "January", "February", "March",     "April",
             "May",     "June",     "July",      "August",
             "September", "October", "November", "December",
             "",
     }
     // Symbols used when formatting numbers. The array is positional: consumers
     // look elements up by index, so the order must not change.
     // NOTE(review): the per-slot roles below are inferred from the symbols
     // themselves -- confirm against the code that reads this array.
     NumberElements {
             ".",        // presumably the decimal separator
             ",",        // presumably the grouping separator
             ";",        // presumably the positive/negative pattern separator
             "%",        // percent sign
             "0",        // presumably the zero digit
             "#",        // presumably the optional-digit pattern character
             "-",        // minus sign
             "E",        // presumably the exponent marker
             "\u2030",   // U+2030 PER MILLE SIGN
             "\u221E",   // U+221E INFINITY
             "\uFFFD",   // U+FFFD REPLACEMENT CHARACTER (presumably the NaN symbol)
     }
     // Four number-format pattern strings. The array is positional, so the
     // order of the elements must be preserved.
     NumberPatterns {
             // Grouped decimal, with an explicit negative sub-pattern after ';'.
             "#,##0.###;-#,##0.###",
             // Currency: the escape below is U+00A4 CURRENCY SIGN.
             "\u00A4 #,##0.00;-\u00A4 #,##0.00",
             // Percent.
             "#,##0%",
             // Exponent notation.
             "#E0"
     }
     // Short codes for this bundle: the country code is empty and the
     // language code is the three-letter "eng".
     ShortCountry { "" }
     ShortLanguage { "eng" }
     // NOTE(review): presumably the set of date/time pattern letters, in a
     // fixed positional order -- confirm against the consumer before editing.
     localPatternChars { "GyMdkHmsSEDFwWahKzYe" }
     // Time-zone display strings: an array of rows, each holding six strings.
     // Judging from the data, the columns are:
     //   [0] zone identifier
     //   [1] long name, standard time     [2] short name, standard time
     //   [3] long name, daylight time     [4] short name, daylight time
     //   [5] a representative city
     // NOTE(review): column meanings are inferred from the values -- confirm
     // against the code that reads this table. Rows are positional; do not
     // reorder elements within a row.
     zoneStrings {
         // Pacific
         {
                 "PST",
                 "Pacific Standard Time",
                 "PST",
                 "Pacific Daylight Time",
                 "PDT",
                 "San Francisco",
         }
         // Mountain
         {
                 "MST",
                 "Mountain Standard Time",
                 "MST",
                 "Mountain Daylight Time",
                 "MDT",
                 "Denver",
         }
         // Phoenix: the daylight slots repeat the standard-time strings.
         {
                 "PNT",
                 "Mountain Standard Time",
                 "MST",
                 "Mountain Standard Time",
                 "MST",
                 "Phoenix",
         }
         // Central
         {
                 "CST",
                 "Central Standard Time",
                 "CST",
                 "Central Daylight Time",
                 "CDT",
                 "Chicago",
         }
         // Eastern
         {
                 "EST",
                 "Eastern Standard Time",
                 "EST",
                 "Eastern Daylight Time",
                 "EDT",
                 "New York",
         }
         // Indianapolis: the daylight slots repeat the standard-time strings.
         {
                 "IET",
                 "Eastern Standard Time",
                 "EST",
                 "Eastern Standard Time",
                 "EST",
                 "Indianapolis",
         }
         // Atlantic
         {
                 "PRT",
                 "Atlantic Standard Time",
                 "AST",
                 "Atlantic Daylight Time",
                 "ADT",
                 "Halifax",
         }
         // Hawaii
         {
                 "HST",
                 "Hawaii Standard Time",
                 "HST",
                 "Hawaii Daylight Time",
                 "HDT",
                 "Honolulu",
         }
         // Alaska
         // NOTE(review): the short names "AST"/"ADT" here are identical to the
         // short names in the Halifax row above -- confirm this ambiguity is
         // intended.
         {
                 "AST",
                 "Alaska Standard Time",
                 "AST",
                 "Alaska Daylight Time",
                 "ADT",
                 "Anchorage",
         }
     }


     // Script code(s) for this bundle, as a one-element array (the trailing
     // comma keeps it an array rather than a plain string).
     LocaleScript { "Latn", }

     //------------------------------------------------------------
     // Rule Based Number Format Support
     //------------------------------------------------------------

         // The root rule sets no longer carry the English (US) rules; those
         // now live in the _en rules. Each default below is a single rule
         // that just formats like DecimalFormat.
         SpelloutRules { "=#,##0.######=;\n" }
         OrdinalRules  { "=#,##0=;\n" }
         DurationRules { "=#,##0=;\n" }

     // Display names for scripts, keyed by four-letter upper-case script code.
     // Values are user-visible strings, so they are written as display names
     // (words separated by spaces), not as property-alias identifiers.
     Scripts {
         ARAB { "Arabic" }
         ARMN { "Armenian" }
         BENG { "Bengali" }
         BOPO { "Bopomofo" }
         CANS { "Unified Canadian Aboriginal Syllabics" }
         CHER { "Cherokee" }
         CYRL { "Cyrillic" }
         DEVA { "Devanagari" }
         DSRT { "Deseret" }
         ETHI { "Ethiopic" }
         GEOR { "Georgian" }
         GOTH { "Gothic" }
         GREK { "Greek" }
         GUJR { "Gujarati" }
         GURU { "Gurmukhi" }
         HANG { "Hangul" }
         HANI { "Han" }
         HEBR { "Hebrew" }
         HIRA { "Hiragana" }
         ITAL { "Old Italic" }
         KANA { "Katakana" }
         KHMR { "Khmer" }
         KNDA { "Kannada" }
         LAO  { "Lao" }
         LATN { "Latin" }
         MLYM { "Malayalam" }
         MONG { "Mongolian" }
         MYMR { "Myanmar" }
         OGAM { "Ogham" }
         ORYA { "Oriya" }
         QAAC { "Coptic" }
         QAAI { "Inherited" }
         RUNR { "Runic" }
         SINH { "Sinhala" }
         SYRC { "Syriac" }
         TAML { "Tamil" }
         TELU { "Telugu" }
         THAA { "Thana" }
         THAI { "Thai" }
         TIBT { "Tibetan" }
         YIII { "Yi" }
         ZYYY { "Common" }
     }
 }