# blob: dbe1c710c4c6bbda0d57996110750ebbdc518c3a [file] [log] [blame]
# © 2016 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html
# Generated using tools/cldr/cldr-to-icu/build-icu-data.xml
#
# File: blt_blt_FONIPA.txt
# Generated from CLDR
#
# Output phonemes
# ---------------
# Nasals: m mʷ n nʷ ɲ ɲʷ ŋ ŋʷ
# Plosives: p pʰ pʰʷ pʷ b t tʷ tʰ d dʷ k kʰ kʰʷ kʷ ɡ ɡʷ ʔ
# Fricatives: f fʷ v s sʷ h hʷ x xʷ
# Other consonants: w j l
# Affricates: t\u0361ɕ t\u0361ɕʷ t\u0361ɕʰ t\u0361ɕʰʷ
# Vowels: i ɨ u ɛ e ə ɔ o a aː
# Diphthongs: iə\u032F ɨə\u032F uə\u032F ai\u032F
# Tones: ˨ ˧˥ ˨˩ ˥ ˦ ˧˩
#
#
# Limitations
# -----------
# Currently, these rules only support tone marks, but not tone letters.
#
#
# References
# ----------
# [1] Jim Brase, SIL International: Proposal to encode the Tai Viet script
# in the UCS. ISO/IEC JTC1/SC2/WG2 N3220. March 20, 2007.
# http://std.dkuug.dk/jtc1/sc2/wg2/docs/n3220.pdf
#
# [2] ScriptSource: Tai Viet Vowels.
# http://scriptsource.org/entry/eusd5ehysa
#
# [3] ScriptSource: Tai Viet Consonants.
# http://scriptsource.org/entry/lbwpkrqk7b
#
# [4] http://www.seasite.niu.edu/tai/TaiDam/tones.htm
# Variable definitions
# --------------------
# $LO and $HI are the two consonant series; the tone rules below pick a
# different tone depending on which series the syllable-initial consonant
# belongs to.
# NOTE(review): each series lists only two letters here, while the consonant
# rules further down map 24 letter pairs (ꪀ/ꪁ … ꪮ/ꪯ). Confirm against the
# upstream CLDR data that these sets are complete.
$LO = [ꪀ ꪮ];
$HI = [ꪁ ꪯ];
$C = [$LO $HI];
# NOTE(review): $V1 and $V3 may likewise be truncated — verify upstream.
$V1 = [ꪵ ꪼ]; # vowels written before consonant
$V2 = [ \uAAB0 \uAAB2 \uAAB3 \uAAB4 \uAAB7 \uAAB8 \uAABE]; # vowels written above or below consonant
$V3 = [ꪱ ꪽ]; # vowels written after consonant
$DIGRAPHS = [{ꪹ \uAAB8} {ꪹ \uAAB7} {ꪹ ꪱ}];
$V12 = [$V1 $V2 $DIGRAPHS];
$V123 = [$V12 $V3];
$W = [ꪫ]; # labialization marker
$F = [$C]; # syllable-final consonant
# The IPA tone letters that the tone rules emit. This must be a well-formed
# bracketed set because it is negated in $NOT_IPA_TONE and used as trailing
# context when deciding whether ꪪ/ꪫ is syllable-final. It includes ˥, which
# tone class 4 and the ‘kon’ ligature produce.
$IPA_TONE = [˥ ˦ ˧ ˨ ˩];
$NOT_IPA_TONE = [^$IPA_TONE];
# Anything that is not a letter, mark, or number counts as a word boundary.
$BOUNDARY = [^[:L:][:M:][:N:]];
# Consonants at the end of “checked” syllables.
# NOTE(review): only ꪜ and ꪯ are listed; the tone rules describe checked
# syllables as ending in /p/, /t/, /k/, /ʔ/ — verify this set upstream.
$CHK = [ꪜ ꪯ];
# The Tai Viet script uses visual ordering. Convert to logical order.
# A pre-consonant vowel ($1) is moved behind the consonant and its optional
# labialization marker ($2), so later passes can assume consonant-first order.
($V1) ($C $W?) → $2 $1;
::null;
# Special handling for stand-alone ꪽ ‘that’.
$BOUNDARY {ꪽ} $BOUNDARY → nan˧˩;
# Convert tones for checked syllables (those ending in /p/, /t/, /k/, /ʔ/)
# Only the text inside { } is rewritten; everything outside is context.
# $1 re-emits the captured text unchanged and the tone letters are appended.
$LO $W? $V12 {($CHK)} → $1 ˧˥; # Tone class 2: High-rising tone
$LO $W? {($V3 $CHK)} → $1 ˧˥; # Tone class 2: High-rising tone
$HI $W? $V12 {($CHK)} → $1 ˦; # Tone class 5: High-mid tone
$HI $W? {($V3 $CHK)} → $1 ˦; # Tone class 5: High-mid tone
# Convert tones for unchecked syllables with vowels that are written
# after the consonant (V3).
# The tone mark sits inside { } but outside the capture group, so it is
# dropped from the output and replaced by the tone letters after $1.
# TODO: Also support tone letters, not just tone marks.
$LO $W? { \uAABF ($V3 $F?)} → $1 ˧˥; # Tone class 2: High-rising tone
$LO $W? { \uAAC1 ($V3 $F?)} → $1 ˨˩; # Tone class 3: Low-falling tone
$HI $W? { \uAABF ($V3 $F?)} → $1 ˦; # Tone class 5: High-mid tone
$HI $W? { \uAAC1 ($V3 $F?)} → $1 ˧˩; # Tone class 6: Mid-falling tone
# Convert tones for unchecked syllables with vowels that are either written
# before the consonant (V1) or vowels that are written above or below it (V2).
# TODO: Also support tone letters, not just tone marks.
$LO $W? $V12 { \uAABF ($F?)} → $1 ˧˥; # Tone class 2: High-rising tone
$LO $W? $V12 { \uAAC1 ($F?)} → $1 ˨˩; # Tone class 3: Low-falling tone
$HI $W? $V12 { \uAABF ($F?)} → $1 ˦; # Tone class 5: High-mid tone
$HI $W? $V12 { \uAAC1 ($F?)} → $1 ˧˩; # Tone class 6: Mid-falling tone
::null;
# Default tones: a syllable that is not already followed by an IPA tone
# letter (i.e. the previous pass assigned none) gets the tone implied by its
# initial consonant series alone.
{($LO $W? $V123 $F?)} $NOT_IPA_TONE → $1 ˨; # Tone class 1: Low-mid tone.
{($HI $W? $V123 $F?)} $NOT_IPA_TONE → $1 ˥; # Tone class 4: High tone.
::null;
# Harden syllable-final consonants.
# Only a ꪒ that follows consonant + optional labialization + vowel is
# rewritten, so a syllable-initial ꪒ is left alone.
$C $W? $V123 {ꪒ} → ꪔ; # /d/ → /t/
::null;
# Convert labialization marker.
# The marker is recognised only between a consonant and a vowel; elsewhere
# the same letter falls through to the consonant rules.
$C {$W} $V123 → ʷ;
::null;
# Consonants. Each rule maps a pair of letters to a single IPA consonant.
[ꪀ ꪁ] → k;
[ꪂ ꪃ] → kʰ; # Tai Dón; not used in Tai Dam according to [3]
[ꪄ ꪅ] → x;
[ꪆ ꪇ] → ɡ; # only in loanwords, according to [3]
[ꪈ ꪉ] → ŋ;
[ꪊ ꪋ] → t\u0361ɕ; # Tai Dón; not used in Tai Dam according to [3]
[ꪌ ꪍ] → t\u0361ɕʰ; # Tai Dón; not used in Tai Dam according to [3]
[ꪎ ꪏ] → s;
[ꪐ ꪑ] → ɲ;
[ꪒ ꪓ] → d;
[ꪔ ꪕ] → t;
[ꪖ ꪗ] → tʰ;
[ꪘ ꪙ] → n;
[ꪚ ꪛ] → b;
[ꪜ ꪝ] → p;
[ꪞ ꪟ] → pʰ; # Tai Dón; not used in Tai Dam according to [3]
[ꪠ ꪡ] → f;
[ꪢ ꪣ] → m;
[ꪤ ꪥ] → j;
[ꪦ ꪧ] → r; # only in loanwords, according to [3]
[ꪨ ꪩ] → l;
# The context-sensitive rule must come before the general one so that it
# wins when a tone letter follows.
{[ꪪ ꪫ]} $IPA_TONE → w; # at the end of a syllable (before tone letters)
[ꪪ ꪫ] → v; # not at the end of a syllable
[ꪬ ꪭ] → h;
# After an already-converted glottal stop, ꪮ/ꪯ is read as a vowel.
ʔ {[ꪮ ꪯ]} → ɔ; # eg. ꪮꪮꪀ
[ꪮ ꪯ] → ʔ;
# NOTE(review): the rules from here to the end of the file look damaged.
# Several consist only of an IPA output (e.g. “aːw;”) with no source pattern,
# and none carries the “→” operator. Two pairs start with the same mark
# (\uAAB8 → e / iə̯ and \uAAB7 → ə / ɔ), which suggests the digraph rules have
# lost a leading letter (compare $DIGRAPHS, where each digraph starts with ꪹ).
# The missing source sides cannot be recovered from this file alone — restore
# them from the upstream CLDR data before using these rules.
# Digraphs.
\uAAB8 e;
\uAAB7 ə;
aːw;
# Vowels.
\uAAB0 a;
aː;
\uAAB2 i;
\uAAB3 ɨ;
\uAAB4 u;
ɛ;
o;
\uAAB7 ɔ;
ɔ;
uə\u032F;
an;
ɨə\u032F;
\uAAB8 iə\u032F;
əw;
ai\u032F;
\uAABE am;
# Word ligature symbols.
# NOTE(review): both rules below show only the IPA output; the ligature
# characters they convert are missing — verify against upstream.
kon˥;
nɨŋ˦;