• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1<?xml version="1.0" encoding="UTF-8" ?>
2<!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
3<!--
4Copyright © 1991-2017 Unicode, Inc.
5CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
6For terms of use, see http://www.unicode.org/copyright.html
7-->
8<supplementalData>
9	<version number="$Revision: 13680 $"/>
10	<transforms>
11		<transform source="blt" target="blt_FONIPA" direction="forward" alias="blt-fonipa-t-blt">
12			<tRule><![CDATA[
13# Output phonemes
14# ---------------
15# Nasals:           m mʷ n nʷ ɲ ɲʷ ŋ ŋʷ
16# Plosives:         p pʰ pʰʷ pʷ b t tʷ tʰ d dʷ k kʰ kʰʷ kʷ ɡ ɡʷ ʔ
17# Fricatives:       f fʷ v s sʷ h hʷ x xʷ
18# Other consonants: w j l
19# Affricates:       t͡ɕ t͡ɕʷ t͡ɕʰ t͡ɕʰʷ
20# Vowels:           i ɨ u ɛ e ə ɔ o a aː
21# Diphthongs:       iə̯ ɨə̯ uə̯ ai̯
22# Tones:            ˨ ˧˥ ˨˩ ˥ ˦ ˧˩
23#
24#
25# Limitations
26# -----------
27# Currently, these rules only support tone marks, but not tone letters.
28#
29#
30# References
31# ----------
32# [1] Jim Brase, SIL International: Proposal to encode the Tai Viet script
33#     in the UCS. ISO/IEC JTC1/SC2/WG2 N3220. March 20, 2007.
34#     http://std.dkuug.dk/jtc1/sc2/wg2/docs/n3220.pdf
35#
36# [2] ScriptSource: Tai Viet Vowels.
37#     http://scriptsource.org/entry/eusd5ehysa
38#
39# [3] ScriptSource: Tai Viet Consonants.
40#     http://scriptsource.org/entry/lbwpkrqk7b
41#
42# [4] http://www.seasite.niu.edu/tai/TaiDam/tones.htm
43
44$LO = [ꪀ ꪂ ꪄ ꪆ ꪈ ꪊ ꪌ ꪎ ꪐ ꪒ ꪔ ꪖ ꪘ ꪚ ꪜ ꪞ ꪠ ꪢ ꪤ ꪦ ꪨ ꪪ ꪬ ꪮ];
45$HI = [ꪁ ꪃ ꪅ ꪇ ꪉ ꪋ ꪍ ꪏ ꪑ ꪓ ꪕ ꪗ ꪙ ꪛ ꪝ ꪟ ꪡ ꪣ ꪥ ꪧ ꪩ ꪫ ꪭ ꪯ];
46$C = [$LO $HI];
47$V1 = [ꪵ ꪶ ꪹ ꪻ ꪼ];  # vowels written before consonant
48$V2 = [ ꪰ ꪲ ꪳ ꪴ ꪷ ꪸ ꪾ];  # vowels written above or below consonant
49$V3 = [ꪱ ꪮ ꪺ ꪽ];  # vowels written after consonant
50$DIGRAPHS = [{ꪹ  ꪸ} {ꪹ  ꪷ} {ꪹ ꪱ}];
51$V12 = [$V1 $V2 $DIGRAPHS];
52$V123 = [$V12 $V3];
53$W = [ꪫ];  # labialization marker
54$F = [$C]; # syllable-final consonant
55$IPA_TONE = [˥ ˦ ˧ ˨ ˩];
56$NOT_IPA_TONE = [^$IPA_TONE];
57$BOUNDARY = [^[:L:][:M:][:N:]];
58
59# Consonants at the end of “checked” syllables.
60$CHK = [ꪜ ꪝ ꪞ ꪟ ꪔ ꪕ ꪖ ꪗ ꪀ ꪁ ꪂ ꪃ ꪮ ꪯ];
61
62# The Tai Viet script uses visual ordering. Convert to logical order.
63($V1) ($C $W?) → $2 $1;
64::null;
65
66# Special handling for stand-alone ꪽ ‘that’.
67$BOUNDARY {ꪽ} $BOUNDARY → nan˧˩;
68
69# Convert tones for checked syllables (those ending in /p/, /t/, /k/, /ʔ/)
70$LO $W? $V12 {($CHK)} → $1 ˧˥;  # Tone class 2: High-rising tone
71$LO $W? {($V3 $CHK)} → $1 ˧˥;  # Tone class 2: High-rising tone
72$HI $W? $V12 {($CHK)} → $1 ˦;  # Tone class 5: High-mid tone
73$HI $W? {($V3 $CHK)} → $1 ˦;  # Tone class 5: High-mid tone
74
75# Convert tones for unchecked syllables with vowels that are written
76# after the consonant (V3).
77# TODO: Also support tone letters, not just tone marks.
78$LO $W? { ꪿ ($V3 $F?)} → $1 ˧˥;  # Tone class 2: High-rising tone
79$LO $W? { ꫁ ($V3 $F?)} → $1 ˨˩;  # Tone class 3: Low-falling tone
80$HI $W? { ꪿ ($V3 $F?)} → $1 ˦;   # Tone class 5: High-mid tone
81$HI $W? { ꫁ ($V3 $F?)} → $1 ˧˩;  # Tone class 6: Mid-falling tone
82
83# Convert tones for unchecked syllables with vowels that are either written
84# before the consonant (V1) or vowels that are written above or below it (V2).
85# TODO: Also support tone letters, not just tone marks.
86$LO $W? $V12 { ꪿ ($F?)} → $1 ˧˥;  # Tone class 2: High-rising tone
87$LO $W? $V12 { ꫁ ($F?)} → $1 ˨˩;  # Tone class 3: Low-falling tone
88$HI $W? $V12 { ꪿ ($F?)} → $1 ˦;   # Tone class 5: High-mid tone
89$HI $W? $V12 { ꫁ ($F?)} → $1 ˧˩;  # Tone class 6: Mid-falling tone
90::null;
91
92{($LO $W? $V123 $F?)} $NOT_IPA_TONE → $1 ˨;  # Tone class 1: Low-mid tone.
93{($HI $W? $V123 $F?)} $NOT_IPA_TONE → $1 ˥;  # Tone class 4: High tone.
94::null;
95
96
97# Harden syllable-final consonants.
98$C $W? $V123 {ꪒ} → ꪔ;  # /d/ → /t/
99::null;
100
101# Convert labialization marker.
102$C {$W} $V123 → ʷ;
103::null;
104
105[ꪀ ꪁ] → k;
106[ꪂ ꪃ] → kʰ;  # Tai Dón; not used in Tai Dam according to [3]
107[ꪄ ꪅ] → x;
108[ꪆ ꪇ] → ɡ;  # only in loanwords, according to [3]
109[ꪈ ꪉ] → ŋ;
110[ꪊ ꪋ] → t͡ɕ;  # Tai Dón; not used in Tai Dam according to [3]
111[ꪌ ꪍ] → t͡ɕʰ;  # Tai Dón; not used in Tai Dam according to [3]
112[ꪎ ꪏ] → s;
113[ꪐ ꪑ] → ɲ;
114[ꪒ ꪓ] → d;
115[ꪔ ꪕ] → t;
116[ꪖ ꪗ] → tʰ;
117[ꪘ ꪙ] → n;
118[ꪚ ꪛ] → b;
119[ꪜ ꪝ] → p;
120[ꪞ ꪟ] → pʰ;  # Tai Dón; not used in Tai Dam according to [3]
121[ꪠ ꪡ] → f;
122[ꪢ ꪣ] → m;
123[ꪤ ꪥ] → j;
124[ꪦ ꪧ] → r;  # only in loanwords, according to [3]
125[ꪨ ꪩ] → l;
126{[ꪪ ꪫ]} $IPA_TONE → w;  # at the end of a syllable (before tone letters)
127[ꪪ ꪫ] → v;  # not at the end of a syllable
128[ꪬ ꪭ] → h;
129ʔ {[ꪮ ꪯ]} → ɔ;  # eg. ꪮꪮꪀ
130[ꪮ ꪯ] → ʔ;
131
132# Digraphs.
133ꪹ  ꪸ → e;
134ꪹ  ꪷ → ə;
135ꪹ ꪱ → aːw;
136
137# Vowels.
138 ꪰ → a;
139ꪱ → aː;
140 ꪲ → i;
141 ꪳ → ɨ;
142 ꪴ → u;
143ꪵ → ɛ;
144ꪶ → o;
145 ꪷ → ɔ;
146ꪮ → ɔ;
147ꪺ → uə̯;
148ꪽ → an;
149ꪹ → ɨə̯;
150 ꪸ → iə̯;
151ꪻ → əw;
152ꪼ → ai̯;
153 ꪾ → am;
154
155# Word ligature symbols.
156ꫛ → kon˥;
157ꫜ → nɨŋ˦;
158			]]></tRule>
159		</transform>
160	</transforms>
161</supplementalData>
162