<?xml version="1.0" encoding="UTF-8" ?>
<!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
<!--
Copyright © 1991-2015 Unicode, Inc.
CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
For terms of use, see http://www.unicode.org/copyright.html
-->
<supplementalData>
	<version number="$Revision$"/>
	<transforms>
		<!--
		Bidirectional transform between IPA (und_FONIPA) and X-SAMPA (und_FONXSAMP).
		"alias" lists the identifiers for the IPA to X-SAMPA direction and
		"backwardAlias" those for the X-SAMPA to IPA direction.
		The rules live in a CDATA section, so XML entity references are NOT expanded
		there: write the characters < > and the ampersand literally inside the rules.
		-->
		<transform source="und_FONIPA" target="und_FONXSAMP" direction="both" alias="IPA-XSampa und-fonxsamp-t-und-fonipa" backwardAlias="XSampa-IPA und-fonipa-t-und-fonxsamp">
			<tRule><![CDATA[

# Conversion between IPA and X-SAMPA phonetic transcription.
#
# See http://www.phon.ucl.ac.uk/home/sampa/x-sampa.htm for a description of
# X-SAMPA, an ASCII encoding of the International Phonetic Alphabet.
#
# The following obsolete or extended IPA symbols have no X-SAMPA equivalents
# and remain unaffected by this transform:
#
#   ʞ  LATIN SMALL LETTER TURNED K
#   ʩ  LATIN SMALL LETTER FENG DIGRAPH
#   ʪ  LATIN SMALL LETTER LS DIGRAPH
#   ʫ  LATIN SMALL LETTER LZ DIGRAPH
#   ʬ  LATIN LETTER BILABIAL PERCUSSIVE
#   ʭ  LATIN LETTER BIDENTAL PERCUSSIVE
#
# An IPA tie bar is transformed to an X-SAMPA underscore, per the official
# X-SAMPA guidelines.  This can result in certain ambiguities: For example, the
# labial-velar nasal (http://en.wikipedia.org/wiki/Labial-velar_nasal) can be
# written as either [ŋ͡m] or [m͡ŋ] in IPA.  However, neither version can be
# represented unambiguously in X-SAMPA: IPA [ŋ͡m] becomes X-SAMPA [N_m], which
# is also used to represent a hypothetical laminal (_m) velar nasal, IPA [ŋ̻];
# and IPA [m͡ŋ] becomes X-SAMPA [m_N], which can also represent a linguolabial
# (_N) nasal, IPA [m̼], which is more appropriately written [n̼].  To avoid
# unintended ambiguities, it may therefore be advisable to write affricates
# without tie bars.
#
# $t is used by the U+0361 (tie bar) rule and by the digraph compatibility
# rules (ʣ, ʤ, ʥ, ʦ, ʧ, ʨ), so the tie-bar spelling is defined in one place.
$t = '_';  # X-SAMPA representation of IPA tie bar.

# Normalisation step: NFD when running IPA to X-SAMPA, NFC (the part in
# parentheses) when running X-SAMPA to IPA.  Decomposing first lets the rules
# below match base letters and combining marks individually (for example
# c + U+0327 for the c-cedilla rule).
::NFD(NFC);

# 5-character X-SAMPA representations
#
# Rules are grouped from the longest X-SAMPA spelling to the shortest.  Earlier
# rules take precedence, so in the X-SAMPA to IPA direction a long sequence is
# consumed as a whole before any shorter rule can match its prefix.

ʯ ↔ 'z`_w=';      # LATIN SMALL LETTER TURNED H WITH FISHHOOK AND TAIL

# Alternative 5-character X-SAMPA representations
#
# One-way rules (X-SAMPA to IPA only).  Each takes a base letter followed by a
# diacritic and the voiceless mark '_0', and writes the voiceless mark as
# COMBINING RING ABOVE (U+030A) instead of the default COMBINING RING BELOW
# (U+0325) -- presumably because the space below the letter is already taken.

n\u031F\u030A ← 'n_+_0';
n\u0320\u030A ← 'n_-_0';
n\u032A\u030A ← 'n_d_0';
n\u033A\u030A ← 'n_a_0';
n\u033B\u030A ← 'n_m_0';
n\u033C\u030A ← 'n_N_0';
ɻ\u030A ← 'r\`_0';

# 4-character X-SAMPA representations
#
# The '<' in the implosive spellings is written literally: the rules sit in a
# CDATA section, where XML entity references are not expanded, so an escaped
# form would become part of the X-SAMPA string itself.

ǁ ↔ '|\|\';       # LATIN LETTER LATERAL CLICK
ʄ ↔ 'J\_<';       # LATIN SMALL LETTER DOTLESS J WITH STROKE AND HOOK
ʛ ↔ 'G\_<';       # LATIN LETTER SMALL CAPITAL G WITH HOOK
ʮ ↔ 'z_w=';       # LATIN SMALL LETTER TURNED H WITH FISHHOOK
\u1DC4 ↔ '_H_T';  # COMBINING MACRON-ACUTE
\u1DC5 ↔ '_B_L';  # COMBINING GRAVE-MACRON
\u1DC8 ↔ '_R_F';  # COMBINING GRAVE-ACUTE-GRAVE

# Alternative 4-character X-SAMPA representations
#
# One-way rules (X-SAMPA to IPA only): a letter followed by the voiceless mark
# '_0' is written with COMBINING RING ABOVE (U+030A).

ɭ\u030A ← 'l`_0';
ɰ\u030A ← 'M\_0';
ɳ\u030A ← 'n`_0';
ɽ\u030A ← 'r`_0';

# 3-character X-SAMPA representations
#
# '<' and '>' are written literally: the rules sit in a CDATA section, where
# XML entity references are not expanded, so an escaped form would become part
# of the X-SAMPA string itself.  Inside single quotes they are plain text, not
# rule operators.

ɓ ↔ 'b_<';        # LATIN SMALL LETTER B WITH HOOK
ɗ ↔ 'd_<';        # LATIN SMALL LETTER D WITH HOOK
ɠ ↔ 'g_<';        # LATIN SMALL LETTER G WITH HOOK
ɻ ↔ 'r\`';        # LATIN SMALL LETTER TURNED R WITH HOOK
↗ ↔ '<R>';        # NORTH EAST ARROW
↘ ↔ '<F>';        # SOUTH EAST ARROW

# Alternative 3-character X-SAMPA representations
#
# One-way rules (X-SAMPA to IPA only): a letter followed by the voiceless mark
# '_0' is written with COMBINING RING ABOVE (U+030A).

j\u030A ← 'j_0';
ŋ\u030A ← 'N_0';
ɥ\u030A ← 'H_0';
ɱ\u030A ← 'F_0';
ɲ\u030A ← 'J_0';

# 2-character X-SAMPA representations
#
# These must stay ahead of the 1-character rules: many of them start with a
# character that is itself a 1-character X-SAMPA symbol (for example 'N\'
# versus N, or any '_x' diacritic versus the tie bar '_').

ħ ↔ 'X\';      # LATIN SMALL LETTER H WITH STROKE
ǀ ↔ '|\';      # LATIN LETTER DENTAL CLICK
ǂ ↔ '=\';      # LATIN LETTER ALVEOLAR CLICK
ǃ ↔ '!\';      # LATIN LETTER RETROFLEX CLICK
ɕ ↔ 's\';      # LATIN SMALL LETTER C WITH CURL
ɖ ↔ 'd`';      # LATIN SMALL LETTER D WITH TAIL
ɘ ↔ '@\';      # LATIN SMALL LETTER REVERSED E
ɚ ↔ '@`';      # LATIN SMALL LETTER SCHWA WITH HOOK
ɝ ↔ '3`';      # LATIN SMALL LETTER REVERSED OPEN E WITH HOOK
ɞ ↔ '3\';      # LATIN SMALL LETTER CLOSED REVERSED OPEN E
ɟ ↔ 'J\';      # LATIN SMALL LETTER DOTLESS J WITH STROKE
ɢ ↔ 'G\';      # LATIN LETTER SMALL CAPITAL G
ɦ ↔ 'h\';      # LATIN SMALL LETTER H WITH HOOK
ɧ ↔ 'x\';      # LATIN SMALL LETTER HENG WITH HOOK
ɭ ↔ 'l`';      # LATIN SMALL LETTER L WITH RETROFLEX HOOK
ɮ ↔ 'K\';      # LATIN SMALL LETTER LEZH
ɰ ↔ 'M\';      # LATIN SMALL LETTER TURNED M WITH LONG LEG
ɳ ↔ 'n`';      # LATIN SMALL LETTER N WITH RETROFLEX HOOK
ɴ ↔ 'N\';      # LATIN LETTER SMALL CAPITAL N
ɸ ↔ 'p\';      # LATIN SMALL LETTER PHI
ɹ ↔ 'r\';      # LATIN SMALL LETTER TURNED R
ɺ ↔ 'l\';      # LATIN SMALL LETTER TURNED R WITH LONG LEG
ɽ ↔ 'r`';      # LATIN SMALL LETTER R WITH TAIL
ʀ ↔ 'R\';      # LATIN LETTER SMALL CAPITAL R
ʂ ↔ 's`';      # LATIN SMALL LETTER S WITH HOOK
ʈ ↔ 't`';      # LATIN SMALL LETTER T WITH RETROFLEX HOOK
ʐ ↔ 'z`';      # LATIN SMALL LETTER Z WITH RETROFLEX HOOK
ʑ ↔ 'z\';      # LATIN SMALL LETTER Z WITH CURL
ʕ ↔ '?\';      # LATIN LETTER PHARYNGEAL VOICED FRICATIVE
ʘ ↔ 'O\';      # LATIN LETTER BILABIAL CLICK
ʙ ↔ 'B\';      # LATIN LETTER SMALL CAPITAL B
ʜ ↔ 'H\';      # LATIN LETTER SMALL CAPITAL H
ʝ ↔ 'j\';      # LATIN SMALL LETTER J WITH CROSSED-TAIL
ʟ ↔ 'L\';      # LATIN LETTER SMALL CAPITAL L
ʡ ↔ '>\';      # LATIN LETTER GLOTTAL STOP WITH STROKE
ʢ ↔ '<\';      # LATIN LETTER REVERSED GLOTTAL STOP WITH STROKE
ʰ ↔ '_h';      # MODIFIER LETTER SMALL H
ʷ ↔ '_w';      # MODIFIER LETTER SMALL W
ʼ ↔ '_>';      # MODIFIER LETTER APOSTROPHE
ˆ ↔ '_\';      # MODIFIER LETTER CIRCUMFLEX ACCENT
ˇ ↔ '_/';      # CARON
ˑ ↔ ':\';      # MODIFIER LETTER HALF TRIANGULAR COLON
ˠ ↔ '_G';      # MODIFIER LETTER SMALL GAMMA
ˡ ↔ '_l';      # MODIFIER LETTER SMALL L
# NOTE(review): '_?\' is three characters long although it is listed in the
# 2-character group.  No earlier rule matches a prefix of it, so its position
# looks harmless -- confirm before moving it.
ˤ ↔ '_?\';     # MODIFIER LETTER SMALL REVERSED GLOTTAL STOP
\u0300 ↔ '_L';    # COMBINING GRAVE ACCENT
\u0301 ↔ '_H';    # COMBINING ACUTE ACCENT
\u0302 ↔ '_F';    # COMBINING CIRCUMFLEX ACCENT
\u0304 ↔ '_M';    # COMBINING MACRON
\u0306 ↔ '_X';    # COMBINING BREVE
\u0308 ↔ '_"';    # COMBINING DIAERESIS
\u030B ↔ '_T';    # COMBINING DOUBLE ACUTE ACCENT
\u030C ↔ '_R';    # COMBINING CARON
\u030F ↔ '_B';    # COMBINING DOUBLE GRAVE ACCENT
\u0318 ↔ '_A';    # COMBINING LEFT TACK BELOW
\u0319 ↔ '_q';    # COMBINING RIGHT TACK BELOW
\u031A ↔ '_}';    # COMBINING LEFT ANGLE ABOVE
\u031C ↔ '_c';    # COMBINING LEFT HALF RING BELOW
\u031D ↔ '_r';    # COMBINING UP TACK BELOW
\u031E ↔ '_o';    # COMBINING DOWN TACK BELOW
\u031F ↔ '_+';    # COMBINING PLUS SIGN BELOW
\u0320 ↔ '_-';    # COMBINING MINUS SIGN BELOW
\u0324 ↔ '_t';    # COMBINING DIAERESIS BELOW
\u0325 ↔ '_0';    # COMBINING RING BELOW
\u032A ↔ '_d';    # COMBINING BRIDGE BELOW
\u032C ↔ '_v';    # COMBINING CARON BELOW
\u032F ↔ '_^';    # COMBINING INVERTED BREVE BELOW
\u0330 ↔ '_k';    # COMBINING TILDE BELOW
\u0334 ↔ '_e';    # COMBINING TILDE OVERLAY
\u0339 ↔ '_O';    # COMBINING RIGHT HALF RING BELOW
\u033A ↔ '_a';    # COMBINING INVERTED BRIDGE BELOW
\u033B ↔ '_m';    # COMBINING SQUARE BELOW
\u033C ↔ '_N';    # COMBINING SEAGULL BELOW
\u033D ↔ '_x';    # COMBINING X ABOVE
ᵻ ↔ 'I\';      # LATIN SMALL CAPITAL LETTER I WITH STROKE
ᵿ ↔ 'U\';      # LATIN SMALL CAPITAL LETTER U WITH STROKE
ⁿ ↔ '_n';      # MODIFIER LETTER LATIN SMALL LETTER N

# Alternative 2-character X-SAMPA representations
#
# One-way rules (X-SAMPA to IPA only).  Each of these IPA characters also has
# a 1-character rule (P, \', '~', '='), which is the spelling produced in the
# IPA to X-SAMPA direction.

ʋ ← 'v\';         # LATIN SMALL LETTER V WITH HOOK
ʲ ← '_j';         # MODIFIER LETTER SMALL J
\u0303 ← '_~';    # COMBINING TILDE
\u0329 ← '_=';    # COMBINING VERTICAL LINE BELOW

# 1-character X-SAMPA representations
#
# Notes on syntax used below:
#   * Punctuation is quoted ('{', '@', '?', ...) so that it is treated as text;
#     plain letters and digits need no quotes.
#   * \' is a backslash-escaped apostrophe, i.e. the single X-SAMPA character '.
#   * c-cedilla is matched as c + U+0327 because the text has already been
#     decomposed by the ::NFD step.
#   * $t (the underscore) is listed here, after every '_x' diacritic rule, so
#     that a bare underscore is only read as a tie bar when nothing longer fits.

c\u0327 ↔ C;      # LATIN SMALL LETTER C WITH CEDILLA (decomposed)
æ ↔ '{';          # LATIN SMALL LETTER AE
ð ↔ D;            # LATIN SMALL LETTER ETH
ø ↔ 2;            # LATIN SMALL LETTER O WITH STROKE
ŋ ↔ N;            # LATIN SMALL LETTER ENG
œ ↔ 9;            # LATIN SMALL LIGATURE OE
ɐ ↔ 6;            # LATIN SMALL LETTER TURNED A
ɑ ↔ A;            # LATIN SMALL LETTER ALPHA
ɒ ↔ Q;            # LATIN SMALL LETTER TURNED ALPHA
ɔ ↔ O;            # LATIN SMALL LETTER OPEN O
ə ↔ '@';          # LATIN SMALL LETTER SCHWA
ɛ ↔ E;            # LATIN SMALL LETTER OPEN E
ɜ ↔ 3;            # LATIN SMALL LETTER REVERSED OPEN E
ɡ ↔ g;            # LATIN SMALL LETTER SCRIPT G
ɣ ↔ G;            # LATIN SMALL LETTER GAMMA
ɤ ↔ 7;            # LATIN SMALL LETTER RAMS HORN
ɥ ↔ H;            # LATIN SMALL LETTER TURNED H
ɨ ↔ 1;            # LATIN SMALL LETTER I WITH STROKE
ɪ ↔ I;            # LATIN LETTER SMALL CAPITAL I
ɫ ↔ 5;            # LATIN SMALL LETTER L WITH MIDDLE TILDE
ɬ ↔ K;            # LATIN SMALL LETTER L WITH BELT
ɯ ↔ M;            # LATIN SMALL LETTER TURNED M
ɱ ↔ F;            # LATIN SMALL LETTER M WITH HOOK
ɲ ↔ J;            # LATIN SMALL LETTER N WITH LEFT HOOK
ɵ ↔ 8;            # LATIN SMALL LETTER BARRED O
ɶ ↔ '&';          # LATIN LETTER SMALL CAPITAL OE
ɾ ↔ 4;            # LATIN SMALL LETTER R WITH FISHHOOK
ʁ ↔ R;            # LATIN LETTER SMALL CAPITAL INVERTED R
ʃ ↔ S;            # LATIN SMALL LETTER ESH
ʉ ↔ '}';          # LATIN SMALL LETTER U BAR
ʊ ↔ U;            # LATIN SMALL LETTER UPSILON
ʋ ↔ P;            # LATIN SMALL LETTER V WITH HOOK
ʌ ↔ V;            # LATIN SMALL LETTER TURNED V
ʍ ↔ W;            # LATIN SMALL LETTER TURNED W
ʎ ↔ L;            # LATIN SMALL LETTER TURNED Y
ʏ ↔ Y;            # LATIN LETTER SMALL CAPITAL Y
ʒ ↔ Z;            # LATIN SMALL LETTER EZH
ʔ ↔ '?';          # LATIN LETTER GLOTTAL STOP
ʲ ↔ \';           # MODIFIER LETTER SMALL J
ˈ ↔ '"';          # MODIFIER LETTER VERTICAL LINE
ˌ ↔ '%';          # MODIFIER LETTER LOW VERTICAL LINE
ː ↔ ':';          # MODIFIER LETTER TRIANGULAR COLON
˞ ↔ '`';          # MODIFIER LETTER RHOTIC HOOK
\u0303 ↔ '~';     # COMBINING TILDE
\u0329 ↔ '=';     # COMBINING VERTICAL LINE BELOW
\u0361 ↔ $t;      # COMBINING DOUBLE INVERTED BREVE
β ↔ B;            # GREEK SMALL LETTER BETA
θ ↔ T;            # GREEK SMALL LETTER THETA
χ ↔ X;            # GREEK SMALL LETTER CHI
↑ ↔ '^';          # UPWARDS ARROW
↓ ↔ '!';          # DOWNWARDS ARROW

# Compatibility rules for variant or obsolete IPA symbols
#
# One-way rules (IPA to X-SAMPA only): each variant symbol is folded onto an
# X-SAMPA spelling that already belongs to a standard IPA symbol, so the
# X-SAMPA to IPA direction never produces these characters.
#
# The '<' in the spelling for ʠ is written literally: the rules sit in a CDATA
# section, where XML entity references are not expanded, so an escaped form
# would become part of the X-SAMPA string itself.

g → g;            # LATIN SMALL LETTER G (redundant, for additional clarity)
ȵ → J;            # LATIN SMALL LETTER N WITH CURL
ɩ → I;            # LATIN SMALL LETTER IOTA
ɷ → U;            # LATIN SMALL LETTER CLOSED OMEGA
ɼ → 'r_r';        # LATIN SMALL LETTER R WITH LONG LEG
ɿ → 'z=';         # LATIN SMALL LETTER REVERSED R WITH FISHHOOK
ʅ → 'z`=';        # LATIN SMALL LETTER SQUAT REVERSED ESH
ʆ → S\';          # LATIN SMALL LETTER ESH WITH CURL
ʇ → '|\';         # LATIN SMALL LETTER TURNED T
ʓ → Z\';          # LATIN SMALL LETTER EZH WITH CURL
ʖ → '|\|\';       # LATIN LETTER INVERTED GLOTTAL STOP
ʗ → '!\';         # LATIN LETTER STRETCHED C
ʚ → '3\';         # LATIN SMALL LETTER CLOSED OPEN E
ʠ → 'G\_<_0';     # LATIN SMALL LETTER Q WITH HOOK
# Affricate digraphs expand to their two components joined by the tie bar $t.
ʣ → d $t z;       # LATIN SMALL LETTER DZ DIGRAPH
ʤ → d $t Z;       # LATIN SMALL LETTER DEZH DIGRAPH
ʥ → d $t 'z\';    # LATIN SMALL LETTER DZ DIGRAPH WITH CURL
ʦ → t $t s;       # LATIN SMALL LETTER TS DIGRAPH
ʧ → t $t S;       # LATIN SMALL LETTER TESH DIGRAPH
ʨ → t $t 's\';    # LATIN SMALL LETTER TC DIGRAPH WITH CURL
˔ → '_r';         # MODIFIER LETTER UP TACK
˕ → '_o';         # MODIFIER LETTER DOWN TACK
# Ring above shares the '_0' spelling of ring below (U+0325).
\u030A → '_0';    # COMBINING RING ABOVE
φ → 'p\';         # GREEK SMALL LETTER PHI
ꞎ → 'K`';         # LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT

# Closing normalisation step: NFC when running IPA to X-SAMPA, NFD (the part
# in parentheses) when running X-SAMPA to IPA.  It mirrors the ::NFD(NFC) step
# at the top of the rules.
::NFC(NFD);

			]]></tRule>
		</transform>
	</transforms>
</supplementalData>