UNPKG

cldr

Version:

Library for extracting data from CLDR (the Unicode Common Locale Data Repository)

267 lines (242 loc) 11.7 kB
<?xml version="1.0" encoding="UTF-8" ?>
<!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
<!--
Copyright © 1991-2015 Unicode, Inc.
CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
For terms of use, see http://www.unicode.org/copyright.html
-->
<supplementalData>
	<version number="$Revision$"/>
	<transforms>
		<transform source="und_FONIPA" target="und_FONXSAMP" direction="both" alias="IPA-XSampa und-fonxsamp-t-und-fonipa" backwardAlias="XSampa-IPA und-fonipa-t-und-fonxsamp">
			<tRule><![CDATA[
# Conversion between IPA and X-SAMPA phonetic transcription.
#
# See http://www.phon.ucl.ac.uk/home/sampa/x-sampa.htm for a description of
# X-SAMPA, an ASCII encoding of the International Phonetic Alphabet.
#
# The following obsolete or extended IPA symbols have no X-SAMPA equivalents
# and remain unaffected by this transform:
#
# ʞ LATIN SMALL LETTER TURNED K
# ʩ LATIN SMALL LETTER FENG DIGRAPH
# ʪ LATIN SMALL LETTER LS DIGRAPH
# ʫ LATIN SMALL LETTER LZ DIGRAPH
# ʬ LATIN LETTER BILABIAL PERCUSSIVE
# ʭ LATIN LETTER BIDENTAL PERCUSSIVE
#
# An IPA tie bar is transformed to an X-SAMPA underscore, per the official
# X-SAMPA guidelines. This can result in certain ambiguities: For example, the
# labial-velar nasal (http://en.wikipedia.org/wiki/Labial-velar_nasal) can be
# either written as [ŋ͡m] or [m͡ŋ] in IPA. However, neither version can be
# represented unambiguously in X-SAMPA: IPA [ŋ͡m] becomes X-SAMPA [N_m], which
# is also used to represent a hypothetical laminal (_m) velar nasal, IPA [ŋ̻];
# and IPA [m͡ŋ] becomes X-SAMPA [m_N], which can also represent a linguolabial
# (_N) nasal, IPA [m̼], which is more appropriately written [n̼]. To avoid
# unintended ambiguities, it may therefore be advisable to write affricates
# without tie bars.
#
# Rule layout: within each length group, longer X-SAMPA sequences are listed
# before shorter ones so that, for example, 'r\`' is matched before 'r\'.
# Keep this ordering when adding rules.
#
# NOTE(review): the copy of this file under review had lost its line breaks,
# its rule operators and several literal source characters (the two slanted
# and two vertical arrows, small capital I with stroke, superscript n, and
# l with retroflex hook and belt). They are restored here from the section
# headings (bidirectional in the main sections, backward-only in the
# "Alternative" sections, forward-only in the "Compatibility" section) and from
# the character names in the trailing comments. Confirm against upstream CLDR.
#
$t = '_';  # X-SAMPA representation of IPA tie bar.

::NFD(NFC);

# 5-character X-SAMPA representations
ʯ ↔ 'z`_w=';  # LATIN SMALL LETTER TURNED H WITH FISHHOOK AND TAIL

# Alternative 5-character X-SAMPA representations
n\u031F\u030A ← 'n_+_0';
n\u0320\u030A ← 'n_-_0';
n\u032A\u030A ← 'n_d_0';
n\u033A\u030A ← 'n_a_0';
n\u033B\u030A ← 'n_m_0';
n\u033C\u030A ← 'n_N_0';
ɻ\u030A ← 'r\`_0';

# 4-character X-SAMPA representations
ǁ ↔ '|\|\';  # LATIN LETTER LATERAL CLICK
ʄ ↔ 'J\_<';  # LATIN SMALL LETTER DOTLESS J WITH STROKE AND HOOK
ʛ ↔ 'G\_<';  # LATIN LETTER SMALL CAPITAL G WITH HOOK
ʮ ↔ 'z_w=';  # LATIN SMALL LETTER TURNED H WITH FISHHOOK
\u1DC4 ↔ '_H_T';  # COMBINING MACRON-ACUTE
\u1DC5 ↔ '_B_L';  # COMBINING GRAVE-MACRON
\u1DC8 ↔ '_R_F';  # COMBINING GRAVE-ACUTE-GRAVE

# Alternative 4-character X-SAMPA representations
ɭ\u030A ← 'l`_0';
ɰ\u030A ← 'M\_0';
ɳ\u030A ← 'n`_0';
ɽ\u030A ← 'r`_0';

# 3-character X-SAMPA representations
ɓ ↔ 'b_<';  # LATIN SMALL LETTER B WITH HOOK
ɗ ↔ 'd_<';  # LATIN SMALL LETTER D WITH HOOK
ɠ ↔ 'g_<';  # LATIN SMALL LETTER G WITH HOOK
ɻ ↔ 'r\`';  # LATIN SMALL LETTER TURNED R WITH HOOK
↗ ↔ '<R>';  # NORTH EAST ARROW
↘ ↔ '<F>';  # SOUTH EAST ARROW

# Alternative 3-character X-SAMPA representations
j\u030A ← 'j_0';
ŋ\u030A ← 'N_0';
ɥ\u030A ← 'H_0';
ɱ\u030A ← 'F_0';
ɲ\u030A ← 'J_0';

# 2-character X-SAMPA representations
ħ ↔ 'X\';  # LATIN SMALL LETTER H WITH STROKE
ǀ ↔ '|\';  # LATIN LETTER DENTAL CLICK
ǂ ↔ '=\';  # LATIN LETTER ALVEOLAR CLICK
ǃ ↔ '!\';  # LATIN LETTER RETROFLEX CLICK
ɕ ↔ 's\';  # LATIN SMALL LETTER C WITH CURL
ɖ ↔ 'd`';  # LATIN SMALL LETTER D WITH TAIL
ɘ ↔ '@\';  # LATIN SMALL LETTER REVERSED E
ɚ ↔ '@`';  # LATIN SMALL LETTER SCHWA WITH HOOK
ɝ ↔ '3`';  # LATIN SMALL LETTER REVERSED OPEN E WITH HOOK
ɞ ↔ '3\';  # LATIN SMALL LETTER CLOSED REVERSED OPEN E
ɟ ↔ 'J\';  # LATIN SMALL LETTER DOTLESS J WITH STROKE
ɢ ↔ 'G\';  # LATIN LETTER SMALL CAPITAL G
ɦ ↔ 'h\';  # LATIN SMALL LETTER H WITH HOOK
ɧ ↔ 'x\';  # LATIN SMALL LETTER HENG WITH HOOK
ɭ ↔ 'l`';  # LATIN SMALL LETTER L WITH RETROFLEX HOOK
ɮ ↔ 'K\';  # LATIN SMALL LETTER LEZH
ɰ ↔ 'M\';  # LATIN SMALL LETTER TURNED M WITH LONG LEG
ɳ ↔ 'n`';  # LATIN SMALL LETTER N WITH RETROFLEX HOOK
ɴ ↔ 'N\';  # LATIN LETTER SMALL CAPITAL N
ɸ ↔ 'p\';  # LATIN SMALL LETTER PHI
ɹ ↔ 'r\';  # LATIN SMALL LETTER TURNED R
ɺ ↔ 'l\';  # LATIN SMALL LETTER TURNED R WITH LONG LEG
ɽ ↔ 'r`';  # LATIN SMALL LETTER R WITH TAIL
ʀ ↔ 'R\';  # LATIN LETTER SMALL CAPITAL R
ʂ ↔ 's`';  # LATIN SMALL LETTER S WITH HOOK
ʈ ↔ 't`';  # LATIN SMALL LETTER T WITH RETROFLEX HOOK
ʐ ↔ 'z`';  # LATIN SMALL LETTER Z WITH RETROFLEX HOOK
ʑ ↔ 'z\';  # LATIN SMALL LETTER Z WITH CURL
ʕ ↔ '?\';  # LATIN LETTER PHARYNGEAL VOICED FRICATIVE
ʘ ↔ 'O\';  # LATIN LETTER BILABIAL CLICK
ʙ ↔ 'B\';  # LATIN LETTER SMALL CAPITAL B
ʜ ↔ 'H\';  # LATIN LETTER SMALL CAPITAL H
ʝ ↔ 'j\';  # LATIN SMALL LETTER J WITH CROSSED-TAIL
ʟ ↔ 'L\';  # LATIN LETTER SMALL CAPITAL L
ʡ ↔ '>\';  # LATIN LETTER GLOTTAL STOP WITH STROKE
ʢ ↔ '<\';  # LATIN LETTER REVERSED GLOTTAL STOP WITH STROKE
ʰ ↔ '_h';  # MODIFIER LETTER SMALL H
ʷ ↔ '_w';  # MODIFIER LETTER SMALL W
ʼ ↔ '_>';  # MODIFIER LETTER APOSTROPHE
ˆ ↔ '_\';  # MODIFIER LETTER CIRCUMFLEX ACCENT
ˇ ↔ '_/';  # CARON
ˑ ↔ ':\';  # MODIFIER LETTER HALF TRIANGULAR COLON
ˠ ↔ '_G';  # MODIFIER LETTER SMALL GAMMA
ˡ ↔ '_l';  # MODIFIER LETTER SMALL L
ˤ ↔ '_?\';  # MODIFIER LETTER SMALL REVERSED GLOTTAL STOP
\u0300 ↔ '_L';  # COMBINING GRAVE ACCENT
\u0301 ↔ '_H';  # COMBINING ACUTE ACCENT
\u0302 ↔ '_F';  # COMBINING CIRCUMFLEX ACCENT
\u0304 ↔ '_M';  # COMBINING MACRON
\u0306 ↔ '_X';  # COMBINING BREVE
\u0308 ↔ '_"';  # COMBINING DIAERESIS
\u030B ↔ '_T';  # COMBINING DOUBLE ACUTE ACCENT
\u030C ↔ '_R';  # COMBINING CARON
\u030F ↔ '_B';  # COMBINING DOUBLE GRAVE ACCENT
\u0318 ↔ '_A';  # COMBINING LEFT TACK BELOW
\u0319 ↔ '_q';  # COMBINING RIGHT TACK BELOW
\u031A ↔ '_}';  # COMBINING LEFT ANGLE ABOVE
\u031C ↔ '_c';  # COMBINING LEFT HALF RING BELOW
\u031D ↔ '_r';  # COMBINING UP TACK BELOW
\u031E ↔ '_o';  # COMBINING DOWN TACK BELOW
\u031F ↔ '_+';  # COMBINING PLUS SIGN BELOW
\u0320 ↔ '_-';  # COMBINING MINUS SIGN BELOW
\u0324 ↔ '_t';  # COMBINING DIAERESIS BELOW
\u0325 ↔ '_0';  # COMBINING RING BELOW
\u032A ↔ '_d';  # COMBINING BRIDGE BELOW
\u032C ↔ '_v';  # COMBINING CARON BELOW
\u032F ↔ '_^';  # COMBINING INVERTED BREVE BELOW
\u0330 ↔ '_k';  # COMBINING TILDE BELOW
\u0334 ↔ '_e';  # COMBINING TILDE OVERLAY
\u0339 ↔ '_O';  # COMBINING RIGHT HALF RING BELOW
\u033A ↔ '_a';  # COMBINING INVERTED BRIDGE BELOW
\u033B ↔ '_m';  # COMBINING SQUARE BELOW
\u033C ↔ '_N';  # COMBINING SEAGULL BELOW
\u033D ↔ '_x';  # COMBINING X ABOVE
ᵻ ↔ 'I\';  # LATIN SMALL CAPITAL LETTER I WITH STROKE
ᵿ ↔ 'U\';  # LATIN SMALL CAPITAL LETTER U WITH STROKE
ⁿ ↔ '_n';  # MODIFIER LETTER LATIN SMALL LETTER N

# Alternative 2-character X-SAMPA representations
ʋ ← 'v\';  # LATIN SMALL LETTER V WITH HOOK
ʲ ← '_j';  # MODIFIER LETTER SMALL J
\u0303 ← '_~';  # COMBINING TILDE
\u0329 ← '_=';  # COMBINING VERTICAL LINE BELOW

# 1-character X-SAMPA representations
c\u0327 ↔ C;  # LATIN SMALL LETTER C WITH CEDILLA (decomposed)
æ ↔ '{';  # LATIN SMALL LETTER AE
ð ↔ D;  # LATIN SMALL LETTER ETH
ø ↔ 2;  # LATIN SMALL LETTER O WITH STROKE
ŋ ↔ N;  # LATIN SMALL LETTER ENG
œ ↔ 9;  # LATIN SMALL LIGATURE OE
ɐ ↔ 6;  # LATIN SMALL LETTER TURNED A
ɑ ↔ A;  # LATIN SMALL LETTER ALPHA
ɒ ↔ Q;  # LATIN SMALL LETTER TURNED ALPHA
ɔ ↔ O;  # LATIN SMALL LETTER OPEN O
ə ↔ '@';  # LATIN SMALL LETTER SCHWA
ɛ ↔ E;  # LATIN SMALL LETTER OPEN E
ɜ ↔ 3;  # LATIN SMALL LETTER REVERSED OPEN E
ɡ ↔ g;  # LATIN SMALL LETTER SCRIPT G
ɣ ↔ G;  # LATIN SMALL LETTER GAMMA
ɤ ↔ 7;  # LATIN SMALL LETTER RAMS HORN
ɥ ↔ H;  # LATIN SMALL LETTER TURNED H
ɨ ↔ 1;  # LATIN SMALL LETTER I WITH STROKE
ɪ ↔ I;  # LATIN LETTER SMALL CAPITAL I
ɫ ↔ 5;  # LATIN SMALL LETTER L WITH MIDDLE TILDE
ɬ ↔ K;  # LATIN SMALL LETTER L WITH BELT
ɯ ↔ M;  # LATIN SMALL LETTER TURNED M
ɱ ↔ F;  # LATIN SMALL LETTER M WITH HOOK
ɲ ↔ J;  # LATIN SMALL LETTER N WITH LEFT HOOK
ɵ ↔ 8;  # LATIN SMALL LETTER BARRED O
ɶ ↔ '&';  # LATIN LETTER SMALL CAPITAL OE
ɾ ↔ 4;  # LATIN SMALL LETTER R WITH FISHHOOK
ʁ ↔ R;  # LATIN LETTER SMALL CAPITAL INVERTED R
ʃ ↔ S;  # LATIN SMALL LETTER ESH
ʉ ↔ '}';  # LATIN SMALL LETTER U BAR
ʊ ↔ U;  # LATIN SMALL LETTER UPSILON
ʋ ↔ P;  # LATIN SMALL LETTER V WITH HOOK
ʌ ↔ V;  # LATIN SMALL LETTER TURNED V
ʍ ↔ W;  # LATIN SMALL LETTER TURNED W
ʎ ↔ L;  # LATIN SMALL LETTER TURNED Y
ʏ ↔ Y;  # LATIN LETTER SMALL CAPITAL Y
ʒ ↔ Z;  # LATIN SMALL LETTER EZH
ʔ ↔ '?';  # LATIN LETTER GLOTTAL STOP
ʲ ↔ \';  # MODIFIER LETTER SMALL J
ˈ ↔ '"';  # MODIFIER LETTER VERTICAL LINE
ˌ ↔ '%';  # MODIFIER LETTER LOW VERTICAL LINE
ː ↔ ':';  # MODIFIER LETTER TRIANGULAR COLON
˞ ↔ '`';  # MODIFIER LETTER RHOTIC HOOK
\u0303 ↔ '~';  # COMBINING TILDE
\u0329 ↔ '=';  # COMBINING VERTICAL LINE BELOW
\u0361 ↔ $t;  # COMBINING DOUBLE INVERTED BREVE
β ↔ B;  # GREEK SMALL LETTER BETA
θ ↔ T;  # GREEK SMALL LETTER THETA
χ ↔ X;  # GREEK SMALL LETTER CHI
↑ ↔ '^';  # UPWARDS ARROW
↓ ↔ '!';  # DOWNWARDS ARROW

# Compatibility rules for variant or obsolete IPA symbols
g → g;  # LATIN SMALL LETTER G (redundant, for additional clarity)
ȵ → J;  # LATIN SMALL LETTER N WITH CURL
ɩ → I;  # LATIN SMALL LETTER IOTA
ɷ → U;  # LATIN SMALL LETTER CLOSED OMEGA
ɼ → 'r_r';  # LATIN SMALL LETTER R WITH LONG LEG
ɿ → 'z=';  # LATIN SMALL LETTER REVERSED R WITH FISHHOOK
ʅ → 'z`=';  # LATIN SMALL LETTER SQUAT REVERSED ESH
ʆ → S\';  # LATIN SMALL LETTER ESH WITH CURL
ʇ → '|\' ;  # LATIN SMALL LETTER TURNED T
ʓ → Z\';  # LATIN SMALL LETTER EZH WITH CURL
ʖ → '|\|\';  # LATIN LETTER INVERTED GLOTTAL STOP
ʗ → '!\';  # LATIN LETTER STRETCHED C
ʚ → '3\';  # LATIN SMALL LETTER CLOSED OPEN E
ʠ → 'G\_<_0';  # LATIN SMALL LETTER Q WITH HOOK
ʣ → d $t z;  # LATIN SMALL LETTER DZ DIGRAPH
ʤ → d $t Z;  # LATIN SMALL LETTER DEZH DIGRAPH
ʥ → d $t 'z\';  # LATIN SMALL LETTER DZ DIGRAPH WITH CURL
ʦ → t $t s;  # LATIN SMALL LETTER TS DIGRAPH
ʧ → t $t S;  # LATIN SMALL LETTER TESH DIGRAPH
ʨ → t $t 's\';  # LATIN SMALL LETTER TC DIGRAPH WITH CURL
˔ → '_r';  # MODIFIER LETTER UP TACK
˕ → '_o';  # MODIFIER LETTER DOWN TACK
\u030A → '_0';  # COMBINING RING ABOVE
φ → 'p\';  # GREEK SMALL LETTER PHI
ꞎ → 'K`';  # LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT

::NFC(NFD);
			]]></tRule>
		</transform>
	</transforms>
</supplementalData>