scuffed-code/icu4c/source/data/translit/dv_dv_Latn_BGN.txt
2017-12-02 00:02:56 +00:00

178 lines
3.6 KiB
Plaintext
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

# © 2016 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html#License
#
# File: dv_dv_Latn_BGN.txt
# Generated from CLDR
#
# BGN/PCGN 1988 Agreement, with modifications 2009
#
# This romanization system supersedes the one which was approved by
# the BGN and the PCGN in 1972. This official system was submitted
# to the PCGN by the Maldivian government in 1987 and approved by BGN
# and PCGN in 1988. The system presented here reflects the 1988 Agreement
# with minor modifications introduced by the government of the Maldives
# in 2009.
#
# In our rules, we also convert Arabic punctuation characters to Latin.
# These appear to be used in Maldivian text, for example in the Universal
# Declaration of Human Rights.
# Global filter: restricts this transform to characters of the Thaana block,
# the six Arabic punctuation marks listed in the second set, and U+FDF2.
# Characters outside this set are not touched by the rules.
::[[:block=thaana:][،؛؟٪٫٬]\uFDF2] ;
# Normalize the input to NFD before the conversion rules run.
::NFD;
# Any character that is not a letter (L), mark (M) or number (N).
# NOTE(review): the word-final rule that uses this set presumably relies on
# ICU letting a negated set also match at the very end of the text - confirm.
$wordBoundary = [^[:L:][:M:][:N:]] ;
# The ten vowel signs U+07A6..U+07AF.
$vowel = [\u07A6-\u07AF] ;
# The single sign U+07B0.
$sukun = \u07B0 ;
# Either kind of sign (sukun or vowel sign) that can follow a consonant.
$sign = [$sukun $vowel] ;
# Pattern reused as the left-hand prefix of every "rule 4" rule below:
# one of the two letters in the set, immediately followed by sukun.
$rule4 = [އށ] $sukun ; # see note 4
### Consonants
# Each letter has a pair of rules:
#   1. the letter preceded by $rule4 - the prefix is consumed together with
#      the letter; a one-letter romanization is doubled (hh, kk, ...) and a
#      digraph gets a leading h (hlh, hdh, ...);
#   2. the letter on its own.
# Rules are tried in file order and the first match wins, so the prefixed
# rule of each pair must stay ahead of the plain one.
# HAA
$rule4 ހ → hh ;
ހ → h ;
# NOONU
# See note 5: "romanized n when appearing without any vowel or auxiliary sign"
# `} $sign` is look-ahead context: the sign must follow but is not consumed.
# With a following sign the output is n / nn; without one, the rules below
# emit n followed by an apostrophe (n' / nn'), not a plain n.
$rule4 ނ } $sign → nn ;
$rule4 ނ → nn\' ;
ނ } $sign → n ;
ނ → n\' ;
# RAA
$rule4 ރ → rr ;
ރ → r ;
# BAA
$rule4 ބ → bb ;
ބ → b ;
# LHAVIYANI
$rule4 ޅ → hlh ;
ޅ → lh;
# KAAFU
$rule4 ކ → kk ;
ކ → k ;
# VAAVU
$rule4 ވ → vv ;
ވ → v ;
# MEEMU
$rule4 މ → mm ;
މ → m ;
# FAAFU
$rule4 ފ → ff ;
ފ → f;
# DHAALU
$rule4 ދ → hdh ;
ދ → dh;
# THAA
# See note 6: "romanized iy when appearing in combination with a supercircle"
# The thaa + sukun rules come before the plain thaa rules because they are
# longer matches that start at the same character.
$rule4 ތ $sukun → hiy ;
$rule4 ތ → hth ;
# U+07A8 (romanized i elsewhere in this file) directly before thaa + sukun is
# consumed as well, so the output is "iy" rather than "iiy".
\u07A8 ތ $sukun → iy ;
ތ $sukun → iy ;
ތ → th ;
# LAAMU
$rule4 ލ → ll ;
ލ → l ;
# GAAFU
$rule4 ގ → gg ;
ގ → g ;
# GNAVIYANI
$rule4 ޏ → hgn ;
ޏ → gn ;
# SEENU
$rule4 ސ → ss ;
ސ → s ;
# DAVIYANI
$rule4 ޑ → dd ;
ޑ → d ;
# ZAVIYANI
$rule4 ޒ → zz ;
ޒ → z ;
# TAVIYANI
$rule4 ޓ → tt ;
ޓ → t ;
# YAA
$rule4 ޔ → yy ;
ޔ → y ;
# PAVIYANI
$rule4 ޕ → pp ;
ޕ → p ;
# JAVIYANI
$rule4 ޖ → jj ;
ޖ → j ;
# CHAVIYANI
$rule4 ޗ → hch ;
ޗ → ch ;
### Borrowed Consonants (See Rule 7)
# Same two-rule pattern as the consonants above: the $rule4-prefixed form
# first (doubled romanization, or a leading h before a digraph), then the
# plain letter. Keep the prefixed rule ahead of the plain one.
# Several outputs here coincide with those of native letters (z, dh, th),
# so the romanization cannot be reversed unambiguously.
# SAADHU
$rule4 ޞ → şş ;
ޞ → ş ;
# SHEENU
$rule4 ޝ → hsh ;
ޝ → sh ;
# ZAA
$rule4 ޜ → zz ;
ޜ → z;
# KHAA
$rule4 ޚ → hkh ;
ޚ → kh;
# HHAA
$rule4 ޙ → ḩḩ ;
ޙ → ḩ ;
# THAALU
$rule4 ޛ → hdh ;
ޛ → dh ;
# TTAA
$rule4 ޘ → hth ;
ޘ → th ;
# WAAVU
$rule4 ޥ → ww ;
ޥ → w ;
# QAAFU
$rule4 ޤ → qq ;
ޤ → q ;
# GHAINU
$rule4 ޣ → hgh ;
ޣ → gh ;
# AINU
# The output is one escaped apostrophe (two when prefixed by $rule4).
$rule4 ޢ → \'\' ;
ޢ → \' ;
# ZO
# Output is z followed by U+0327 (COMBINING CEDILLA).
$rule4 ޡ → z\u0327z\u0327 ;
ޡ → z\u0327 ;
# TO
$rule4 ޠ → ţţ ;
ޠ → ţ ;
# DAADHU
$rule4 ޟ → ḑḑ ;
ޟ → ḑ ;
# NOTE: not in Maldivian BGN system, but for completeness of Thaana block
# NAA
# Output is n followed by U+0332 (COMBINING LOW LINE).
$rule4 ޱ → n\u0332n\u0332 ;
ޱ → n\u0332 ;
# Rule 4 in word-final position
# Only reached when no consonant rule above consumed the $rule4 sequence.
# `} $wordBoundary` is look-ahead context: the boundary character itself is
# not consumed.
$rule4 } $wordBoundary → h;
# SHAVIYANI (placed last to avoid masking)
# This letter is itself one of the two letters in $rule4, so its own rules
# must come after every rule that begins with $rule4; otherwise they would
# match first and hide those rules.
$rule4 ށ → hsh;
ށ → sh;
# Otherwise, these signs are not romanized elsewhere
# Fallbacks with empty output: any remaining $rule4 sequence, any remaining
# sukun, and the bare letter below are deleted.
$rule4 → ;
\u07B0 → ;
އ → ;
# NOTE: not in Maldivian BGN system, but common in names (e.g. Abdullah)
# U+FDF2 directly after a vowel sign: the vowel sign is re-emitted unchanged
# followed by "llāh" (no leading a), and the cursor `|` is placed before the
# vowel sign so that the vowel rules romanize it afterwards. This rule must
# stay ahead of the vowel rules, which would otherwise consume the vowel
# sign first.
($vowel) \uFDF2 → | $1 llāh ;
# U+FDF2 in any other position.
\uFDF2 → allāh;
### Vowels
# One context-free rule per vowel sign, listed in code point order
# (U+07A6 through U+07AF). The keys are disjoint single characters, so the
# relative order of these ten rules does not affect the result.
\u07A6 → a ;    # ABAFILI
\u07A7 → aa ;   # AABAAFILI
\u07A8 → i ;    # IBIFILI
\u07A9 → ee ;   # EEBEEFILI
\u07AA → u ;    # UBUFILI
\u07AB → oo ;   # OOBOOFILI
\u07AC → e ;    # EBEFILI
\u07AD → ey ;   # EYBEYFILI
\u07AE → o ;    # OBOFILI
\u07AF → oa ;   # OABOAFILI
### Arabic punctuation to Latin punctuation
# Keys are written as \u escapes so they cannot be confused with
# similar-looking characters; outputs are quoted literals.
\u060C → ',' ;   # ARABIC COMMA
\u061B → ';' ;   # ARABIC SEMICOLON
\u061F → '?' ;   # ARABIC QUESTION MARK
\u066A → '%' ;   # ARABIC PERCENT SIGN
\u066B → '.' ;   # ARABIC DECIMAL SEPARATOR
\u066C → ',' ;   # ARABIC THOUSANDS SEPARATOR