<?xml version="1.0" encoding="UTF-8" ?>
<!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
<!--
Copyright © 1991-2017 Unicode, Inc.
CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
For terms of use, see http://www.unicode.org/copyright.html
-->
<supplementalData>
	<version number="$Revision: 13868 $"/>
	<transforms>
		<!--
		Persian (fa) to IPA (fa_FONIPA), forward direction only.
		The rule text below is CDATA: notes inside it must be '#' rule comments, not XML comments.
		Rules inside one pass are tried in the order written, so the sequence of rules is significant.
		-->
		<transform source="fa" target="fa_FONIPA" direction="forward" alias="fa-fonipa-t-fa">
			<tRule><![CDATA[
[\u200c \u200d] → ;  # Strip off ZWJ and ZWNJ.
# Decompose, so that combining marks are separate characters the rules below can match.
::NFD;

# Rewrite similarly-looking Arabic letters to Persian.
ي → ی;
ى → ی;
ك → ک;
ە → ه;
# Close this pass, so the rules below see the rewritten letters.
::NULL;

# Character classes used as rule context.
# $VOWEL: the short-vowel marks, maddah, and the letters alef, waw and yeh.
$VOWEL = [ َ ِ  ُ  ٓ ا و ی];
# $BOUNDARY: any character that is not a letter, a mark or a number.
$BOUNDARY = [^[:L:][:M:][:N:]];
# $IPA_CONSONANT: IPA consonant symbols; {...} makes a multi-character string one set member.
# It is only used next to text that earlier rules have already turned into IPA.
$IPA_CONSONANT = [ m n p b t d k ɡ ʔ f v s z ʃ ʒ ʁ ɢ h χ {t͡ʃ} {d͡ʒ} l ɾ ];

# Vowels
# Yeh + shadda is a doubled glide.
یّ → jj;
# Move a shadda in front of the vowel it follows; the cursor (|) is placed before the
# re-emitted vowel, so that vowel is matched again by the rules below.
($VOWEL)ّ → ّ | $1;
# Fatha / kasra + yeh + sukun: diphthongs ending in the glide j.
َیْ → æj;
ِیْ → ej;

# Fatha + waw + sukun, and kasra + yeh.
َوْ → ov;
ِی → iː;

# Heh after fatha is silent.
َه → æ;
# Word-final heh: e, unless the preceding output is already ː, e, o or æ; after e it is dropped.
[^ːeoæ] {ه} $BOUNDARY → e;
[e] {ه} $BOUNDARY → ;
اَ → æ;
# Word-final alef + fathatan. Only the pair inside { } is replaced; the boundary is right
# context and stays in the text, as in the other word-final rules. Without the braces the
# boundary character (for example the space after the word) was replaced together with the pair.
{اً} $BOUNDARY → æn;
َ → æ;
یه → je;
# Word-final heh + hamza above.
{هٔ} $BOUNDARY → jæ;
# Yeh + superscript alef.
یٰ → ɒː;
# Yeh directly before a vowel is the glide j; any other yeh is the long vowel.
{ی} $VOWEL → j;
ی → iː;

# Alef: combinations first, the bare letter last.
# NOTE(review): the yeh rules above come earlier in this pass and may already have consumed
# the yeh that the next rule expects after alef; confirm this rule can still match.
$BOUNDARY {ای} → iː;
ا\u0653 → ɒː;
آ → ɒː;
اِ → e;
اُ → o;
او → uː;
ا → ɒː; # Probably [^$BOUNDARY]
ِ → e;
هِ → e;

# Waw: v before a vowel, uː next to an IPA consonant.
{و} $VOWEL → v;
$IPA_CONSONANT {و} → uː;
ُ{و} $IPA_CONSONANT → uː;

# A waw standing alone between two boundaries.
# NOTE(review): this is the only rule that emits a plain "a"; the fatha rules emit æ. Confirm "va" is intended.
$BOUNDARY {و} $BOUNDARY → va;
# Any waw not matched above is dropped.
و → ;
ُ → o;

# Consonants
# Letters that share a sound are grouped into one set.
پ → p;
ب → b;
[ت ط] → t;
د → d;
ک → k;
گ → ɡ;
[ع ء] → ʔ;
چ → t͡ʃ;
ج → d͡ʒ;
ف → f;
[س ص ث] → s;
[ز ذ ض ظ] → z;
ش → ʃ;
ژ → ʒ;
خ → χ;
غ → ʁ;
ق → ɢ;
ح → h;
م → m;
ن → n;
# Any heh that reaches this rule.
ه → h;
ل → l;
ر → ɾ;

# Sukun carries no sound of its own.
ْ → ;
# Close this pass; the clean-up rules below run on the IPA output.
::NULL;

# TODO: How to handle these?
# A shadda that follows an IPA consonant or a vowel is replaced by a copy ($1) of that
# preceding element, i.e. the element is doubled.
# NOTE(review): "|" inside [...] is probably a literal set member, not alternation; confirm.
([$IPA_CONSONANT|$VOWEL]){ّ} → $1;

# Drop any leftover shadda, hamza above, fathatan or superscript alef.
[ ّ ٔ ً ٰ ] → ;

# Recompose the output.
::NFC;

			]]></tRule>
		</transform>
	</transforms>
</supplementalData>