# © 2016 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html#License
#
# File: InterIndic_Arabic.txt
# Generated from CLDR
#
# Transliteration rules from InterIndic private-use code points to Arabic
# script. The trailing comment on each rule shows the Devanagari character
# that the InterIndic code point on the left-hand side stands for.
#
# Layout: one rule per line. Context-sensitive rules ("x } after" and
# "before { x }") are listed ahead of the unconditional rule for the same
# code point so that they get the first chance to match.

# Any character outside the InterIndic private-use range U+E000..U+E0FF.
$nonword = [^\uE000-\uE0FF];
# Any character that is not a letter, mark or number.
$wordBoundary = [^[:L:][:M:][:N:]];

# Whole-word special cases.
\uE015\uE03F\uE02F\uE03E } $nonword→كيا; # किया
\uE026\uE03F\uE02F\uE03E } $nonword→ديا; # दिया
\uE015\uE03F } $nonword→كي; # कि at word end
\uE039\uE048→هي; # ह\u0948

# Signs.
\uE001 } $nonword→ن; # chandrabindu at end to noon
\uE001→ن; # chandrabindu not at end to noon
\uE002 } $nonword→ن; # anusvara to noon at end
\uE002→ن; # anusvara to noon \u0902
\uE003→ه ا; # visarga to ha + alif ः

# Independent vowels.
\uE004→ا; # short a to alif ऄ
\uE005→ا; # अ
\uE006→ا \u0653; # alif with madda आ
[[:L:][:M:]] {\uE007}→ي; # इ after another letter or mark
\uE007→إ; # इ at beginning of word
[[:L:][:M:]] {\uE008}→ي; # ई after another letter or mark
\uE008→إ; # ई at beginning of word
\uE009→و; # उ
\uE00A→و; # ऊ
\uE00B→ر; # ऋ
\uE00C→ل; # ऌ
\uE00D→ا ي; # ऍ
\uE00E→ي; # ऎ
$wordBoundary {\uE00F} → إي; # word-initial ए
\uE00F } $nonword→ي; # ए use ي when at end
\uE00F→ي; # ए use ي when not at end
\uE010 } $nonword→ا ي; # ऐ use ي when at end
\uE010→ا ي; # ऐ use ي when not at end
\uE011→ا و; # ऑ
\uE012→ا و; # ऒ
\uE013→ا و; # ओ
\uE014→ا و; # औ

# Consonants.
\uE015→ك; # क
\uE016→كه; # ख
\uE017→ج; # ग
\uE018→جه; # घ
\uE019→نج; # ङ
\uE01A→تش; # च
\uE01B→تشه; # छ
\uE01C→ج; # ज
\uE01D→جه; # झ
\uE01E→ن; # ञ
\uE01F→ط; # ट
\uE020→طه; # ठ
\uE021→د; # ड
\uE022→ده; # ढ
\uE023→ن; # ण
\uE024→ت; # त
\uE025→ته; # थ
\uE026→د; # द
\uE027→ده; # ध
\uE028→ن; # न
\uE029→ن; # ऩ
\uE02A→ب; # प
\uE02B→به; # फ
\uE02C→ب; # ब
\uE02D→به; # भ
\uE02E→م; # म
\uE02F→ي; # य
\uE030→ر; # र
\uE031→ر; # ऱ
\uE032→ل; # ल
\uE033→ر; # ळ
\uE034→ر; # ऴ
\uE035→و; # व
\uE036→ش; # श
\uE037→ش; # ष
\uE038→س; # स
\uE039→ه; # ह

# Nukta, avagraha and dependent vowel signs. An empty right-hand side
# deletes the code point.
\uE03C→; # \u093C
\uE03D→; # ऽ
\uE03E→ا; # ा
\uE03F→ي; # ि
\uE040→ي; # ी
\uE041→و; # \u0941
\uE042→و; # \u0942
\uE043→ر; # \u0943
\uE044→ر; # \u0944
\uE045→ن; # \u0945
\uE046→ي; # \u0946
\uE047 } $nonword→ي; # \u0947 use ي when at end
\uE047→ي; # \u0947 use ي when not at end
\uE048 } $nonword→ا ي; # \u0948 use ي when at end
\uE048→ا ي; # \u0948 use ي when not at end
\uE049→و; # ॉ
\uE04A→ا و; # ॊ
\uE04B→و; # ो
\uE04C→ا و; # ौ
\uE04D→; # \u094D
\uE050→ا و; # ॐ
\uE051→; # \u0951
\uE052→; # \u0952
\uE053→; # \u0953
\uE054→; # \u0954

# Nukta consonants and additional vowels.
\uE058→ق; # क़
\uE059→خ; # ख़
\uE05A→غ; # ग़
\uE05B→ز; # ज़
\uE05C→ر; # ड़
\uE05D→ره; # ढ़
\uE05E→ف; # फ़
\uE05F→ي; # य़
\uE060→ر; # ॠ
\uE061→ل; # ॡ
\uE062→ل; # \u0962
\uE063→ل; # \u0963

# Punctuation.
\uE064→۔; # ।
\uE065→۔; # ॥

# Digits. Zero maps to U+0660 ARABIC-INDIC DIGIT ZERO, matching the
# digits ١..٩ below; it is not an ASCII full stop, which it resembles.
\uE066→٠; # ०
\uE067→١; # १
\uE068→٢; # २
\uE069→٣; # ३
\uE06A→٤; # ४
\uE06B→٥; # ५
\uE06C→٦; # ६
\uE06D→٧; # ७
\uE06E→٨; # ८
\uE06F→٩; # ९

# Abbreviation sign becomes an (escaped) full stop.
\uE070→\.; # ॰
\uE082→; # ॽ

# Remove sequences of alif characters.
# For example, transform पाओला → بااولا → باولا.
::null;
# One alif-type letter together with any marks that follow it.
$alif = [أإآا] [:M:]*;
# Keep only the first of two or more consecutive alif groups.
($alif) $alif+ → $1;