# © 2016 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html#License
#
# File: Hebr_Latn.txt
# Generated from CLDR
#
# Transliteration table for Hebrew
# Based on the UNGEGN table at:
# http://www.eki.ee/wgrs/rom1_he.pdf
#
# Exceptions:
# - Accents are added to disambiguate letters
# - Combinations of dagesh, shin/sin dot that produce different
#   letters are not yet encoded.
#
# To test, open:
# http://www.ibm.com/software/globalization/icu/demo/transform
# Click Edit, paste in this file, Save As hebrew-latin/XXX
# (where XXX is a username)
# Now go back to the main window, and try it out.
# Use hebrew-latin/XXX for Output 1, and (Inverse) for Output 2
# Paste in hebrew text in Input, and hit Transliterate.
#
# For more information, see:
# http://icu.sourceforge.net/userguide/Transform.html
#
# NOTE: '#' starts a comment that runs to the end of the physical line, so
# every rule below must stay on its own line; joining a rule onto a comment
# line silently disables it.

# Forward (Hebrew → Latin) global filter: Hebrew-script characters, anything
# with a non-zero canonical combining class, and the explicitly listed code
# points; U+05BD is excluded and therefore passes through untouched.
:: [[:Hebrew:] [:^ccc=0:] [\u05B0-\u05B9\u05BB-\u05BC\u05C1-\u05C2ℵ-ℸ\u0304\u05BF] - [\u05BD]] ;

# Forward: decompose (NFKD) before the rules run.
# Reverse: the parenthesised transform (NFC) is applied instead.
:: nfkd (nfc) ;

# "Another letter follows", optionally after combining marks. Used as an
# after-context on the Latin side of the rules below, so it constrains only
# the Latin → Hebrew direction: the non-final letter form is chosen when a
# letter follows, and the next rule (the final form) catches the rest.
$letterAfter = [:M:]* [:L:] ;

# move longer items here to avoid masking
ח ↔ h\u0331 ;
צ ↔ z\u0331 } $letterAfter;
ץ ↔ z\u0331 ;
ש ↔ s\u0327 ;
ת ↔ t\u0327 ;

# consonants
א ↔ ʼ ;
ב ↔ b ;
ג ↔ g ;
ד ↔ d ;
ה ↔ h ;
ו ↔ w ;
ז ↔ z ;
ט ↔ t ;
י ↔ y ;
כ ↔ k } $letterAfter;
ך ↔ k ;
ל ↔ l ;
מ ↔ m } $letterAfter;
ם ↔ m ;
נ ↔ n } $letterAfter;
ן ↔ n ;
ס ↔ s ;
ע ↔ ʻ ;
פ ↔ p } $letterAfter;
ף ↔ p ;
ק ↔ q ;
ר ↔ r ;

# Yiddish ligatures (forward only): expand to the component letters and put
# the cursor ('|') in front of them so the rules above process the result.
װ → | וו; # HEBREW LIGATURE YIDDISH DOUBLE VAV
ױ → | וי; # HEBREW LIGATURE YIDDISH VAV YOD
ײ → | יי ; # HEBREW LIGATURE YIDDISH DOUBLE YOD

\u05BC ↔ \u0307 ; # dagesh just goes to overdot for now
\u05C1 ↔ \u030C ; # shin dot (sh) ↔ combining caron
\u05C2 ↔ \u0302 ; # sin dot (s) ↔ combining circumflex

# points
# $above matches any run of combining marks whose combining class is neither
# 0 nor 230. In the reverse rules it captures marks sitting between the base
# vowel and its accent, and $1 re-emits them after the Hebrew point.
$above = [^[:ccc=0:][:ccc=230:]]*;
‎\u05B2‎ → à ;
‎\u05B2‎ $1← a ($above) \u0300;
‎\u05B8‎ → á ;
‎\u05B8‎ $1 ← a ($above) \u0301;
‎\u05B1‎ → è ;
‎\u05B1‎ $1 ← e ($above) \u0300;
‎\u05B5‎ → é ;
‎\u05B5‎ $1 ← e ($above) \u0301;
‎\u05B0‎ → e \u0306 ;
‎\u05B0‎ $1 ← e ($above) \u0306;
‎\u05B9‎ → ò ;
‎\u05B9‎ $1 ← o ($above) \u0300;
\u05B4 ↔ i ;
\u05BB ↔ u ;
\u05B7 ↔ a ;
\u05B6 ↔ e ;
\u05B3 ↔ o ;
\u05BF ↔ \u0304 ;

# fallbacks
# Reverse-only rules for Latin letters that the forward direction never emits.
ק ← c ;
פ ← f } $letterAfter;
ף ← f ;
ז ← j ;
ו ← v ;
כס ← x ;

# Reverse only: lowercase the Latin input.
:: (lower);

# Forward: compose (NFC) the Latin output. Reverse: decompose (NFD) the input.
:: nfc (nfd) ;

# Reverse (Latin → Hebrew) global filter.
:: ([[:Latin:] [:^ccc=0:] [ʻ-ʼ\u0300-\u0302\u0307\u030C\u0327\u0331\u0340-\u0341 \u0304 ]]);