diff --git a/data/10.0.0-indic-positional-category.txt b/data/10.0.0-indic-positional-category.txt new file mode 100644 index 0000000..40d8b37 --- /dev/null +++ b/data/10.0.0-indic-positional-category.txt @@ -0,0 +1,697 @@ +# IndicPositionalCategory-10.0.0.txt +# Date: 2017-05-31, 01:07:00 GMT [RP] +# © 2017 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Positional_Category enumerated property +# +# Scope: This property is aimed at the problem of +# the specification of syllabic structure for Indic scripts. +# Because dependent vowels (matras), visible viramas, and other +# characters are placed in notional slots around the consonant (or +# consonant cluster) core of an Indic syllable, there may be +# cooccurrence constraints or other interactions. Also, it may be +# desirable, in cases where more than one such character may occur in +# sequence, as for example, in a top slot and a bottom slot, to +# specify preferred orders for spelling. As such, this property +# is designed primarily to supplement the Indic_Syllabic_Category +# property. +# +# Note that this property is *not* intended as +# a prescriptive property regarding display or font design, +# for a number of reasons. Good font design requires information +# that is outside the context of a character encoding standard, +# and is best handled in other venues. For Indic dependent +# vowels and similar characters, in particular: +# +# 1. Matra placement may vary somewhat based on typeface design. +# 2. Matra placement, even within a single script, may vary +# somewhat according to historic period or local conventions. +# 3. Matra placement may be changed by explicit orthographic reform +# decisions. 
+# 4. Matras may ligate in various ways with a consonant (or even +# other elements of a syllable) instead of occurring in a +# discrete location. +# 5. Matra display may be contextually determined. This is +# notable, for example, in the Tamil script, where the shape +# and placement of -u and -uu vowels depends strongly on +# which consonant they adjoin. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Positional_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. +# +# The scripts assessed as containing dependent vowels or similar characters +# in the structural sense used for the Indic_Positional_Category are the +# following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Grantha, Gujarati, Gurmukhi, Hanunoo, +# Javanese, Kaithi, Kannada, Kharoshthi, Khmer, Khojki, Khudawadi, +# Lao, Lepcha, Limbu, Malayalam, Marchen, Masaram Gondi, Meetei +# Mayek, Modi, Myanmar, Newa, New Tai Lue, Oriya, Rejang, Saurashtra, +# Sharada, Siddham, Sinhala, Soyombo, Sundanese, Syloti Nagri, +# Tagalog, Tagbanwa, Tai Tham, Tai Viet, Takri, Tamil, Telugu, Thai, +# Tibetan, Tirhuta, and Zanabazar Square. +# +# All characters for all other scripts not in that list +# take the default value for this property. +# +# See IndicSyllabicCategory.txt for a slightly more extended +# list of Indic scripts, including those which do not have +# positional characters. Currently, those additional +# Indic scripts without positional characters are +# Kayah Li, Mahajani, Multani, Phags-pa, and Tai Le. 
+# +# Note: The following characters are all assigned the positional category +# Right, but may have different positions in some cases: +# * U+0BC1 TAMIL VOWEL SIGN U and U+0BC2 TAMIL VOWEL SIGN UU have +# contextually variable placement in Tamil. +# * U+0D41 MALAYALAM VOWEL SIGN U and U+0D42 MALAYALAM VOWEL SIGN UU form +# complex ligatures with consonants in older Malayalam orthography. +# * U+11341 GRANTHA VOWEL SIGN U and U+11342 GRANTHA VOWEL SIGN UU have +# contextually variable placement in Grantha. + +# ================================================ + +# Property: Indic_Positional_Category +# +# All code points not explicitly listed for Indic_Positional_Category +# have the value NA (not applicable). +# +# @missing: 0000..10FFFF; NA + +# ------------------------------------------------ + +# Indic_Positional_Category=Right + +0903 ; Right # Mc DEVANAGARI SIGN VISARGA +093B ; Right # Mc DEVANAGARI VOWEL SIGN OOE +093E ; Right # Mc DEVANAGARI VOWEL SIGN AA +0940 ; Right # Mc DEVANAGARI VOWEL SIGN II +0949..094C ; Right # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094F ; Right # Mc DEVANAGARI VOWEL SIGN AW +0982..0983 ; Right # Mc [2] BENGALI SIGN ANUSVARA..BENGALI SIGN VISARGA +09BE ; Right # Mc BENGALI VOWEL SIGN AA +09C0 ; Right # Mc BENGALI VOWEL SIGN II +09D7 ; Right # Mc BENGALI AU LENGTH MARK +0A03 ; Right # Mc GURMUKHI SIGN VISARGA +0A3E ; Right # Mc GURMUKHI VOWEL SIGN AA +0A40 ; Right # Mc GURMUKHI VOWEL SIGN II +0A83 ; Right # Mc GUJARATI SIGN VISARGA +0ABE ; Right # Mc GUJARATI VOWEL SIGN AA +0AC0 ; Right # Mc GUJARATI VOWEL SIGN II +0ACB..0ACC ; Right # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0B02..0B03 ; Right # Mc [2] ORIYA SIGN ANUSVARA..ORIYA SIGN VISARGA +0B3E ; Right # Mc ORIYA VOWEL SIGN AA +0B40 ; Right # Mc ORIYA VOWEL SIGN II +0BBE..0BBF ; Right # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC1..0BC2 ; Right # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BD7 ; Right # Mc TAMIL AU LENGTH MARK 
+0C01..0C03 ; Right # Mc [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN VISARGA +0C41..0C44 ; Right # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C82..0C83 ; Right # Mc [2] KANNADA SIGN ANUSVARA..KANNADA SIGN VISARGA +0CBE ; Right # Mc KANNADA VOWEL SIGN AA +0CC1..0CC4 ; Right # Mc [4] KANNADA VOWEL SIGN U..KANNADA VOWEL SIGN VOCALIC RR +0CD5..0CD6 ; Right # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0D02..0D03 ; Right # Mc [2] MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA +0D3E..0D40 ; Right # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D42 ; Right # Mn [2] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN UU +0D57 ; Right # Mc MALAYALAM AU LENGTH MARK +0D82..0D83 ; Right # Mc [2] SINHALA SIGN ANUSVARAYA..SINHALA SIGN VISARGAYA +0DCF..0DD1 ; Right # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD8 ; Right # Mc SINHALA VOWEL SIGN GAETTA-PILLA +0DDF ; Right # Mc SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Right # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Right # Lo THAI CHARACTER SARA A +0E32..0E33 ; Right # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E45 ; Right # Lo THAI CHARACTER LAKKHANGYAO +0EB0 ; Right # Lo LAO VOWEL SIGN A +0EB2..0EB3 ; Right # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0F3E ; Right # Mc TIBETAN SIGN YAR TSHES +0F7F ; Right # Mc TIBETAN SIGN RNAM BCAD +102B..102C ; Right # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +1038 ; Right # Mc MYANMAR SIGN VISARGA +103B ; Right # Mc MYANMAR CONSONANT SIGN MEDIAL YA +1056..1057 ; Right # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1062..1064 ; Right # Mc [3] MYANMAR VOWEL SIGN SGAW KAREN EU..MYANMAR TONE MARK SGAW KAREN KE PHO +1067..106D ; Right # Mc [7] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1083 ; Right # Mc MYANMAR VOWEL SIGN SHAN AA +1087..108C ; Right # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR 
SIGN SHAN COUNCIL TONE-3 +108F ; Right # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109C ; Right # Mc [3] MYANMAR SIGN KHAMTI TONE-1..MYANMAR VOWEL SIGN AITON A +17B6 ; Right # Mc KHMER VOWEL SIGN AA +17C7..17C8 ; Right # Mc [2] KHMER SIGN REAHMUK..KHMER SIGN YUUKALEAPINTU +1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI +1929..192B ; Right # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1930..1931 ; Right # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Right # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +19B0..19B4 ; Right # Lo [5] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN UU +19B8..19B9 ; Right # Lo [2] NEW TAI LUE VOWEL SIGN OA..NEW TAI LUE VOWEL SIGN UE +19BB..19C0 ; Right # Lo [6] NEW TAI LUE VOWEL SIGN AAY..NEW TAI LUE VOWEL SIGN IY +19C8..19C9 ; Right # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A1A ; Right # Mc BUGINESE VOWEL SIGN O +1A57 ; Right # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A61 ; Right # Mc TAI THAM VOWEL SIGN A +1A63..1A64 ; Right # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A6D ; Right # Mc TAI THAM VOWEL SIGN OY +1B04 ; Right # Mc BALINESE SIGN BISAH +1B35 ; Right # Mc BALINESE VOWEL SIGN TEDUNG +1B44 ; Right # Mc BALINESE ADEG ADEG +1B82 ; Right # Mc SUNDANESE SIGN PANGWISAD +1BA1 ; Right # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA7 ; Right # Mc SUNDANESE VOWEL SIGN PANOLONG +1BAA ; Right # Mc SUNDANESE SIGN PAMAAEH +1BE7 ; Right # Mc BATAK VOWEL SIGN E +1BEA..1BEC ; Right # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BEE ; Right # Mc BATAK VOWEL SIGN U +1BF2..1BF3 ; Right # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +1C24..1C26 ; Right # Mc [3] LEPCHA SUBJOINED LETTER YA..LEPCHA VOWEL SIGN AA +1C2A..1C2B ; Right # Mc [2] LEPCHA VOWEL SIGN U..LEPCHA VOWEL SIGN UU +1CE1 ; Right # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF7 ; Right # Mc VEDIC SIGN ATIKRAMA +A823..A824 ; Right # Mc [2] SYLOTI NAGRI VOWEL SIGN 
A..SYLOTI NAGRI VOWEL SIGN I +A827 ; Right # Mc SYLOTI NAGRI VOWEL SIGN OO +A880..A881 ; Right # Mc [2] SAURASHTRA SIGN ANUSVARA..SAURASHTRA SIGN VISARGA +A8B4..A8C3 ; Right # Mc [16] SAURASHTRA CONSONANT SIGN HAARU..SAURASHTRA VOWEL SIGN AU +A952..A953 ; Right # Mc [2] REJANG CONSONANT SIGN H..REJANG VIRAMA +A983 ; Right # Mc JAVANESE SIGN WIGNYAN +A9B4..A9B5 ; Right # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9BD..A9BE ; Right # Mc [2] JAVANESE CONSONANT SIGN KERET..JAVANESE CONSONANT SIGN PENGKAL +AA33 ; Right # Mc CHAM CONSONANT SIGN YA +AA4D ; Right # Mc CHAM CONSONANT SIGN FINAL H +AA7B ; Right # Mc MYANMAR SIGN PAO KAREN TONE +AA7D ; Right # Mc MYANMAR SIGN TAI LAING TONE-5 +AAB1 ; Right # Lo TAI VIET VOWEL AA +AABA ; Right # Lo TAI VIET VOWEL UA +AABD ; Right # Lo TAI VIET VOWEL AN +AAEF ; Right # Mc MEETEI MAYEK VOWEL SIGN AAU +AAF5 ; Right # Mc MEETEI MAYEK VOWEL SIGN VISARGA +ABE3..ABE4 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE6..ABE7 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE9..ABEA ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +ABEC ; Right # Mc MEETEI MAYEK LUM IYEK +11000 ; Right # Mc BRAHMI SIGN CANDRABINDU +11002 ; Right # Mc BRAHMI SIGN VISARGA +11082 ; Right # Mc KAITHI SIGN VISARGA +110B0 ; Right # Mc KAITHI VOWEL SIGN AA +110B2 ; Right # Mc KAITHI VOWEL SIGN II +110B7..110B8 ; Right # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11182 ; Right # Mc SHARADA SIGN VISARGA +111B3 ; Right # Mc SHARADA VOWEL SIGN AA +111B5 ; Right # Mc SHARADA VOWEL SIGN II +111C0 ; Right # Mc SHARADA SIGN VIRAMA +1122C..1122E ; Right # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +11235 ; Right # Mc KHOJKI SIGN VIRAMA +112E0 ; Right # Mc KHUDAWADI VOWEL SIGN AA +112E2 ; Right # Mc KHUDAWADI VOWEL SIGN II +11302..11303 ; Right # Mc [2] GRANTHA SIGN ANUSVARA..GRANTHA SIGN VISARGA +1133E..1133F ; Right # Mc [2] GRANTHA VOWEL 
SIGN AA..GRANTHA VOWEL SIGN I +11341..11344 ; Right # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +1134D ; Right # Mc GRANTHA SIGN VIRAMA +11357 ; Right # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Right # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435 ; Right # Mc NEWA VOWEL SIGN AA +11437 ; Right # Mc NEWA VOWEL SIGN II +11440..11441 ; Right # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +11445 ; Right # Mc NEWA SIGN VISARGA +114B0 ; Right # Mc TIRHUTA VOWEL SIGN AA +114B2 ; Right # Mc TIRHUTA VOWEL SIGN II +114BD ; Right # Mc TIRHUTA VOWEL SIGN SHORT O +114C1 ; Right # Mc TIRHUTA SIGN VISARGA +115AF ; Right # Mc SIDDHAM VOWEL SIGN AA +115B1 ; Right # Mc SIDDHAM VOWEL SIGN II +115BE ; Right # Mc SIDDHAM SIGN VISARGA +11630..11632 ; Right # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +1163B..1163C ; Right # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +1163E ; Right # Mc MODI SIGN VISARGA +116AC ; Right # Mc TAKRI SIGN VISARGA +116AF ; Right # Mc TAKRI VOWEL SIGN II +116B6 ; Right # Mc TAKRI SIGN VIRAMA +11720..11721 ; Right # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +11A39 ; Right # Mc ZANABAZAR SQUARE SIGN VISARGA +11A57..11A58 ; Right # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A97 ; Right # Mc SOYOMBO SIGN VISARGA +11C2F ; Right # Mc BHAIKSUKI VOWEL SIGN AA +11C3E ; Right # Mc BHAIKSUKI SIGN VISARGA +11CA9 ; Right # Mc MARCHEN SUBJOINED LETTER YA +11CB4 ; Right # Mc MARCHEN VOWEL SIGN O + +# Indic_Positional_Category=Left + +093F ; Left # Mc DEVANAGARI VOWEL SIGN I +094E ; Left # Mc DEVANAGARI VOWEL SIGN PRISHTHAMATRA E +09BF ; Left # Mc BENGALI VOWEL SIGN I +09C7..09C8 ; Left # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +0A3F ; Left # Mc GURMUKHI VOWEL SIGN I +0ABF ; Left # Mc GUJARATI VOWEL SIGN I +0B47 ; Left # Mc ORIYA VOWEL SIGN E +0BC6..0BC8 ; Left # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0D46..0D48 ; Left # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0DD9 ; Left # 
Mc SINHALA VOWEL SIGN KOMBUVA +0DDB ; Left # Mc SINHALA VOWEL SIGN KOMBU DEKA +0F3F ; Left # Mc TIBETAN SIGN MAR TSHES +1031 ; Left # Mc MYANMAR VOWEL SIGN E +1084 ; Left # Mc MYANMAR VOWEL SIGN SHAN E +17C1..17C3 ; Left # Mc [3] KHMER VOWEL SIGN E..KHMER VOWEL SIGN AI +1A19 ; Left # Mc BUGINESE VOWEL SIGN E +1A55 ; Left # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A6E..1A72 ; Left # Mc [5] TAI THAM VOWEL SIGN E..TAI THAM VOWEL SIGN THAM AI +1B3E..1B3F ; Left # Mc [2] BALINESE VOWEL SIGN TALING..BALINESE VOWEL SIGN TALING REPA +1BA6 ; Left # Mc SUNDANESE VOWEL SIGN PANAELAENG +1C27..1C28 ; Left # Mc [2] LEPCHA VOWEL SIGN I..LEPCHA VOWEL SIGN O +1C34..1C35 ; Left # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A9BA..A9BB ; Left # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +AA2F..AA30 ; Left # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA34 ; Left # Mc CHAM CONSONANT SIGN RA +AAEB ; Left # Mc MEETEI MAYEK VOWEL SIGN II +AAEE ; Left # Mc MEETEI MAYEK VOWEL SIGN AU +110B1 ; Left # Mc KAITHI VOWEL SIGN I +1112C ; Left # Mc CHAKMA VOWEL SIGN E +111B4 ; Left # Mc SHARADA VOWEL SIGN I +112E1 ; Left # Mc KHUDAWADI VOWEL SIGN I +11347..11348 ; Left # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +11436 ; Left # Mc NEWA VOWEL SIGN I +114B1 ; Left # Mc TIRHUTA VOWEL SIGN I +114B9 ; Left # Mc TIRHUTA VOWEL SIGN E +115B0 ; Left # Mc SIDDHAM VOWEL SIGN I +115B8 ; Left # Mc SIDDHAM VOWEL SIGN E +116AE ; Left # Mc TAKRI VOWEL SIGN I +11726 ; Left # Mc AHOM VOWEL SIGN E +11CB1 ; Left # Mc MARCHEN VOWEL SIGN I + +# Indic_Positional_Category=Visual_Order_Left + +# These are dependent vowels that occur to the left of the consonant +# letter in a syllable, but which occur in scripts using the visual order +# model, instead of the logical order model. Because of the different +# model, these left-side vowels occur first in the backing store (before +# the consonant letter) and are not reordered during text rendering. 
+# +# [Derivation: Logical_Order_Exception=Yes] + +0E40..0E44 ; Visual_Order_Left # Lo [5] THAI CHARACTER SARA E..THAI CHARACTER SARA AI MAIMALAI +0EC0..0EC4 ; Visual_Order_Left # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +19B5..19B7 ; Visual_Order_Left # Lo [3] NEW TAI LUE VOWEL SIGN E..NEW TAI LUE VOWEL SIGN O +19BA ; Visual_Order_Left # Lo NEW TAI LUE VOWEL SIGN AY +AAB5..AAB6 ; Visual_Order_Left # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB9 ; Visual_Order_Left # Lo TAI VIET VOWEL UEA +AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL AY + +# Indic_Positional_Category=Left_And_Right + +09CB..09CC ; Left_And_Right # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +0B4B ; Left_And_Right # Mc ORIYA VOWEL SIGN O +0BCA..0BCC ; Left_And_Right # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0D4A..0D4C ; Left_And_Right # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0DDC ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA +0DDE ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA +17C0 ; Left_And_Right # Mc KHMER VOWEL SIGN IE +17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU +1B40..1B41 ; Left_And_Right # Mc [2] BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1134B..1134C ; Left_And_Right # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +114BC ; Left_And_Right # Mc TIRHUTA VOWEL SIGN O +114BE ; Left_And_Right # Mc TIRHUTA VOWEL SIGN AU +115BA ; Left_And_Right # Mc SIDDHAM VOWEL SIGN O + +# Indic_Positional_Category=Top + +0900..0902 ; Top # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +093A ; Top # Mn DEVANAGARI VOWEL SIGN OE +0945..0948 ; Top # Mn [4] DEVANAGARI VOWEL SIGN CANDRA E..DEVANAGARI VOWEL SIGN AI +0951 ; Top # Mn DEVANAGARI STRESS SIGN UDATTA +0953..0955 ; Top # Mn [3] DEVANAGARI GRAVE ACCENT..DEVANAGARI VOWEL SIGN CANDRA LONG E +0981 ; Top # Mn BENGALI SIGN CANDRABINDU +0A01..0A02 ; Top # Mn [2] GURMUKHI 
SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A47..0A48 ; Top # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Top # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0A70..0A71 ; Top # Mn [2] GURMUKHI TIPPI..GURMUKHI ADDAK +0A81..0A82 ; Top # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0AC5 ; Top # Mn GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Top # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AFA..0AFF ; Top # Mn [6] GUJARATI SIGN SUKUN..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B01 ; Top # Mn ORIYA SIGN CANDRABINDU +0B3F ; Top # Mn ORIYA VOWEL SIGN I +0B56 ; Top # Mn ORIYA AI LENGTH MARK +0B82 ; Top # Mn TAMIL SIGN ANUSVARA +0BC0 ; Top # Mn TAMIL VOWEL SIGN II +0BCD ; Top # Mn TAMIL SIGN VIRAMA +0C00 ; Top # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C3E..0C40 ; Top # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C46..0C47 ; Top # Mn [2] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN EE +0C4A..0C4D ; Top # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA +0C55 ; Top # Mn TELUGU LENGTH MARK +0C81 ; Top # Mn KANNADA SIGN CANDRABINDU +0CBF ; Top # Mn KANNADA VOWEL SIGN I +0CC6 ; Top # Mn KANNADA VOWEL SIGN E +0CCC..0CCD ; Top # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA +0D00..0D01 ; Top # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D3B..0D3C ; Top # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0D4D ; Top # Mn MALAYALAM SIGN VIRAMA +0DCA ; Top # Mn SINHALA SIGN AL-LAKUNA +0DD2..0DD3 ; Top # Mn [2] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN DIGA IS-PILLA +0E31 ; Top # Mn THAI CHARACTER MAI HAN-AKAT +0E34..0E37 ; Top # Mn [4] THAI CHARACTER SARA I..THAI CHARACTER SARA UEE +0E47..0E4E ; Top # Mn [8] THAI CHARACTER MAITAIKHU..THAI CHARACTER YAMAKKAN +0EB1 ; Top # Mn LAO VOWEL SIGN MAI KAN +0EB4..0EB7 ; Top # Mn [4] LAO VOWEL SIGN I..LAO VOWEL SIGN YY +0EBB ; Top # Mn LAO VOWEL SIGN MAI KON +0EC8..0ECD ; Top # Mn [6] LAO TONE MAI EK..LAO NIGGAHITA +0F39 
; Top # Mn TIBETAN MARK TSA -PHRU +0F72 ; Top # Mn TIBETAN VOWEL SIGN I +0F7A..0F7E ; Top # Mn [5] TIBETAN VOWEL SIGN E..TIBETAN SIGN RJES SU NGA RO +0F80 ; Top # Mn TIBETAN VOWEL SIGN REVERSED I +0F82..0F83 ; Top # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +0F86..0F87 ; Top # Mn [2] TIBETAN SIGN LCI RTAGS..TIBETAN SIGN YANG RTAGS +102D..102E ; Top # Mn [2] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN II +1032..1036 ; Top # Mn [5] MYANMAR VOWEL SIGN AI..MYANMAR SIGN ANUSVARA +103A ; Top # Mn MYANMAR SIGN ASAT +1071..1074 ; Top # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1085..1086 ; Top # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109D ; Top # Mn MYANMAR VOWEL SIGN AITON AI +1712 ; Top # Mn TAGALOG VOWEL SIGN I +1732 ; Top # Mn HANUNOO VOWEL SIGN I +1752 ; Top # Mn BUHID VOWEL SIGN I +1772 ; Top # Mn TAGBANWA VOWEL SIGN I +17B7..17BA ; Top # Mn [4] KHMER VOWEL SIGN I..KHMER VOWEL SIGN YY +17C6 ; Top # Mn KHMER SIGN NIKAHIT +17C9..17D1 ; Top # Mn [9] KHMER SIGN MUUSIKATOAN..KHMER SIGN VIRIAM +17D3 ; Top # Mn KHMER SIGN BATHAMASAT +17DD ; Top # Mn KHMER SIGN ATTHACAN +1920..1921 ; Top # Mn [2] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN I +1927..1928 ; Top # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Top # Mn LIMBU SIGN KEMPHRENG +1A17 ; Top # Mn BUGINESE VOWEL SIGN I +1A1B ; Top # Mn BUGINESE VOWEL SIGN AE +1A58..1A5A ; Top # Mn [3] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN LOW PA +1A62 ; Top # Mn TAI THAM VOWEL SIGN MAI SAT +1A65..1A68 ; Top # Mn [4] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN UUE +1A6B ; Top # Mn TAI THAM VOWEL SIGN O +1A73..1A7C ; Top # Mn [10] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN KHUEN-LUE KARAN +1B00..1B03 ; Top # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG +1B34 ; Top # Mn BALINESE SIGN REREKAN +1B36..1B37 ; Top # Mn [2] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN ULU SARI +1B42 ; Top # Mn BALINESE VOWEL SIGN PEPET +1B6B ; Top # Mn BALINESE 
MUSICAL SYMBOL COMBINING TEGEH +1B6D..1B73 ; Top # Mn [7] BALINESE MUSICAL SYMBOL COMBINING KEMPUL..BALINESE MUSICAL SYMBOL COMBINING GONG +1B80..1B81 ; Top # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR +1BA4 ; Top # Mn SUNDANESE VOWEL SIGN PANGHULU +1BA8..1BA9 ; Top # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE6 ; Top # Mn BATAK SIGN TOMPI +1BE8..1BE9 ; Top # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BED ; Top # Mn BATAK VOWEL SIGN KARO O +1BEF..1BF1 ; Top # Mn [3] BATAK VOWEL SIGN U FOR SIMALUNGUN SA..BATAK CONSONANT SIGN H +1C2D..1C33 ; Top # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +1C36 ; Top # Mn LEPCHA SIGN RAN +1CD0..1CD2 ; Top # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CDA..1CDB ; Top # Mn [2] VEDIC TONE DOUBLE SVARITA..VEDIC TONE TRIPLE SVARITA +1CE0 ; Top # Mn VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CF4 ; Top # Mn VEDIC TONE CANDRA ABOVE +1DFB ; Top # Mn COMBINING DELETION MARK +A806 ; Top # Mn SYLOTI NAGRI SIGN HASANTA +A80B ; Top # Mn SYLOTI NAGRI SIGN ANUSVARA +A826 ; Top # Mn SYLOTI NAGRI VOWEL SIGN E +A8C5 ; Top # Mn SAURASHTRA SIGN CANDRABINDU +A8E0..A8F1 ; Top # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +A94A ; Top # Mn REJANG VOWEL SIGN AI +A94F..A951 ; Top # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A980..A982 ; Top # Mn [3] JAVANESE SIGN PANYANGGA..JAVANESE SIGN LAYAR +A9B3 ; Top # Mn JAVANESE SIGN CECAK TELU +A9B6..A9B7 ; Top # Mn [2] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN WULU MELIK +A9BC ; Top # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Top # Mn MYANMAR SIGN SHAN SAW +AA29..AA2C ; Top # Mn [4] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN EI +AA2E ; Top # Mn CHAM VOWEL SIGN OE +AA31 ; Top # Mn CHAM VOWEL SIGN AU +AA43 ; Top # Mn CHAM CONSONANT SIGN FINAL NG +AA4C ; Top # Mn CHAM CONSONANT SIGN FINAL M +AA7C ; Top # Mn MYANMAR SIGN TAI LAING TONE-2 +AAB0 ; Top # Mn TAI VIET MAI KANG +AAB2..AAB3 ; Top # Mn [2] 
TAI VIET VOWEL I..TAI VIET VOWEL UE +AAB7..AAB8 ; Top # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AABE..AABF ; Top # Mn [2] TAI VIET VOWEL AM..TAI VIET TONE MAI EK +AAC1 ; Top # Mn TAI VIET TONE MAI THO +AAED ; Top # Mn MEETEI MAYEK VOWEL SIGN AAI +ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP +10A05 ; Top # Mn KHAROSHTHI VOWEL SIGN E +10A0F ; Top # Mn KHAROSHTHI SIGN VISARGA +10A38 ; Top # Mn KHAROSHTHI SIGN BAR ABOVE +11001 ; Top # Mn BRAHMI SIGN ANUSVARA +11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II +11042..11046 ; Top # Mn [5] BRAHMI VOWEL SIGN E..BRAHMI VIRAMA +11080..11081 ; Top # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI VOWEL SIGN AI +11100..11102 ; Top # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA +11127..11129 ; Top # Mn [3] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN II +1112D ; Top # Mn CHAKMA VOWEL SIGN AI +11130 ; Top # Mn CHAKMA VOWEL SIGN OI +11134 ; Top # Mn CHAKMA MAAYYAA +11180..11181 ; Top # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +111BC..111BE ; Top # Mn [3] SHARADA VOWEL SIGN E..SHARADA VOWEL SIGN O +111CB ; Top # Mn SHARADA VOWEL MODIFIER MARK +11230..11231 ; Top # Mn [2] KHOJKI VOWEL SIGN E..KHOJKI VOWEL SIGN AI +11234 ; Top # Mn KHOJKI SIGN ANUSVARA +11236..11237 ; Top # Mn [2] KHOJKI SIGN NUKTA..KHOJKI SIGN SHADDA +1123E ; Top # Mn KHOJKI SIGN SUKUN +112DF ; Top # Mn KHUDAWADI SIGN ANUSVARA +112E5..112E8 ; Top # Mn [4] KHUDAWADI VOWEL SIGN E..KHUDAWADI VOWEL SIGN AU +11301 ; Top # Mn GRANTHA SIGN CANDRABINDU +11340 ; Top # Mn GRANTHA VOWEL SIGN II +11366..1136C ; Top # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Top # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA +1143E..1143F ; Top # Mn [2] NEWA VOWEL SIGN E..NEWA VOWEL SIGN AI +11443..11444 ; Top # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +114BA ; Top # Mn TIRHUTA VOWEL SIGN SHORT E +114BF..114C0 ; Top # Mn [2] 
TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Top # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +11639..1163A ; Top # Mn [2] MODI VOWEL SIGN E..MODI VOWEL SIGN AI +1163D ; Top # Mn MODI SIGN ANUSVARA +11640 ; Top # Mn MODI SIGN ARDHACANDRA +116AB ; Top # Mn TAKRI SIGN ANUSVARA +116AD ; Top # Mn TAKRI VOWEL SIGN AA +116B2..116B5 ; Top # Mn [4] TAKRI VOWEL SIGN E..TAKRI VOWEL SIGN AU +1171F ; Top # Mn AHOM CONSONANT SIGN MEDIAL LIGATING RA +11722..11723 ; Top # Mn [2] AHOM VOWEL SIGN I..AHOM VOWEL SIGN II +11727 ; Top # Mn AHOM VOWEL SIGN AW +11729..1172B ; Top # Mn [3] AHOM VOWEL SIGN AI..AHOM SIGN KILLER +11A01 ; Top # Mn ZANABAZAR SQUARE VOWEL SIGN I +11A04..11A09 ; Top # Mn [6] ZANABAZAR SQUARE VOWEL SIGN E..ZANABAZAR SQUARE VOWEL SIGN REVERSED I +11A35..11A38 ; Top # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A51 ; Top # Mn SOYOMBO VOWEL SIGN I +11A54..11A56 ; Top # Mn [3] SOYOMBO VOWEL SIGN E..SOYOMBO VOWEL SIGN OE +11A96 ; Top # Mn SOYOMBO SIGN ANUSVARA +11A98 ; Top # Mn SOYOMBO GEMINATION MARK +11C30..11C31 ; Top # Mn [2] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN II +11C38..11C3D ; Top # Mn [6] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI SIGN ANUSVARA +11CB3 ; Top # Mn MARCHEN VOWEL SIGN E +11CB5..11CB6 ; Top # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D31..11D35 ; Top # Mn [5] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN UU +11D3A ; Top # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Top # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F..11D41 ; Top # Mn [3] MASARAM GONDI VOWEL SIGN AU..MASARAM GONDI SIGN VISARGA +11D43 ; Top # Mn MASARAM GONDI SIGN CANDRA + +# Indic_Positional_Category=Bottom + +093C ; Bottom # Mn DEVANAGARI SIGN NUKTA +0941..0944 ; Bottom # Mn [4] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN VOCALIC RR +094D ; Bottom # Mn DEVANAGARI SIGN VIRAMA +0952 ; Bottom # Mn DEVANAGARI STRESS SIGN ANUDATTA +0956..0957 ; Bottom # Mn [2] DEVANAGARI 
VOWEL SIGN UE..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BC ; Bottom # Mn BENGALI SIGN NUKTA +09C1..09C4 ; Bottom # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09CD ; Bottom # Mn BENGALI SIGN VIRAMA +09E2..09E3 ; Bottom # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3C ; Bottom # Mn GURMUKHI SIGN NUKTA +0A41..0A42 ; Bottom # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A4D ; Bottom # Mn GURMUKHI SIGN VIRAMA +0A75 ; Bottom # Mn GURMUKHI SIGN YAKASH +0ABC ; Bottom # Mn GUJARATI SIGN NUKTA +0AC1..0AC4 ; Bottom # Mn [4] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN VOCALIC RR +0ACD ; Bottom # Mn GUJARATI SIGN VIRAMA +0AE2..0AE3 ; Bottom # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3C ; Bottom # Mn ORIYA SIGN NUKTA +0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B4D ; Bottom # Mn ORIYA SIGN VIRAMA +0B62..0B63 ; Bottom # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0C56 ; Bottom # Mn TELUGU AI LENGTH MARK +0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBC ; Bottom # Mn KANNADA SIGN NUKTA +0CE2..0CE3 ; Bottom # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D43..0D44 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC R..MALAYALAM VOWEL SIGN VOCALIC RR +0D62..0D63 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DD4 ; Bottom # Mn SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Bottom # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0E38..0E3A ; Bottom # Mn [3] THAI CHARACTER SARA U..THAI CHARACTER PHINTHU +0EB8..0EB9 ; Bottom # Mn [2] LAO VOWEL SIGN U..LAO VOWEL SIGN UU +0EBC ; Bottom # Mn LAO SEMIVOWEL SIGN LO +0F18..0F19 ; Bottom # Mn [2] TIBETAN ASTROLOGICAL SIGN -KHYUD PA..TIBETAN ASTROLOGICAL SIGN SDONG TSHUGS +0F35 ; Bottom # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Bottom # Mn 
TIBETAN MARK NGAS BZUNG SGOR RTAGS +0F71 ; Bottom # Mn TIBETAN VOWEL SIGN AA +0F74..0F75 ; Bottom # Mn [2] TIBETAN VOWEL SIGN U..TIBETAN VOWEL SIGN UU +0F84 ; Bottom # Mn TIBETAN MARK HALANTA +0F8D..0F97 ; Bottom # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Bottom # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +0FC6 ; Bottom # Mn TIBETAN SYMBOL PADMA GDAN +102F..1030 ; Bottom # Mn [2] MYANMAR VOWEL SIGN U..MYANMAR VOWEL SIGN UU +1037 ; Bottom # Mn MYANMAR SIGN DOT BELOW +103D..103E ; Bottom # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +1058..1059 ; Bottom # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +105E..1060 ; Bottom # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Bottom # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +108D ; Bottom # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +1713..1714 ; Bottom # Mn [2] TAGALOG VOWEL SIGN U..TAGALOG SIGN VIRAMA +1733..1734 ; Bottom # Mn [2] HANUNOO VOWEL SIGN U..HANUNOO SIGN PAMUDPOD +1753 ; Bottom # Mn BUHID VOWEL SIGN U +1773 ; Bottom # Mn TAGBANWA VOWEL SIGN U +17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA +1922 ; Bottom # Mn LIMBU VOWEL SIGN U +1932 ; Bottom # Mn LIMBU SMALL LETTER ANUSVARA +1939 ; Bottom # Mn LIMBU SIGN MUKPHRENG +193B ; Bottom # Mn LIMBU SIGN SA-I +1A18 ; Bottom # Mn BUGINESE VOWEL SIGN U +1A56 ; Bottom # Mn TAI THAM CONSONANT SIGN MEDIAL LA +1A5B..1A5E ; Bottom # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1A69..1A6A ; Bottom # Mn [2] TAI THAM VOWEL SIGN U..TAI THAM VOWEL SIGN UU +1A6C ; Bottom # Mn TAI THAM VOWEL SIGN OA BELOW +1A7F ; Bottom # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1B38..1B3A ; Bottom # Mn [3] BALINESE VOWEL SIGN SUKU..BALINESE VOWEL SIGN RA REPA +1B6C ; Bottom # Mn BALINESE MUSICAL SYMBOL COMBINING ENDEP +1BA2..1BA3 ; Bottom # Mn [2] SUNDANESE CONSONANT 
SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BA5 ; Bottom # Mn SUNDANESE VOWEL SIGN PANYUKU +1BAC..1BAD ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C2C ; Bottom # Mn LEPCHA VOWEL SIGN E +1C37 ; Bottom # Mn LEPCHA SIGN NUKTA +1CD5..1CD9 ; Bottom # Mn [5] VEDIC TONE YAJURVEDIC AGGRAVATED INDEPENDENT SVARITA..VEDIC TONE YAJURVEDIC KATHAKA INDEPENDENT SVARITA SCHROEDER +1CDC..1CDF ; Bottom # Mn [4] VEDIC TONE KATHAKA ANUDATTA..VEDIC TONE THREE DOTS BELOW +1CED ; Bottom # Mn VEDIC SIGN TIRYAK +A825 ; Bottom # Mn SYLOTI NAGRI VOWEL SIGN U +A8C4 ; Bottom # Mn SAURASHTRA SIGN VIRAMA +A92B..A92D ; Bottom # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +A947..A949 ; Bottom # Mn [3] REJANG VOWEL SIGN I..REJANG VOWEL SIGN E +A94B..A94E ; Bottom # Mn [4] REJANG VOWEL SIGN O..REJANG VOWEL SIGN EA +A9B8..A9B9 ; Bottom # Mn [2] JAVANESE VOWEL SIGN SUKU..JAVANESE VOWEL SIGN SUKU MENDUT +AA2D ; Bottom # Mn CHAM VOWEL SIGN U +AA32 ; Bottom # Mn CHAM VOWEL SIGN UE +AA35..AA36 ; Bottom # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +AAB4 ; Bottom # Mn TAI VIET VOWEL U +AAEC ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UU +ABE8 ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK +10A02..10A03 ; Bottom # Mn [2] KHAROSHTHI VOWEL SIGN U..KHAROSHTHI VOWEL SIGN VOCALIC R +10A0C..10A0E ; Bottom # Mn [3] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN ANUSVARA +10A39..10A3A ; Bottom # Mn [2] KHAROSHTHI SIGN CAUDA..KHAROSHTHI SIGN DOT BELOW +1103C..11041 ; Bottom # Mn [6] BRAHMI VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL +110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU +110B9..110BA ; Bottom # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +1112A..1112B ; Bottom # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU +11131..11132 ; Bottom # Mn [2] CHAKMA O MARK..CHAKMA AU MARK +11173 ; Bottom # Mn MAHAJANI SIGN NUKTA +111B6..111BB ; Bottom # Mn [6] SHARADA VOWEL SIGN U..SHARADA 
VOWEL SIGN VOCALIC LL +111CC ; Bottom # Mn SHARADA EXTRA SHORT VOWEL MARK +1122F ; Bottom # Mn KHOJKI VOWEL SIGN U +112E3..112E4 ; Bottom # Mn [2] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN UU +112E9..112EA ; Bottom # Mn [2] KHUDAWADI SIGN NUKTA..KHUDAWADI SIGN VIRAMA +11438..1143D ; Bottom # Mn [6] NEWA VOWEL SIGN U..NEWA VOWEL SIGN VOCALIC LL +11442 ; Bottom # Mn NEWA SIGN VIRAMA +11446 ; Bottom # Mn NEWA SIGN NUKTA +114B3..114B8 ; Bottom # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114C2..114C3 ; Bottom # Mn [2] TIRHUTA SIGN VIRAMA..TIRHUTA SIGN NUKTA +115B2..115B5 ; Bottom # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115BF..115C0 ; Bottom # Mn [2] SIDDHAM SIGN VIRAMA..SIDDHAM SIGN NUKTA +115DC..115DD ; Bottom # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11633..11638 ; Bottom # Mn [6] MODI VOWEL SIGN U..MODI VOWEL SIGN VOCALIC LL +1163F ; Bottom # Mn MODI SIGN VIRAMA +116B0..116B1 ; Bottom # Mn [2] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN UU +116B7 ; Bottom # Mn TAKRI SIGN NUKTA +1171D ; Bottom # Mn AHOM CONSONANT SIGN MEDIAL LA +11724..11725 ; Bottom # Mn [2] AHOM VOWEL SIGN U..AHOM VOWEL SIGN UU +11728 ; Bottom # Mn AHOM VOWEL SIGN O +11A02..11A03 ; Bottom # Mn [2] ZANABAZAR SQUARE VOWEL SIGN UE..ZANABAZAR SQUARE VOWEL SIGN U +11A0A ; Bottom # Mn ZANABAZAR SQUARE VOWEL LENGTH MARK +11A33..11A34 ; Bottom # Mn [2] ZANABAZAR SQUARE FINAL CONSONANT MARK..ZANABAZAR SQUARE SIGN VIRAMA +11A3B..11A3E ; Bottom # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11A52..11A53 ; Bottom # Mn [2] SOYOMBO VOWEL SIGN UE..SOYOMBO VOWEL SIGN U +11A59..11A5B ; Bottom # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11A8A..11A95 ; Bottom # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A +11C32..11C36 ; Bottom # Mn [5] BHAIKSUKI VOWEL SIGN U..BHAIKSUKI VOWEL SIGN VOCALIC L +11C3F ; Bottom # Mn BHAIKSUKI SIGN VIRAMA +11C92..11CA7 ; Bottom # 
Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CAA..11CB0 ; Bottom # Mn [7] MARCHEN SUBJOINED LETTER RA..MARCHEN VOWEL SIGN AA +11CB2 ; Bottom # Mn MARCHEN VOWEL SIGN U +11D36 ; Bottom # Mn MASARAM GONDI VOWEL SIGN VOCALIC R +11D42 ; Bottom # Mn MASARAM GONDI SIGN NUKTA +11D44 ; Bottom # Mn MASARAM GONDI SIGN HALANTA +11D47 ; Bottom # Mn MASARAM GONDI RA-KARA + +# Indic_Positional_Category=Top_And_Bottom + +0C48 ; Top_And_Bottom # Mn TELUGU VOWEL SIGN AI +0F73 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN II +0F76..0F79 ; Top_And_Bottom # Mn [4] TIBETAN VOWEL SIGN VOCALIC R..TIBETAN VOWEL SIGN VOCALIC LL +0F81 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN REVERSED II +1B3C ; Top_And_Bottom # Mn BALINESE VOWEL SIGN LA LENGA +1112E..1112F ; Top_And_Bottom # Mn [2] CHAKMA VOWEL SIGN O..CHAKMA VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Right + +0AC9 ; Top_And_Right # Mc GUJARATI VOWEL SIGN CANDRA O +0B57 ; Top_And_Right # Mc ORIYA AU LENGTH MARK +0CC0 ; Top_And_Right # Mc KANNADA VOWEL SIGN II +0CC7..0CC8 ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +1925..1926 ; Top_And_Right # Mc [2] LIMBU VOWEL SIGN OO..LIMBU VOWEL SIGN AU +1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG +111BF ; Top_And_Right # Mc SHARADA VOWEL SIGN AU +11232..11233 ; Top_And_Right # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Left + +0B48 ; Top_And_Left # Mc ORIYA VOWEL SIGN AI +0DDA ; Top_And_Left # Mc SINHALA VOWEL SIGN DIGA KOMBUVA +17BE ; Top_And_Left # Mc KHMER VOWEL SIGN OE +1C29 ; Top_And_Left # Mc LEPCHA VOWEL SIGN OO +114BB ; Top_And_Left # Mc TIRHUTA VOWEL SIGN AI +115B9 ; Top_And_Left # Mc SIDDHAM VOWEL SIGN AI + +# Indic_Positional_Category=Top_And_Left_And_Right + +0B4C ; Top_And_Left_And_Right # Mc ORIYA VOWEL SIGN AU +0DDD ; Top_And_Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA +17BF 
; Top_And_Left_And_Right # Mc KHMER VOWEL SIGN YA +115BB ; Top_And_Left_And_Right # Mc SIDDHAM VOWEL SIGN AU + +# Indic_Positional_Category=Bottom_And_Right + +1B3B ; Bottom_And_Right # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +A9C0 ; Bottom_And_Right # Mc JAVANESE PANGKON + +# Indic_Positional_Category=Bottom_And_Left + +A9BF ; Bottom_And_Left # Mc JAVANESE CONSONANT SIGN CAKRA + +# Indic_Positional_Category=Top_And_Bottom_And_Right + +1B3D ; Top_And_Bottom_And_Right # Mc BALINESE VOWEL SIGN LA LENGA TEDUNG + +# Indic_Positional_Category=Overstruck + +1CD4 ; Overstruck # Mn VEDIC SIGN YAJURVEDIC MIDLINE SVARITA +1CE2..1CE8 ; Overstruck # Mn [7] VEDIC SIGN VISARGA SVARITA..VEDIC SIGN VISARGA ANUDATTA WITH TAIL +10A01 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN I +10A06 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN O + +# EOF diff --git a/data/10.0.0-indic-syllabic-category.txt b/data/10.0.0-indic-syllabic-category.txt new file mode 100644 index 0000000..fcd40af --- /dev/null +++ b/data/10.0.0-indic-syllabic-category.txt @@ -0,0 +1,1226 @@ +# IndicSyllabicCategory-10.0.0.txt +# Date: 2017-05-31, 01:07:00 GMT [KW, RP] +# © 2017 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Syllabic_Category enumerated property +# +# Scope: This property is aimed at two general problem +# areas involving the analysis and processing of Indic scripts: +# +# 1. Specification of syllabic structure. +# 2. Specification of segmentation rules. +# +# Both of these problem areas may benefit from having defined subtypes +# of Indic script characters which are relevant to how Indic +# syllables (or aksaras) are constructed. 
Note that rules for +# syllabic structure in Indic scripts may differ significantly +# from how phonological syllables are defined. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Syllabic_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. +# +# The scripts assessed as Indic in the structural sense used for the +# Indic_Syllabic_Category are the following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Grantha, Gujarati, Gurmukhi, Hanunoo, +# Javanese, Kaithi, Kannada, Kayah Li, Kharoshthi, Khmer, Khojki, +# Khudawadi, Lao, Lepcha, Limbu, Mahajani, Malayalam, Marchen, +# Masaram Gondi, Meetei Mayek, Modi, Multani, Myanmar, Newa, New Tai +# Lue, Oriya, Phags-pa, Rejang, Saurashtra, Sharada, Siddham, +# Sinhala, Soyombo, Sundanese, Syloti Nagri, Tagalog, Tagbanwa, Tai +# Le, Tai Tham, Tai Viet, Takri, Tamil, Telugu, Thai, Tibetan, +# Tirhuta, and Zanabazar Square. +# +# All characters for all other scripts not in that list +# take the default value for this property, unless they +# are individually listed in this data file. +# + +# ================================================ + +# Property: Indic_Syllabic_Category +# +# All code points not explicitly listed for Indic_Syllabic_Category +# have the value Other. 
+# +# @missing: 0000..10FFFF; Other + +# ================================================ + +# Indic_Syllabic_Category=Bindu + +# Bindu/Anusvara (nasalization or -n) + +# [Not derivable] + +0900..0902 ; Bindu # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +0981 ; Bindu # Mn BENGALI SIGN CANDRABINDU +0982 ; Bindu # Mc BENGALI SIGN ANUSVARA +09FC ; Bindu # Lo BENGALI LETTER VEDIC ANUSVARA +0A01..0A02 ; Bindu # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A70 ; Bindu # Mn GURMUKHI TIPPI +0A81..0A82 ; Bindu # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0B01 ; Bindu # Mn ORIYA SIGN CANDRABINDU +0B02 ; Bindu # Mc ORIYA SIGN ANUSVARA +0B82 ; Bindu # Mn TAMIL SIGN ANUSVARA +0C00 ; Bindu # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C01..0C02 ; Bindu # Mc [2] TELUGU SIGN CANDRABINDU..TELUGU SIGN ANUSVARA +0C81 ; Bindu # Mn KANNADA SIGN CANDRABINDU +0C82 ; Bindu # Mc KANNADA SIGN ANUSVARA +0D00 ; Bindu # Mn MALAYALAM SIGN COMBINING ANUSVARA ABOVE +0D01 ; Bindu # Mn MALAYALAM SIGN CANDRABINDU +0D02 ; Bindu # Mc MALAYALAM SIGN ANUSVARA +0D82 ; Bindu # Mc SINHALA SIGN ANUSVARAYA +0E4D ; Bindu # Mn THAI CHARACTER NIKHAHIT +0ECD ; Bindu # Mn LAO NIGGAHITA +0F7E ; Bindu # Mn TIBETAN SIGN RJES SU NGA RO +0F82..0F83 ; Bindu # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +1036 ; Bindu # Mn MYANMAR SIGN ANUSVARA +17C6 ; Bindu # Mn KHMER SIGN NIKAHIT +1932 ; Bindu # Mn LIMBU SMALL LETTER ANUSVARA +1A74 ; Bindu # Mn TAI THAM SIGN MAI KANG +1B00..1B02 ; Bindu # Mn [3] BALINESE SIGN ULU RICEM..BALINESE SIGN CECEK +1B80 ; Bindu # Mn SUNDANESE SIGN PANYECEK +1C34..1C35 ; Bindu # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A80B ; Bindu # Mn SYLOTI NAGRI SIGN ANUSVARA +A873 ; Bindu # Lo PHAGS-PA LETTER CANDRABINDU +A880 ; Bindu # Mc SAURASHTRA SIGN ANUSVARA +A8C5 ; Bindu # Mn SAURASHTRA SIGN CANDRABINDU +A8F2..A8F3 ; Bindu # Lo [2] DEVANAGARI SIGN SPACING CANDRABINDU..DEVANAGARI SIGN CANDRABINDU VIRAMA 
+A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK +10A0E ; Bindu # Mn KHAROSHTHI SIGN ANUSVARA +11000 ; Bindu # Mc BRAHMI SIGN CANDRABINDU +11001 ; Bindu # Mn BRAHMI SIGN ANUSVARA +11080..11081 ; Bindu # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +11100..11101 ; Bindu # Mn [2] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN ANUSVARA +11180..11181 ; Bindu # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +11234 ; Bindu # Mn KHOJKI SIGN ANUSVARA +112DF ; Bindu # Mn KHUDAWADI SIGN ANUSVARA +11300..11301 ; Bindu # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11302 ; Bindu # Mc GRANTHA SIGN ANUSVARA +1135E..1135F ; Bindu # Lo [2] GRANTHA LETTER VEDIC ANUSVARA..GRANTHA LETTER VEDIC DOUBLE ANUSVARA +11443..11444 ; Bindu # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +114BF..114C0 ; Bindu # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Bindu # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +1163D ; Bindu # Mn MODI SIGN ANUSVARA +116AB ; Bindu # Mn TAKRI SIGN ANUSVARA +11A35..11A38 ; Bindu # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A96 ; Bindu # Mn SOYOMBO SIGN ANUSVARA +11C3C..11C3D ; Bindu # Mn [2] BHAIKSUKI SIGN CANDRABINDU..BHAIKSUKI SIGN ANUSVARA +11CB5..11CB6 ; Bindu # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D40 ; Bindu # Mn MASARAM GONDI SIGN ANUSVARA + +# ================================================ + +# Indic_Syllabic_Category=Visarga + +# Visarga (-h) +# Includes specialized case for Sanskrit: ardhavisarga +# Excludes letters for jihvamuliya and upadhmaniya, which are +# related, but structured somewhat differently. 
+ +# [Not derivable] + +0903 ; Visarga # Mc DEVANAGARI SIGN VISARGA +0983 ; Visarga # Mc BENGALI SIGN VISARGA +0A03 ; Visarga # Mc GURMUKHI SIGN VISARGA +0A83 ; Visarga # Mc GUJARATI SIGN VISARGA +0B03 ; Visarga # Mc ORIYA SIGN VISARGA +0C03 ; Visarga # Mc TELUGU SIGN VISARGA +0C83 ; Visarga # Mc KANNADA SIGN VISARGA +0D03 ; Visarga # Mc MALAYALAM SIGN VISARGA +0D83 ; Visarga # Mc SINHALA SIGN VISARGAYA +0F7F ; Visarga # Mc TIBETAN SIGN RNAM BCAD +1038 ; Visarga # Mc MYANMAR SIGN VISARGA +17C7 ; Visarga # Mc KHMER SIGN REAHMUK +1B04 ; Visarga # Mc BALINESE SIGN BISAH +1B82 ; Visarga # Mc SUNDANESE SIGN PANGWISAD +1CF2..1CF3 ; Visarga # Mc [2] VEDIC SIGN ARDHAVISARGA..VEDIC SIGN ROTATED ARDHAVISARGA +A881 ; Visarga # Mc SAURASHTRA SIGN VISARGA +A983 ; Visarga # Mc JAVANESE SIGN WIGNYAN +AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA +10A0F ; Visarga # Mn KHAROSHTHI SIGN VISARGA +11002 ; Visarga # Mc BRAHMI SIGN VISARGA +11082 ; Visarga # Mc KAITHI SIGN VISARGA +11102 ; Visarga # Mn CHAKMA SIGN VISARGA +11182 ; Visarga # Mc SHARADA SIGN VISARGA +11303 ; Visarga # Mc GRANTHA SIGN VISARGA +11445 ; Visarga # Mc NEWA SIGN VISARGA +114C1 ; Visarga # Mc TIRHUTA SIGN VISARGA +115BE ; Visarga # Mc SIDDHAM SIGN VISARGA +1163E ; Visarga # Mc MODI SIGN VISARGA +116AC ; Visarga # Mc TAKRI SIGN VISARGA +11A39 ; Visarga # Mc ZANABAZAR SQUARE SIGN VISARGA +11A97 ; Visarga # Mc SOYOMBO SIGN VISARGA +11C3E ; Visarga # Mc BHAIKSUKI SIGN VISARGA +11D41 ; Visarga # Mn MASARAM GONDI SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Avagraha + +# Avagraha (elision of initial a- in sandhi) + +# [Not derivable] + +093D ; Avagraha # Lo DEVANAGARI SIGN AVAGRAHA +09BD ; Avagraha # Lo BENGALI SIGN AVAGRAHA +0ABD ; Avagraha # Lo GUJARATI SIGN AVAGRAHA +0B3D ; Avagraha # Lo ORIYA SIGN AVAGRAHA +0C3D ; Avagraha # Lo TELUGU SIGN AVAGRAHA +0CBD ; Avagraha # Lo KANNADA SIGN AVAGRAHA +0D3D ; Avagraha # Lo MALAYALAM SIGN AVAGRAHA +0F85 ; Avagraha # Po 
TIBETAN MARK PALUTA +17DC ; Avagraha # Lo KHMER SIGN AVAKRAHASANYA +1BBA ; Avagraha # Lo SUNDANESE AVAGRAHA +111C1 ; Avagraha # Lo SHARADA SIGN AVAGRAHA +1133D ; Avagraha # Lo GRANTHA SIGN AVAGRAHA +11447 ; Avagraha # Lo NEWA SIGN AVAGRAHA +114C4 ; Avagraha # Lo TIRHUTA SIGN AVAGRAHA +11C40 ; Avagraha # Lo BHAIKSUKI SIGN AVAGRAHA + +# ================================================ + +# Indic_Syllabic_Category=Nukta + +# Nukta (diacritic for borrowed consonants or other consonant +# modifications). Note that while the resulting sound is typically a +# consonant, the base letter a nukta follows may be an independent +# vowel. For example, <U+0A85 GUJARATI LETTER A, U+0ABC GUJARATI SIGN NUKTA> is used to transcribe ARABIC LETTER +# AIN. + +# [Not derivable] + +093C ; Nukta # Mn DEVANAGARI SIGN NUKTA +09BC ; Nukta # Mn BENGALI SIGN NUKTA +0A3C ; Nukta # Mn GURMUKHI SIGN NUKTA +0ABC ; Nukta # Mn GUJARATI SIGN NUKTA +0AFD..0AFF ; Nukta # Mn [3] GUJARATI SIGN THREE-DOT NUKTA ABOVE..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0CBC ; Nukta # Mn KANNADA SIGN NUKTA +0F39 ; Nukta # Mn TIBETAN MARK TSA -PHRU +1B34 ; Nukta # Mn BALINESE SIGN REREKAN +1BE6 ; Nukta # Mn BATAK SIGN TOMPI +1C37 ; Nukta # Mn LEPCHA SIGN NUKTA +A9B3 ; Nukta # Mn JAVANESE SIGN CECAK TELU +10A38..10A3A ; Nukta # Mn [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW +110BA ; Nukta # Mn KAITHI SIGN NUKTA +11173 ; Nukta # Mn MAHAJANI SIGN NUKTA +111CA ; Nukta # Mn SHARADA SIGN NUKTA +11236 ; Nukta # Mn KHOJKI SIGN NUKTA +112E9 ; Nukta # Mn KHUDAWADI SIGN NUKTA +1133C ; Nukta # Mn GRANTHA SIGN NUKTA +11446 ; Nukta # Mn NEWA SIGN NUKTA +114C3 ; Nukta # Mn TIRHUTA SIGN NUKTA +115C0 ; Nukta # Mn SIDDHAM SIGN NUKTA +116B7 ; Nukta # Mn TAKRI SIGN NUKTA +11D42 ; Nukta # Mn MASARAM GONDI SIGN NUKTA + +# ================================================ + +# Indic_Syllabic_Category=Virama + +# Virama (killing of inherent vowel in consonant sequence +# or consonant stacker) +# Only includes characters that can act both as visible
killer viramas +# and consonant stackers. Separate property values exist for characters +# that can only act as pure killers or only as consonant stackers. + +# [Derivation: (ccc=9) - (InSC=Pure_Killer) - (InSC=Invisible_Stacker) +# - (InSC=Number_Joiner) - 2D7F] + +094D ; Virama # Mn DEVANAGARI SIGN VIRAMA +09CD ; Virama # Mn BENGALI SIGN VIRAMA +0A4D ; Virama # Mn GURMUKHI SIGN VIRAMA +0ACD ; Virama # Mn GUJARATI SIGN VIRAMA +0B4D ; Virama # Mn ORIYA SIGN VIRAMA +0BCD ; Virama # Mn TAMIL SIGN VIRAMA +0C4D ; Virama # Mn TELUGU SIGN VIRAMA +0CCD ; Virama # Mn KANNADA SIGN VIRAMA +0D4D ; Virama # Mn MALAYALAM SIGN VIRAMA +0DCA ; Virama # Mn SINHALA SIGN AL-LAKUNA +1B44 ; Virama # Mc BALINESE ADEG ADEG +A8C4 ; Virama # Mn SAURASHTRA SIGN VIRAMA +A9C0 ; Virama # Mc JAVANESE PANGKON +11046 ; Virama # Mn BRAHMI VIRAMA +110B9 ; Virama # Mn KAITHI SIGN VIRAMA +111C0 ; Virama # Mc SHARADA SIGN VIRAMA +11235 ; Virama # Mc KHOJKI SIGN VIRAMA +1134D ; Virama # Mc GRANTHA SIGN VIRAMA +11442 ; Virama # Mn NEWA SIGN VIRAMA +114C2 ; Virama # Mn TIRHUTA SIGN VIRAMA +115BF ; Virama # Mn SIDDHAM SIGN VIRAMA +1163F ; Virama # Mn MODI SIGN VIRAMA +116B6 ; Virama # Mc TAKRI SIGN VIRAMA +11C3F ; Virama # Mn BHAIKSUKI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Pure_Killer + +# Pure killer (killing of inherent vowel in consonant sequence, +# with no consonant stacking behavior) + +# [Not derivable] + +0D3B ; Pure_Killer # Mn MALAYALAM SIGN VERTICAL BAR VIRAMA +0D3C ; Pure_Killer # Mn MALAYALAM SIGN CIRCULAR VIRAMA +0E3A ; Pure_Killer # Mn THAI CHARACTER PHINTHU +0E4E ; Pure_Killer # Mn THAI CHARACTER YAMAKKAN +0F84 ; Pure_Killer # Mn TIBETAN MARK HALANTA +103A ; Pure_Killer # Mn MYANMAR SIGN ASAT +1714 ; Pure_Killer # Mn TAGALOG SIGN VIRAMA +1734 ; Pure_Killer # Mn HANUNOO SIGN PAMUDPOD +17D1 ; Pure_Killer # Mn KHMER SIGN VIRIAM +1A7A ; Pure_Killer # Mn TAI THAM SIGN RA HAAM +1BAA ; Pure_Killer # Mc SUNDANESE SIGN PAMAAEH +1BF2..1BF3 ; 
Pure_Killer # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +A806 ; Pure_Killer # Mn SYLOTI NAGRI SIGN HASANTA +A953 ; Pure_Killer # Mc REJANG VIRAMA +ABED ; Pure_Killer # Mn MEETEI MAYEK APUN IYEK +11134 ; Pure_Killer # Mn CHAKMA MAAYYAA +112EA ; Pure_Killer # Mn KHUDAWADI SIGN VIRAMA +1172B ; Pure_Killer # Mn AHOM SIGN KILLER +11A34 ; Pure_Killer # Mn ZANABAZAR SQUARE SIGN VIRAMA +11D44 ; Pure_Killer # Mn MASARAM GONDI SIGN HALANTA + +# ================================================ + +# Indic_Syllabic_Category=Invisible_Stacker + +# Invisible stacker (invisible consonant stacker virama) + +# [Not derivable] + +1039 ; Invisible_Stacker # Mn MYANMAR SIGN VIRAMA +17D2 ; Invisible_Stacker # Mn KHMER SIGN COENG +1A60 ; Invisible_Stacker # Mn TAI THAM SIGN SAKOT +1BAB ; Invisible_Stacker # Mn SUNDANESE SIGN VIRAMA +AAF6 ; Invisible_Stacker # Mn MEETEI MAYEK VIRAMA +10A3F ; Invisible_Stacker # Mn KHAROSHTHI VIRAMA +11133 ; Invisible_Stacker # Mn CHAKMA VIRAMA +11A47 ; Invisible_Stacker # Mn ZANABAZAR SQUARE SUBJOINER +11A99 ; Invisible_Stacker # Mn SOYOMBO SUBJOINER +11D45 ; Invisible_Stacker # Mn MASARAM GONDI VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Independent + +# Independent Vowels (contrasted with matras) + +# [Not derivable] + +0904..0914 ; Vowel_Independent # Lo [17] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER AU +0960..0961 ; Vowel_Independent # Lo [2] DEVANAGARI LETTER VOCALIC RR..DEVANAGARI LETTER VOCALIC LL +0972..0977 ; Vowel_Independent # Lo [6] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER UUE +0985..098C ; Vowel_Independent # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L +098F..0990 ; Vowel_Independent # Lo [2] BENGALI LETTER E..BENGALI LETTER AI +0993..0994 ; Vowel_Independent # Lo [2] BENGALI LETTER O..BENGALI LETTER AU +09E0..09E1 ; Vowel_Independent # Lo [2] BENGALI LETTER VOCALIC RR..BENGALI LETTER VOCALIC LL +0A05..0A0A ; Vowel_Independent # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU 
+0A0F..0A10 ; Vowel_Independent # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI +0A13..0A14 ; Vowel_Independent # Lo [2] GURMUKHI LETTER OO..GURMUKHI LETTER AU +0A85..0A8D ; Vowel_Independent # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E +0A8F..0A91 ; Vowel_Independent # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O +0A93..0A94 ; Vowel_Independent # Lo [2] GUJARATI LETTER O..GUJARATI LETTER AU +0AE0..0AE1 ; Vowel_Independent # Lo [2] GUJARATI LETTER VOCALIC RR..GUJARATI LETTER VOCALIC LL +0B05..0B0C ; Vowel_Independent # Lo [8] ORIYA LETTER A..ORIYA LETTER VOCALIC L +0B0F..0B10 ; Vowel_Independent # Lo [2] ORIYA LETTER E..ORIYA LETTER AI +0B13..0B14 ; Vowel_Independent # Lo [2] ORIYA LETTER O..ORIYA LETTER AU +0B60..0B61 ; Vowel_Independent # Lo [2] ORIYA LETTER VOCALIC RR..ORIYA LETTER VOCALIC LL +0B85..0B8A ; Vowel_Independent # Lo [6] TAMIL LETTER A..TAMIL LETTER UU +0B8E..0B90 ; Vowel_Independent # Lo [3] TAMIL LETTER E..TAMIL LETTER AI +0B92..0B94 ; Vowel_Independent # Lo [3] TAMIL LETTER O..TAMIL LETTER AU +0C05..0C0C ; Vowel_Independent # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L +0C0E..0C10 ; Vowel_Independent # Lo [3] TELUGU LETTER E..TELUGU LETTER AI +0C12..0C14 ; Vowel_Independent # Lo [3] TELUGU LETTER O..TELUGU LETTER AU +0C60..0C61 ; Vowel_Independent # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL +0C85..0C8C ; Vowel_Independent # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L +0C8E..0C90 ; Vowel_Independent # Lo [3] KANNADA LETTER E..KANNADA LETTER AI +0C92..0C94 ; Vowel_Independent # Lo [3] KANNADA LETTER O..KANNADA LETTER AU +0CE0..0CE1 ; Vowel_Independent # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL +0D05..0D0C ; Vowel_Independent # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L +0D0E..0D10 ; Vowel_Independent # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI +0D12..0D14 ; Vowel_Independent # Lo [3] MALAYALAM LETTER O..MALAYALAM LETTER AU +0D5F..0D61 ; Vowel_Independent # Lo [3] MALAYALAM 
LETTER ARCHAIC II..MALAYALAM LETTER VOCALIC LL +0D85..0D96 ; Vowel_Independent # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA +1021..102A ; Vowel_Independent # Lo [10] MYANMAR LETTER A..MYANMAR LETTER AU +1052..1055 ; Vowel_Independent # Lo [4] MYANMAR LETTER VOCALIC R..MYANMAR LETTER VOCALIC LL +1700..1702 ; Vowel_Independent # Lo [3] TAGALOG LETTER A..TAGALOG LETTER U +1720..1722 ; Vowel_Independent # Lo [3] HANUNOO LETTER A..HANUNOO LETTER U +1740..1742 ; Vowel_Independent # Lo [3] BUHID LETTER A..BUHID LETTER U +1760..1762 ; Vowel_Independent # Lo [3] TAGBANWA LETTER A..TAGBANWA LETTER U +17A3..17B3 ; Vowel_Independent # Lo [17] KHMER INDEPENDENT VOWEL QAQ..KHMER INDEPENDENT VOWEL QAU +1A4D..1A52 ; Vowel_Independent # Lo [6] TAI THAM LETTER I..TAI THAM LETTER OO +1B05..1B12 ; Vowel_Independent # Lo [14] BALINESE LETTER AKARA..BALINESE LETTER OKARA TEDUNG +1B83..1B89 ; Vowel_Independent # Lo [7] SUNDANESE LETTER A..SUNDANESE LETTER EU +1BE4..1BE5 ; Vowel_Independent # Lo [2] BATAK LETTER I..BATAK LETTER U +A800..A801 ; Vowel_Independent # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I +A803..A805 ; Vowel_Independent # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O +A882..A891 ; Vowel_Independent # Lo [16] SAURASHTRA LETTER A..SAURASHTRA LETTER AU +A984..A988 ; Vowel_Independent # Lo [5] JAVANESE LETTER A..JAVANESE LETTER U +A98C..A98E ; Vowel_Independent # Lo [3] JAVANESE LETTER E..JAVANESE LETTER O +AA00..AA05 ; Vowel_Independent # Lo [6] CHAM LETTER A..CHAM LETTER O +AAE0..AAE1 ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER E..MEETEI MAYEK LETTER O +ABCE..ABCF ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER UN..MEETEI MAYEK LETTER I +ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA +11005..11012 ; Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU +11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER A..KAITHI LETTER AU +11103..11106 ; Vowel_Independent # Lo [4] CHAKMA LETTER AA..CHAKMA LETTER E +11183..11190 ; 
Vowel_Independent # Lo [14] SHARADA LETTER A..SHARADA LETTER AU +11200..11207 ; Vowel_Independent # Lo [8] KHOJKI LETTER A..KHOJKI LETTER AU +11280..11283 ; Vowel_Independent # Lo [4] MULTANI LETTER A..MULTANI LETTER E +112B0..112B9 ; Vowel_Independent # Lo [10] KHUDAWADI LETTER A..KHUDAWADI LETTER AU +11305..1130C ; Vowel_Independent # Lo [8] GRANTHA LETTER A..GRANTHA LETTER VOCALIC L +1130F..11310 ; Vowel_Independent # Lo [2] GRANTHA LETTER EE..GRANTHA LETTER AI +11313..11314 ; Vowel_Independent # Lo [2] GRANTHA LETTER OO..GRANTHA LETTER AU +11360..11361 ; Vowel_Independent # Lo [2] GRANTHA LETTER VOCALIC RR..GRANTHA LETTER VOCALIC LL +11400..1140D ; Vowel_Independent # Lo [14] NEWA LETTER A..NEWA LETTER AU +11481..1148E ; Vowel_Independent # Lo [14] TIRHUTA LETTER A..TIRHUTA LETTER AU +11580..1158D ; Vowel_Independent # Lo [14] SIDDHAM LETTER A..SIDDHAM LETTER AU +115D8..115DB ; Vowel_Independent # Lo [4] SIDDHAM LETTER THREE-CIRCLE ALTERNATE I..SIDDHAM LETTER ALTERNATE U +11600..1160D ; Vowel_Independent # Lo [14] MODI LETTER A..MODI LETTER AU +11680..11689 ; Vowel_Independent # Lo [10] TAKRI LETTER A..TAKRI LETTER AU +11A00 ; Vowel_Independent # Lo ZANABAZAR SQUARE LETTER A +11A50 ; Vowel_Independent # Lo SOYOMBO LETTER A +11C00..11C08 ; Vowel_Independent # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L +11C0A..11C0D ; Vowel_Independent # Lo [4] BHAIKSUKI LETTER E..BHAIKSUKI LETTER AU +11D00..11D06 ; Vowel_Independent # Lo [7] MASARAM GONDI LETTER A..MASARAM GONDI LETTER E +11D08..11D09 ; Vowel_Independent # Lo [2] MASARAM GONDI LETTER AI..MASARAM GONDI LETTER O +11D0B ; Vowel_Independent # Lo MASARAM GONDI LETTER AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Dependent + +# Dependent Vowels (contrasted with independent vowels and/or with +# complex placement). Known as matras in Indic scripts. Also +# includes vowel modifiers that follow dependent (and sometimes +# independent) vowels.
+ +# [Not derivable] + +093A ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN OE +093B ; Vowel_Dependent # Mc DEVANAGARI VOWEL SIGN OOE +093E..0940 ; Vowel_Dependent # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II +0941..0948 ; Vowel_Dependent # Mn [8] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN AI +0949..094C ; Vowel_Dependent # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094E..094F ; Vowel_Dependent # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA E..DEVANAGARI VOWEL SIGN AW +0955..0957 ; Vowel_Dependent # Mn [3] DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Vowel_Dependent # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BE..09C0 ; Vowel_Dependent # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II +09C1..09C4 ; Vowel_Dependent # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09C7..09C8 ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +09CB..09CC ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +09D7 ; Vowel_Dependent # Mc BENGALI AU LENGTH MARK +09E2..09E3 ; Vowel_Dependent # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3E..0A40 ; Vowel_Dependent # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II +0A41..0A42 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A47..0A48 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0ABE..0AC0 ; Vowel_Dependent # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL SIGN II +0AC1..0AC5 ; Vowel_Dependent # Mn [5] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AC9 ; Vowel_Dependent # Mc GUJARATI VOWEL SIGN CANDRA O +0ACB..0ACC ; Vowel_Dependent # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0AE2..0AE3 ; Vowel_Dependent # Mn [2] 
GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3E ; Vowel_Dependent # Mc ORIYA VOWEL SIGN AA +0B3F ; Vowel_Dependent # Mn ORIYA VOWEL SIGN I +0B40 ; Vowel_Dependent # Mc ORIYA VOWEL SIGN II +0B41..0B44 ; Vowel_Dependent # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B47..0B48 ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI +0B4B..0B4C ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU +0B56 ; Vowel_Dependent # Mn ORIYA AI LENGTH MARK +0B57 ; Vowel_Dependent # Mc ORIYA AU LENGTH MARK +0B62..0B63 ; Vowel_Dependent # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BBE..0BBF ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC0 ; Vowel_Dependent # Mn TAMIL VOWEL SIGN II +0BC1..0BC2 ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BC6..0BC8 ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0BCA..0BCC ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0BD7 ; Vowel_Dependent # Mc TAMIL AU LENGTH MARK +0C3E..0C40 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C41..0C44 ; Vowel_Dependent # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C46..0C48 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI +0C4A..0C4C ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C55..0C56 ; Vowel_Dependent # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK +0C62..0C63 ; Vowel_Dependent # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBE ; Vowel_Dependent # Mc KANNADA VOWEL SIGN AA +0CBF ; Vowel_Dependent # Mn KANNADA VOWEL SIGN I +0CC0..0CC4 ; Vowel_Dependent # Mc [5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN VOCALIC RR +0CC6 ; Vowel_Dependent # Mn KANNADA VOWEL SIGN E +0CC7..0CC8 ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +0CCC ; 
Vowel_Dependent # Mn KANNADA VOWEL SIGN AU +0CD5..0CD6 ; Vowel_Dependent # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CE2..0CE3 ; Vowel_Dependent # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D3E..0D40 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D44 ; Vowel_Dependent # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D46..0D48 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0D4A..0D4C ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0D57 ; Vowel_Dependent # Mc MALAYALAM AU LENGTH MARK +0D62..0D63 ; Vowel_Dependent # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DCF..0DD1 ; Vowel_Dependent # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD2..0DD4 ; Vowel_Dependent # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Vowel_Dependent # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0DD8..0DDF ; Vowel_Dependent # Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Vowel_Dependent # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Vowel_Dependent # Lo THAI CHARACTER SARA A +0E31 ; Vowel_Dependent # Mn THAI CHARACTER MAI HAN-AKAT +0E32..0E33 ; Vowel_Dependent # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E34..0E39 ; Vowel_Dependent # Mn [6] THAI CHARACTER SARA I..THAI CHARACTER SARA UU +0E40..0E45 ; Vowel_Dependent # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO +0E47 ; Vowel_Dependent # Mn THAI CHARACTER MAITAIKHU +0EB0 ; Vowel_Dependent # Lo LAO VOWEL SIGN A +0EB1 ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KAN +0EB2..0EB3 ; Vowel_Dependent # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0EB4..0EB9 ; Vowel_Dependent # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU +0EBB ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KON +0EC0..0EC4 ; Vowel_Dependent # Lo [5] LAO 
VOWEL SIGN E..LAO VOWEL SIGN AI +0F71..0F7D ; Vowel_Dependent # Mn [13] TIBETAN VOWEL SIGN AA..TIBETAN VOWEL SIGN OO +0F80..0F81 ; Vowel_Dependent # Mn [2] TIBETAN VOWEL SIGN REVERSED I..TIBETAN VOWEL SIGN REVERSED II +102B..102C ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +102D..1030 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN UU +1031 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN E +1032..1035 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +1056..1057 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1058..1059 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1062 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1071..1074 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1083..1084 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E +1085..1086 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109C ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN AITON A +109D ; Vowel_Dependent # Mn MYANMAR VOWEL SIGN AITON AI +1712..1713 ; Vowel_Dependent # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U +1732..1733 ; Vowel_Dependent # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1752..1753 ; Vowel_Dependent # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U +1772..1773 ; Vowel_Dependent # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U +17B6 ; Vowel_Dependent # Mc KHMER VOWEL SIGN AA +17B7..17BD ; Vowel_Dependent # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL SIGN UA +17BE..17C5 ; Vowel_Dependent # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU +17C8 ; Vowel_Dependent # Mc KHMER SIGN YUUKALEAPINTU +1920..1922 ; Vowel_Dependent # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U +1923..1926 ; 
Vowel_Dependent # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU +1927..1928 ; Vowel_Dependent # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Vowel_Dependent # Mn LIMBU SIGN KEMPHRENG +19B0..19C0 ; Vowel_Dependent # Lo [17] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN IY +1A17..1A18 ; Vowel_Dependent # Mn [2] BUGINESE VOWEL SIGN I..BUGINESE VOWEL SIGN U +1A19..1A1A ; Vowel_Dependent # Mc [2] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN O +1A1B ; Vowel_Dependent # Mn BUGINESE VOWEL SIGN AE +1A61 ; Vowel_Dependent # Mc TAI THAM VOWEL SIGN A +1A62 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN MAI SAT +1A63..1A64 ; Vowel_Dependent # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A65..1A6C ; Vowel_Dependent # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW +1A6D..1A72 ; Vowel_Dependent # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI +1A73 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN OA ABOVE +1B35 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN TEDUNG +1B36..1B3A ; Vowel_Dependent # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA +1B3B ; Vowel_Dependent # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +1B3C ; Vowel_Dependent # Mn BALINESE VOWEL SIGN LA LENGA +1B3D..1B41 ; Vowel_Dependent # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1B42 ; Vowel_Dependent # Mn BALINESE VOWEL SIGN PEPET +1B43 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN PEPET TEDUNG +1BA4..1BA5 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PANGHULU..SUNDANESE VOWEL SIGN PANYUKU +1BA6..1BA7 ; Vowel_Dependent # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL SIGN PANOLONG +1BA8..1BA9 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE7 ; Vowel_Dependent # Mc BATAK VOWEL SIGN E +1BE8..1BE9 ; Vowel_Dependent # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BEA..1BEC ; Vowel_Dependent # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BED ; Vowel_Dependent 
# Mn BATAK VOWEL SIGN KARO O +1BEE ; Vowel_Dependent # Mc BATAK VOWEL SIGN U +1BEF ; Vowel_Dependent # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +1C26..1C2B ; Vowel_Dependent # Mc [6] LEPCHA VOWEL SIGN AA..LEPCHA VOWEL SIGN UU +1C2C ; Vowel_Dependent # Mn LEPCHA VOWEL SIGN E +A823..A824 ; Vowel_Dependent # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A825..A826 ; Vowel_Dependent # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E +A827 ; Vowel_Dependent # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Vowel_Dependent # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A947..A94E ; Vowel_Dependent # Mn [8] REJANG VOWEL SIGN I..REJANG VOWEL SIGN EA +A9B4..A9B5 ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9B6..A9B9 ; Vowel_Dependent # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BA..A9BB ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +A9BC ; Vowel_Dependent # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Vowel_Dependent # Mn MYANMAR SIGN SHAN SAW +AA29..AA2E ; Vowel_Dependent # Mn [6] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN OE +AA2F..AA30 ; Vowel_Dependent # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA31..AA32 ; Vowel_Dependent # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE +AAB0 ; Vowel_Dependent # Mn TAI VIET MAI KANG +AAB1 ; Vowel_Dependent # Lo TAI VIET VOWEL AA +AAB2..AAB4 ; Vowel_Dependent # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U +AAB5..AAB6 ; Vowel_Dependent # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB7..AAB8 ; Vowel_Dependent # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AAB9..AABD ; Vowel_Dependent # Lo [5] TAI VIET VOWEL UEA..TAI VIET VOWEL AN +AABE ; Vowel_Dependent # Mn TAI VIET VOWEL AM +AAEB ; Vowel_Dependent # Mc MEETEI MAYEK VOWEL SIGN II +AAEC..AAED ; Vowel_Dependent # Mn [2] MEETEI MAYEK VOWEL SIGN UU..MEETEI MAYEK VOWEL SIGN AAI +AAEE..AAEF ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN AU..MEETEI MAYEK VOWEL SIGN 
AAU +ABE3..ABE4 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE5 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN ANAP +ABE6..ABE7 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE8 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +10A01..10A03 ; Vowel_Dependent # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R +10A05..10A06 ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O +10A0C..10A0D ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN DOUBLE RING BELOW +11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +110B0..110B2 ; Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II +110B3..110B6 ; Vowel_Dependent # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI +110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11127..1112B ; Vowel_Dependent # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU +1112C ; Vowel_Dependent # Mc CHAKMA VOWEL SIGN E +1112D..11132 ; Vowel_Dependent # Mn [6] CHAKMA VOWEL SIGN AI..CHAKMA AU MARK +111B3..111B5 ; Vowel_Dependent # Mc [3] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN II +111B6..111BE ; Vowel_Dependent # Mn [9] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN O +111BF ; Vowel_Dependent # Mc SHARADA VOWEL SIGN AU +111CB..111CC ; Vowel_Dependent # Mn [2] SHARADA VOWEL MODIFIER MARK..SHARADA EXTRA SHORT VOWEL MARK +1122C..1122E ; Vowel_Dependent # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +1122F..11231 ; Vowel_Dependent # Mn [3] KHOJKI VOWEL SIGN U..KHOJKI VOWEL SIGN AI +11232..11233 ; Vowel_Dependent # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU +112E0..112E2 ; Vowel_Dependent # Mc [3] KHUDAWADI VOWEL SIGN AA..KHUDAWADI VOWEL SIGN II +112E3..112E8 ; Vowel_Dependent # Mn [6] KHUDAWADI VOWEL SIGN U..KHUDAWADI 
VOWEL SIGN AU +1133E..1133F ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11340 ; Vowel_Dependent # Mn GRANTHA VOWEL SIGN II +11341..11344 ; Vowel_Dependent # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +11347..11348 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +1134B..1134C ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +11357 ; Vowel_Dependent # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435..11437 ; Vowel_Dependent # Mc [3] NEWA VOWEL SIGN AA..NEWA VOWEL SIGN II +11438..1143F ; Vowel_Dependent # Mn [8] NEWA VOWEL SIGN U..NEWA VOWEL SIGN AI +11440..11441 ; Vowel_Dependent # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +114B0..114B2 ; Vowel_Dependent # Mc [3] TIRHUTA VOWEL SIGN AA..TIRHUTA VOWEL SIGN II +114B3..114B8 ; Vowel_Dependent # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114B9 ; Vowel_Dependent # Mc TIRHUTA VOWEL SIGN E +114BA ; Vowel_Dependent # Mn TIRHUTA VOWEL SIGN SHORT E +114BB..114BE ; Vowel_Dependent # Mc [4] TIRHUTA VOWEL SIGN AI..TIRHUTA VOWEL SIGN AU +115AF..115B1 ; Vowel_Dependent # Mc [3] SIDDHAM VOWEL SIGN AA..SIDDHAM VOWEL SIGN II +115B2..115B5 ; Vowel_Dependent # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115B8..115BB ; Vowel_Dependent # Mc [4] SIDDHAM VOWEL SIGN E..SIDDHAM VOWEL SIGN AU +115DC..115DD ; Vowel_Dependent # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11630..11632 ; Vowel_Dependent # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +11633..1163A ; Vowel_Dependent # Mn [8] MODI VOWEL SIGN U..MODI VOWEL SIGN AI +1163B..1163C ; Vowel_Dependent # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +11640 ; Vowel_Dependent # Mn MODI SIGN ARDHACANDRA +116AD ; Vowel_Dependent # Mn TAKRI VOWEL SIGN AA +116AE..116AF ; Vowel_Dependent # Mc [2] TAKRI VOWEL SIGN I..TAKRI VOWEL SIGN II +116B0..116B5 ; 
Vowel_Dependent # Mn [6] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN AU +11720..11721 ; Vowel_Dependent # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +11722..11725 ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN I..AHOM VOWEL SIGN UU +11726 ; Vowel_Dependent # Mc AHOM VOWEL SIGN E +11727..1172A ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN AW..AHOM VOWEL SIGN AM +11A01..11A06 ; Vowel_Dependent # Mn [6] ZANABAZAR SQUARE VOWEL SIGN I..ZANABAZAR SQUARE VOWEL SIGN O +11A07..11A08 ; Vowel_Dependent # Mc [2] ZANABAZAR SQUARE VOWEL SIGN AI..ZANABAZAR SQUARE VOWEL SIGN AU +11A09..11A0A ; Vowel_Dependent # Mn [2] ZANABAZAR SQUARE VOWEL SIGN REVERSED I..ZANABAZAR SQUARE VOWEL LENGTH MARK +11A51..11A56 ; Vowel_Dependent # Mn [6] SOYOMBO VOWEL SIGN I..SOYOMBO VOWEL SIGN OE +11A57..11A58 ; Vowel_Dependent # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A59..11A5B ; Vowel_Dependent # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11C2F ; Vowel_Dependent # Mc BHAIKSUKI VOWEL SIGN AA +11C30..11C36 ; Vowel_Dependent # Mn [7] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN VOCALIC L +11C38..11C3B ; Vowel_Dependent # Mn [4] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI VOWEL SIGN AU +11CB0 ; Vowel_Dependent # Mn MARCHEN VOWEL SIGN AA +11CB1 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN I +11CB2..11CB3 ; Vowel_Dependent # Mn [2] MARCHEN VOWEL SIGN U..MARCHEN VOWEL SIGN E +11CB4 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN O +11D31..11D36 ; Vowel_Dependent # Mn [6] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN VOCALIC R +11D3A ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Vowel_Dependent # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN AU +11D43 ; Vowel_Dependent # Mn MASARAM GONDI SIGN CANDRA + +# ================================================ + +# Indic_Syllabic_Category=Vowel + +# (Other) Vowels (reanalyzed as ordinary alphabetic letters or marks) + +# [Not derivable] + +1963..196D ; Vowel # 
Lo [11] TAI LE LETTER A..TAI LE LETTER AI +A85E..A861 ; Vowel # Lo [4] PHAGS-PA LETTER I..PHAGS-PA LETTER O +A866 ; Vowel # Lo PHAGS-PA LETTER EE +A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO +A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O +11150..11154 ; Vowel # Lo [5] MAHAJANI LETTER A..MAHAJANI LETTER O + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Placeholder + +# Consonant Placeholder +# This includes generic placeholders used for +# Indic script layout (NBSP and dotted circle), as well as a few script- +# specific vowel-holder characters which are not technically +# consonants, but serve instead as bases for placement of vowel marks. + +# [Not derivable] + +002D ; Consonant_Placeholder # Pd HYPHEN-MINUS +00A0 ; Consonant_Placeholder # Zs NO-BREAK SPACE +00D7 ; Consonant_Placeholder # Sm MULTIPLICATION SIGN +0A72..0A73 ; Consonant_Placeholder # Lo [2] GURMUKHI IRI..GURMUKHI URA +104E ; Consonant_Placeholder # Po MYANMAR SYMBOL AFOREMENTIONED +1900 ; Consonant_Placeholder # Lo LIMBU VOWEL-CARRIER LETTER +2010..2014 ; Consonant_Placeholder # Pd [5] HYPHEN..EM DASH +25CC ; Consonant_Placeholder # So DOTTED CIRCLE +AA74..AA76 ; Consonant_Placeholder # Lo [3] MYANMAR LOGOGRAM KHAMTI OAY..MYANMAR LOGOGRAM KHAMTI HM +11A3F ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL HEAD MARK +11A45 ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL DOUBLE-LINED HEAD MARK + +# ================================================ + +# Indic_Syllabic_Category=Consonant + +# Consonant (ordinary abugida consonants, with inherent vowels) + +# [Not derivable] + +0915..0939 ; Consonant # Lo [37] DEVANAGARI LETTER KA..DEVANAGARI LETTER HA +0958..095F ; Consonant # Lo [8] DEVANAGARI LETTER QA..DEVANAGARI LETTER YYA +0978..097F ; Consonant # Lo [8] DEVANAGARI LETTER MARWARI DDA..DEVANAGARI LETTER BBA +0995..09A8 ; Consonant # Lo [20] BENGALI LETTER KA..BENGALI LETTER NA +09AA..09B0 ; Consonant # Lo 
[7] BENGALI LETTER PA..BENGALI LETTER RA +09B2 ; Consonant # Lo BENGALI LETTER LA +09B6..09B9 ; Consonant # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA +09DC..09DD ; Consonant # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA +09DF ; Consonant # Lo BENGALI LETTER YYA +09F0..09F1 ; Consonant # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH LOWER DIAGONAL +0A15..0A28 ; Consonant # Lo [20] GURMUKHI LETTER KA..GURMUKHI LETTER NA +0A2A..0A30 ; Consonant # Lo [7] GURMUKHI LETTER PA..GURMUKHI LETTER RA +0A32..0A33 ; Consonant # Lo [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA +0A35..0A36 ; Consonant # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA +0A38..0A39 ; Consonant # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA +0A59..0A5C ; Consonant # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA +0A5E ; Consonant # Lo GURMUKHI LETTER FA +0A95..0AA8 ; Consonant # Lo [20] GUJARATI LETTER KA..GUJARATI LETTER NA +0AAA..0AB0 ; Consonant # Lo [7] GUJARATI LETTER PA..GUJARATI LETTER RA +0AB2..0AB3 ; Consonant # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA +0AB5..0AB9 ; Consonant # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA +0AF9 ; Consonant # Lo GUJARATI LETTER ZHA +0B15..0B28 ; Consonant # Lo [20] ORIYA LETTER KA..ORIYA LETTER NA +0B2A..0B30 ; Consonant # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA +0B32..0B33 ; Consonant # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA +0B35..0B39 ; Consonant # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA +0B5C..0B5D ; Consonant # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA +0B5F ; Consonant # Lo ORIYA LETTER YYA +0B71 ; Consonant # Lo ORIYA LETTER WA +0B95 ; Consonant # Lo TAMIL LETTER KA +0B99..0B9A ; Consonant # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA +0B9C ; Consonant # Lo TAMIL LETTER JA +0B9E..0B9F ; Consonant # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA +0BA3..0BA4 ; Consonant # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA +0BA8..0BAA ; Consonant # Lo [3] TAMIL LETTER NA..TAMIL LETTER PA +0BAE..0BB9 ; Consonant # Lo [12] TAMIL LETTER 
MA..TAMIL LETTER HA +0C15..0C28 ; Consonant # Lo [20] TELUGU LETTER KA..TELUGU LETTER NA +0C2A..0C39 ; Consonant # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C58..0C5A ; Consonant # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C95..0CA8 ; Consonant # Lo [20] KANNADA LETTER KA..KANNADA LETTER NA +0CAA..0CB3 ; Consonant # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA +0CB5..0CB9 ; Consonant # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA +0CDE ; Consonant # Lo KANNADA LETTER FA +0D15..0D3A ; Consonant # Lo [38] MALAYALAM LETTER KA..MALAYALAM LETTER TTTA +0D9A..0DB1 ; Consonant # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA +0DB3..0DBB ; Consonant # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA +0DBD ; Consonant # Lo SINHALA LETTER DANTAJA LAYANNA +0DC0..0DC6 ; Consonant # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA +0E01..0E2E ; Consonant # Lo [46] THAI CHARACTER KO KAI..THAI CHARACTER HO NOKHUK +0E81..0E82 ; Consonant # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG +0E84 ; Consonant # Lo LAO LETTER KHO TAM +0E87..0E88 ; Consonant # Lo [2] LAO LETTER NGO..LAO LETTER CO +0E8A ; Consonant # Lo LAO LETTER SO TAM +0E8D ; Consonant # Lo LAO LETTER NYO +0E94..0E97 ; Consonant # Lo [4] LAO LETTER DO..LAO LETTER THO TAM +0E99..0E9F ; Consonant # Lo [7] LAO LETTER NO..LAO LETTER FO SUNG +0EA1..0EA3 ; Consonant # Lo [3] LAO LETTER MO..LAO LETTER LO LING +0EA5 ; Consonant # Lo LAO LETTER LO LOOT +0EA7 ; Consonant # Lo LAO LETTER WO +0EAA..0EAB ; Consonant # Lo [2] LAO LETTER SO SUNG..LAO LETTER HO SUNG +0EAD..0EAE ; Consonant # Lo [2] LAO LETTER O..LAO LETTER HO TAM +0EDC..0EDF ; Consonant # Lo [4] LAO HO NO..LAO LETTER KHMU NYO +0F40..0F47 ; Consonant # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA +0F49..0F6C ; Consonant # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA +1000..1020 ; Consonant # Lo [33] MYANMAR LETTER KA..MYANMAR LETTER LLA +103F ; Consonant # Lo MYANMAR LETTER GREAT SA +1050..1051 ; Consonant # Lo [2] MYANMAR 
LETTER SHA..MYANMAR LETTER SSA +105A..105D ; Consonant # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE +1061 ; Consonant # Lo MYANMAR LETTER SGAW KAREN SHA +1065..1066 ; Consonant # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER WESTERN PWO KAREN PWA +106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA +1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA +108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA +1703..170C ; Consonant # Lo [10] TAGALOG LETTER KA..TAGALOG LETTER YA +170E..1711 ; Consonant # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1723..1731 ; Consonant # Lo [15] HANUNOO LETTER KA..HANUNOO LETTER HA +1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA +1763..176C ; Consonant # Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA +176E..1770 ; Consonant # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA +1780..17A2 ; Consonant # Lo [35] KHMER LETTER KA..KHMER LETTER QA +1901..191E ; Consonant # Lo [30] LIMBU LETTER KA..LIMBU LETTER TRA +1950..1962 ; Consonant # Lo [19] TAI LE LETTER KA..TAI LE LETTER NA +1980..19AB ; Consonant # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI LUE LETTER LOW SUA +1A00..1A16 ; Consonant # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA +1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA +1A53..1A54 ; Consonant # Lo [2] TAI THAM LETTER LAE..TAI THAM LETTER GREAT SA +1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA +1B45..1B4B ; Consonant # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA +1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA +1BBB..1BBD ; Consonant # Lo [3] SUNDANESE LETTER REU..SUNDANESE LETTER BHA +1BC0..1BE3 ; Consonant # Lo [36] BATAK LETTER A..BATAK LETTER MBA +1C00..1C23 ; Consonant # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A 
+1C4D..1C4F ; Consonant # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA +A807..A80A ; Consonant # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO +A80C..A822 ; Consonant # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO +A840..A85D ; Consonant # Lo [30] PHAGS-PA LETTER KA..PHAGS-PA LETTER A +A862..A865 ; Consonant # Lo [4] PHAGS-PA LETTER QA..PHAGS-PA LETTER GGA +A869..A870 ; Consonant # Lo [8] PHAGS-PA LETTER TTA..PHAGS-PA LETTER ASPIRATED FA +A872 ; Consonant # Lo PHAGS-PA SUPERFIXED LETTER RA +A892..A8B3 ; Consonant # Lo [34] SAURASHTRA LETTER KA..SAURASHTRA LETTER LLA +A90A..A921 ; Consonant # Lo [24] KAYAH LI LETTER KA..KAYAH LI LETTER CA +A930..A946 ; Consonant # Lo [23] REJANG LETTER KA..REJANG LETTER A +A989..A98B ; Consonant # Lo [3] JAVANESE LETTER PA CEREK..JAVANESE LETTER NGA LELET RASWADI +A98F..A9B2 ; Consonant # Lo [36] JAVANESE LETTER KA..JAVANESE LETTER HA +A9E0..A9E4 ; Consonant # Lo [5] MYANMAR LETTER SHAN GHA..MYANMAR LETTER SHAN BHA +A9E7..A9EF ; Consonant # Lo [9] MYANMAR LETTER TAI LAING NYA..MYANMAR LETTER TAI LAING NNA +A9FA..A9FE ; Consonant # Lo [5] MYANMAR LETTER TAI LAING LLA..MYANMAR LETTER TAI LAING BHA +AA06..AA28 ; Consonant # Lo [35] CHAM LETTER KA..CHAM LETTER HA +AA60..AA6F ; Consonant # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA +AA71..AA73 ; Consonant # Lo [3] MYANMAR LETTER KHAMTI XA..MYANMAR LETTER KHAMTI RA +AA7A ; Consonant # Lo MYANMAR LETTER AITON RA +AA7E..AA7F ; Consonant # Lo [2] MYANMAR LETTER SHWE PALAUNG CHA..MYANMAR LETTER SHWE PALAUNG SHA +AA80..AAAF ; Consonant # Lo [48] TAI VIET LETTER LOW KO..TAI VIET LETTER HIGH O +AAE2..AAEA ; Consonant # Lo [9] MEETEI MAYEK LETTER CHA..MEETEI MAYEK LETTER SSA +ABC0..ABCD ; Consonant # Lo [14] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER HUK +ABD0 ; Consonant # Lo MEETEI MAYEK LETTER PHAM +ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTER BHAM +10A00 ; Consonant # Lo KHAROSHTHI LETTER A +10A10..10A13 ; Consonant # Lo [4] 
KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA +10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA +10A19..10A33 ; Consonant # Lo [27] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER TTTHA +11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER OLD TAMIL NNNA +1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA +11107..11126 ; Consonant # Lo [32] CHAKMA LETTER KAA..CHAKMA LETTER HAA +11155..11172 ; Consonant # Lo [30] MAHAJANI LETTER KA..MAHAJANI LETTER RRA +11191..111B2 ; Consonant # Lo [34] SHARADA LETTER KA..SHARADA LETTER HA +11208..11211 ; Consonant # Lo [10] KHOJKI LETTER KA..KHOJKI LETTER JJA +11213..1122B ; Consonant # Lo [25] KHOJKI LETTER NYA..KHOJKI LETTER LLA +11284..11286 ; Consonant # Lo [3] MULTANI LETTER KA..MULTANI LETTER GA +11288 ; Consonant # Lo MULTANI LETTER GHA +1128A..1128D ; Consonant # Lo [4] MULTANI LETTER CA..MULTANI LETTER JJA +1128F..1129D ; Consonant # Lo [15] MULTANI LETTER NYA..MULTANI LETTER BA +1129F..112A8 ; Consonant # Lo [10] MULTANI LETTER BHA..MULTANI LETTER RHA +112BA..112DE ; Consonant # Lo [37] KHUDAWADI LETTER KA..KHUDAWADI LETTER HA +11315..11328 ; Consonant # Lo [20] GRANTHA LETTER KA..GRANTHA LETTER NA +1132A..11330 ; Consonant # Lo [7] GRANTHA LETTER PA..GRANTHA LETTER RA +11332..11333 ; Consonant # Lo [2] GRANTHA LETTER LA..GRANTHA LETTER LLA +11335..11339 ; Consonant # Lo [5] GRANTHA LETTER VA..GRANTHA LETTER HA +1140E..11434 ; Consonant # Lo [39] NEWA LETTER KA..NEWA LETTER HA +1148F..114AF ; Consonant # Lo [33] TIRHUTA LETTER KA..TIRHUTA LETTER HA +1158E..115AE ; Consonant # Lo [33] SIDDHAM LETTER KA..SIDDHAM LETTER HA +1160E..1162F ; Consonant # Lo [34] MODI LETTER KA..MODI LETTER LLA +1168A..116AA ; Consonant # Lo [33] TAKRI LETTER KA..TAKRI LETTER RRA +11700..11719 ; Consonant # Lo [26] AHOM LETTER KA..AHOM LETTER JHA +11A0B..11A32 ; Consonant # Lo [40] ZANABAZAR SQUARE LETTER KA..ZANABAZAR SQUARE LETTER KSSA +11A5C..11A83 ; Consonant # Lo [40] SOYOMBO LETTER 
KA..SOYOMBO LETTER KSSA +11C0E..11C2E ; Consonant # Lo [33] BHAIKSUKI LETTER KA..BHAIKSUKI LETTER HA +11C72..11C8F ; Consonant # Lo [30] MARCHEN LETTER KA..MARCHEN LETTER A +11D0C..11D30 ; Consonant # Lo [37] MASARAM GONDI LETTER KA..MASARAM GONDI LETTER TRA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Dead + +# Dead Consonant (special consonant with killed vowel) + +# [Not derivable] + +09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0D54..0D56 ; Consonant_Dead # Lo [3] MALAYALAM LETTER CHILLU M..MALAYALAM LETTER CHILLU LLL +0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K + +# ================================================ + +# Indic_Syllabic_Category=Consonant_With_Stacker + +# Consonants that may make stacked ligatures with the next consonant +# without the use of a virama + +# [Not derivable] + +0CF1..0CF2 ; Consonant_With_Stacker # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA +11003..11004 ; Consonant_With_Stacker # Lo [2] BRAHMI SIGN JIHVAMULIYA..BRAHMI SIGN UPADHMANIYA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Prefixed + +# Cluster-initial consonants + +# [Not derivable] + +111C2..111C3 ; Consonant_Prefixed # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA +11A3A ; Consonant_Prefixed # Lo ZANABAZAR SQUARE CLUSTER-INITIAL LETTER RA +11A86..11A89 ; Consonant_Prefixed # Lo [4] SOYOMBO CLUSTER-INITIAL LETTER RA..SOYOMBO CLUSTER-INITIAL LETTER SA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Preceding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when preceding the main consonant + +# [Not derivable] + +0D4E ; Consonant_Preceding_Repha # Lo MALAYALAM LETTER DOT REPH +11D46 ; Consonant_Preceding_Repha # Lo MASARAM GONDI REPHA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Succeeding_Repha + 
+# Repha Form of RA (reanalyzed in some scripts), when succeeding the main consonant. +# Additionally, U+1A5A TAI THAM CONSONANT SIGN LOW PA has been temporarily classified +# in this class due to its behavior, although it is not a RA. + +# [Not derivable] + +17CC ; Consonant_Succeeding_Repha # Mn KHMER SIGN ROBAT +1A5A ; Consonant_Succeeding_Repha # Mn TAI THAM CONSONANT SIGN LOW PA +1B03 ; Consonant_Succeeding_Repha # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Succeeding_Repha # Mn SUNDANESE SIGN PANGLAYAR +A982 ; Consonant_Succeeding_Repha # Mn JAVANESE SIGN LAYAR + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Subjoined + +# Subjoined Consonant (C2 form subtending a base consonant in Tibetan, etc.) + +# [Not derivable] + +0F8D..0F97 ; Consonant_Subjoined # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Consonant_Subjoined # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +1929..192B ; Consonant_Subjoined # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1A57 ; Consonant_Subjoined # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A5B..1A5E ; Consonant_Subjoined # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1BA1 ; Consonant_Subjoined # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA2..1BA3 ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BAC..1BAD ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C24..1C25 ; Consonant_Subjoined # Mc [2] LEPCHA SUBJOINED LETTER YA..LEPCHA SUBJOINED LETTER RA +A867..A868 ; Consonant_Subjoined # Lo [2] PHAGS-PA SUBJOINED LETTER WA..PHAGS-PA SUBJOINED LETTER YA +A871 ; Consonant_Subjoined # Lo PHAGS-PA SUBJOINED LETTER RA +A9BD ; Consonant_Subjoined # Mc JAVANESE CONSONANT SIGN KERET +11C92..11CA7 ; Consonant_Subjoined # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED 
LETTER ZA +11CA9 ; Consonant_Subjoined # Mc MARCHEN SUBJOINED LETTER YA +11CAA..11CAF ; Consonant_Subjoined # Mn [6] MARCHEN SUBJOINED LETTER RA..MARCHEN SUBJOINED LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Medial + +# Medial Consonant (medial liquid, occurring in clusters) + +# [Not derivable] + +0A75 ; Consonant_Medial # Mn GURMUKHI SIGN YAKASH +0EBC ; Consonant_Medial # Mn LAO SEMIVOWEL SIGN LO +0EBD ; Consonant_Medial # Lo LAO SEMIVOWEL SIGN NYO +103B..103C ; Consonant_Medial # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA +103D..103E ; Consonant_Medial # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +105E..1060 ; Consonant_Medial # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Consonant_Medial # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +1A55 ; Consonant_Medial # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A56 ; Consonant_Medial # Mn TAI THAM CONSONANT SIGN MEDIAL LA +A9BE..A9BF ; Consonant_Medial # Mc [2] JAVANESE CONSONANT SIGN PENGKAL..JAVANESE CONSONANT SIGN CAKRA +AA33..AA34 ; Consonant_Medial # Mc [2] CHAM CONSONANT SIGN YA..CHAM CONSONANT SIGN RA +AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +1171D..1171F ; Consonant_Medial # Mn [3] AHOM CONSONANT SIGN MEDIAL LA..AHOM CONSONANT SIGN MEDIAL LIGATING RA +11A3B..11A3E ; Consonant_Medial # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11D47 ; Consonant_Medial # Mn MASARAM GONDI RA-KARA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Final + +# Final Consonant (special final forms which do not take vowels) + +# [Not derivable] + +1930..1931 ; Consonant_Final # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Consonant_Final # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +1939 ; Consonant_Final # Mn LIMBU 
SIGN MUKPHRENG +19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B +1A58..1A59 ; Consonant_Final # Mn [2] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN FINAL NGA +1BBE..1BBF ; Consonant_Final # Lo [2] SUNDANESE LETTER FINAL K..SUNDANESE LETTER FINAL M +1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H +1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +A8B4 ; Consonant_Final # Mc SAURASHTRA CONSONANT SIGN HAARU +A94F..A951 ; Consonant_Final # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A952 ; Consonant_Final # Mc REJANG CONSONANT SIGN H +AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG +AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG +AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS +AA4C ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL M +AA4D ; Consonant_Final # Mc CHAM CONSONANT SIGN FINAL H +ABDB..ABE2 ; Consonant_Final # Lo [8] MEETEI MAYEK LETTER KOK LONSUM..MEETEI MAYEK LETTER I LONSUM +11A8A..11A95 ; Consonant_Final # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Head_Letter + +# Head Letter (Tibetan) + +# [Not derivable] + +0F88..0F8C ; Consonant_Head_Letter # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN + +# ================================================ + +# Indic_Syllabic_Category=Modifying_Letter + +# Reanalyzed letters not participating in the abugida structure, but +# serving to modify the sound of an adjacent vowel or consonant. +# Note that this is not the same as General_Category=Modifier_Letter. 
+ +# [Not derivable] + +0B83 ; Modifying_Letter # Lo TAMIL SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Tone_Letter + +# Tone Letter (spacing lexical tone mark with status as a letter) + +# [Not derivable] + +1970..1974 ; Tone_Letter # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6 +AAC0 ; Tone_Letter # Lo TAI VIET TONE MAI NUENG +AAC2 ; Tone_Letter # Lo TAI VIET TONE MAI SONG + +# ================================================ + +# Indic_Syllabic_Category=Tone_Mark + +# Tone Mark (nonspacing or spacing lexical tone mark) + +# [Not derivable] + +0E48..0E4B ; Tone_Mark # Mn [4] THAI CHARACTER MAI EK..THAI CHARACTER MAI CHATTAWA +0EC8..0ECB ; Tone_Mark # Mn [4] LAO TONE MAI EK..LAO TONE MAI CATAWA +1037 ; Tone_Mark # Mn MYANMAR SIGN DOT BELOW +1063..1064 ; Tone_Mark # Mc [2] MYANMAR TONE MARK SGAW KAREN HATHI..MYANMAR TONE MARK SGAW KAREN KE PHO +1069..106D ; Tone_Mark # Mc [5] MYANMAR SIGN WESTERN PWO KAREN TONE-1..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1087..108C ; Tone_Mark # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108D ; Tone_Mark # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +108F ; Tone_Mark # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109B ; Tone_Mark # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 +19C8..19C9 ; Tone_Mark # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A75..1A79 ; Tone_Mark # Mn [5] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN TONE-5 +A92B..A92D ; Tone_Mark # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +AA7B ; Tone_Mark # Mc MYANMAR SIGN PAO KAREN TONE +AA7C ; Tone_Mark # Mn MYANMAR SIGN TAI LAING TONE-2 +AA7D ; Tone_Mark # Mc MYANMAR SIGN TAI LAING TONE-5 +AABF ; Tone_Mark # Mn TAI VIET TONE MAI EK +AAC1 ; Tone_Mark # Mn TAI VIET TONE MAI THO +ABEC ; Tone_Mark # Mc MEETEI MAYEK LUM IYEK + +# ================================================ + +# Indic_Syllabic_Category=Gemination_Mark + +# Gemination Mark (doubling of the 
preceding or following consonant) + +# [Not derivable] + +0A71 ; Gemination_Mark # Mn GURMUKHI ADDAK +11237 ; Gemination_Mark # Mn KHOJKI SIGN SHADDA +11A98 ; Gemination_Mark # Mn SOYOMBO GEMINATION MARK + +# ================================================ + +# Indic_Syllabic_Category=Cantillation_Mark + +# Cantillation Mark (recitation marks, such as svara markers for the Samaveda) + +# [Not derivable] + +0951..0952 ; Cantillation_Mark # Mn [2] DEVANAGARI STRESS SIGN UDATTA..DEVANAGARI STRESS SIGN ANUDATTA +0AFA..0AFC ; Cantillation_Mark # Mn [3] GUJARATI SIGN SUKUN..GUJARATI SIGN MADDAH +1CD0..1CD2 ; Cantillation_Mark # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CD4..1CE0 ; Cantillation_Mark # Mn [13] VEDIC SIGN YAJURVEDIC MIDLINE SVARITA..VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CE1 ; Cantillation_Mark # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF4 ; Cantillation_Mark # Mn VEDIC TONE CANDRA ABOVE +1CF7 ; Cantillation_Mark # Mc VEDIC SIGN ATIKRAMA +1CF8..1CF9 ; Cantillation_Mark # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE +A8E0..A8F1 ; Cantillation_Mark # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +1123E ; Cantillation_Mark # Mn KHOJKI SIGN SUKUN +11366..1136C ; Cantillation_Mark # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Cantillation_Mark # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA + +# ================================================ + +# Indic_Syllabic_Category=Register_Shifter + +# Register Shifter (shifts register for consonants, akin to a tone mark) + +# [Not derivable] + +17C9..17CA ; Register_Shifter # Mn [2] KHMER SIGN MUUSIKATOAN..KHMER SIGN TRIISAP + +# ================================================ + +# Indic_Syllabic_Category=Syllable_Modifier + +# Syllable Modifier (miscellaneous combining characters that modify +# something in the orthographic syllable they succeed) + +# [Not derivable] + +00B2..00B3 ; 
Syllable_Modifier # No [2] SUPERSCRIPT TWO..SUPERSCRIPT THREE +0F35 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0FC6 ; Syllable_Modifier # Mn TIBETAN SYMBOL PADMA GDAN +17CB ; Syllable_Modifier # Mn KHMER SIGN BANTOC +17CE..17D0 ; Syllable_Modifier # Mn [3] KHMER SIGN KAKABAT..KHMER SIGN SAMYOK SANNYA +17D3 ; Syllable_Modifier # Mn KHMER SIGN BATHAMASAT +17DD ; Syllable_Modifier # Mn KHMER SIGN ATTHACAN +193B ; Syllable_Modifier # Mn LIMBU SIGN SA-I +1A7B..1A7C ; Syllable_Modifier # Mn [2] TAI THAM SIGN MAI SAM..TAI THAM SIGN KHUEN-LUE KARAN +1A7F ; Syllable_Modifier # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1C36 ; Syllable_Modifier # Mn LEPCHA SIGN RAN +1DFB ; Syllable_Modifier # Mn COMBINING DELETION MARK +2074 ; Syllable_Modifier # No SUPERSCRIPT FOUR +2082..2084 ; Syllable_Modifier # No [3] SUBSCRIPT TWO..SUBSCRIPT FOUR +11A33 ; Syllable_Modifier # Mn ZANABAZAR SQUARE FINAL CONSONANT MARK + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Killer + +# Consonant Killer (signifies that the previous consonant or consonants are +# not pronounced) + +# [Not derivable] + +0E4C ; Consonant_Killer # Mn THAI CHARACTER THANTHAKHAT +17CD ; Consonant_Killer # Mn KHMER SIGN TOANDAKHIAT + +# ================================================ + +# Indic_Syllabic_Category=Non_Joiner + +# Non_Joiner (Zero Width Non-Joiner) + +# [Not derivable] + +200C ; Non_Joiner # Cf ZERO WIDTH NON-JOINER + +# ================================================ + +# Indic_Syllabic_Category=Joiner + +# Joiner (Zero Width Joiner) + +# [Not derivable] + +200D ; Joiner # Cf ZERO WIDTH JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number_Joiner + +# Number_Joiner (forms ligatures between numbers for multiplication) + +# [Not derivable] + +1107F ; Number_Joiner # Mn BRAHMI NUMBER JOINER + +# ================================================ 
+ +# Indic_Syllabic_Category=Number + +# Number (can be used as vowel-holders like consonant placeholders) +# Note: A number may even hold subjoined consonants which may in turn +# have been formed using a virama or a stacker, e.g. the sequence +# where THAI THAM LETTER LOW TA is subjoined to +# TAI THAM THAM DIGIT THREE using an invisible stacker. + +# [Not derivable] + +0030..0039 ; Number # Nd [10] DIGIT ZERO..DIGIT NINE +0966..096F ; Number # Nd [10] DEVANAGARI DIGIT ZERO..DEVANAGARI DIGIT NINE +09E6..09EF ; Number # Nd [10] BENGALI DIGIT ZERO..BENGALI DIGIT NINE +0A66..0A6F ; Number # Nd [10] GURMUKHI DIGIT ZERO..GURMUKHI DIGIT NINE +0AE6..0AEF ; Number # Nd [10] GUJARATI DIGIT ZERO..GUJARATI DIGIT NINE +0B66..0B6F ; Number # Nd [10] ORIYA DIGIT ZERO..ORIYA DIGIT NINE +0BE6..0BEF ; Number # Nd [10] TAMIL DIGIT ZERO..TAMIL DIGIT NINE +0C66..0C6F ; Number # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE +0CE6..0CEF ; Number # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE +0D66..0D6F ; Number # Nd [10] MALAYALAM DIGIT ZERO..MALAYALAM DIGIT NINE +0DE6..0DEF ; Number # Nd [10] SINHALA LITH DIGIT ZERO..SINHALA LITH DIGIT NINE +0E50..0E59 ; Number # Nd [10] THAI DIGIT ZERO..THAI DIGIT NINE +0ED0..0ED9 ; Number # Nd [10] LAO DIGIT ZERO..LAO DIGIT NINE +0F20..0F29 ; Number # Nd [10] TIBETAN DIGIT ZERO..TIBETAN DIGIT NINE +0F2A..0F33 ; Number # No [10] TIBETAN DIGIT HALF ONE..TIBETAN DIGIT HALF ZERO +1040..1049 ; Number # Nd [10] MYANMAR DIGIT ZERO..MYANMAR DIGIT NINE +1090..1099 ; Number # Nd [10] MYANMAR SHAN DIGIT ZERO..MYANMAR SHAN DIGIT NINE +17E0..17E9 ; Number # Nd [10] KHMER DIGIT ZERO..KHMER DIGIT NINE +1946..194F ; Number # Nd [10] LIMBU DIGIT ZERO..LIMBU DIGIT NINE +19D0..19D9 ; Number # Nd [10] NEW TAI LUE DIGIT ZERO..NEW TAI LUE DIGIT NINE +1A80..1A89 ; Number # Nd [10] TAI THAM HORA DIGIT ZERO..TAI THAM HORA DIGIT NINE +1A90..1A99 ; Number # Nd [10] TAI THAM THAM DIGIT ZERO..TAI THAM THAM DIGIT NINE +1B50..1B59 ; Number # Nd [10] BALINESE DIGIT 
ZERO..BALINESE DIGIT NINE +1BB0..1BB9 ; Number # Nd [10] SUNDANESE DIGIT ZERO..SUNDANESE DIGIT NINE +1C40..1C49 ; Number # Nd [10] LEPCHA DIGIT ZERO..LEPCHA DIGIT NINE +A8D0..A8D9 ; Number # Nd [10] SAURASHTRA DIGIT ZERO..SAURASHTRA DIGIT NINE +A900..A909 ; Number # Nd [10] KAYAH LI DIGIT ZERO..KAYAH LI DIGIT NINE +A9D0..A9D9 ; Number # Nd [10] JAVANESE DIGIT ZERO..JAVANESE DIGIT NINE +A9F0..A9F9 ; Number # Nd [10] MYANMAR TAI LAING DIGIT ZERO..MYANMAR TAI LAING DIGIT NINE +AA50..AA59 ; Number # Nd [10] CHAM DIGIT ZERO..CHAM DIGIT NINE +ABF0..ABF9 ; Number # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE +10A40..10A47 ; Number # No [8] KHAROSHTHI DIGIT ONE..KHAROSHTHI NUMBER ONE THOUSAND +11066..1106F ; Number # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11136..1113F ; Number # Nd [10] CHAKMA DIGIT ZERO..CHAKMA DIGIT NINE +111D0..111D9 ; Number # Nd [10] SHARADA DIGIT ZERO..SHARADA DIGIT NINE +111E1..111F4 ; Number # No [20] SINHALA ARCHAIC DIGIT ONE..SINHALA ARCHAIC NUMBER ONE THOUSAND +112F0..112F9 ; Number # Nd [10] KHUDAWADI DIGIT ZERO..KHUDAWADI DIGIT NINE +11450..11459 ; Number # Nd [10] NEWA DIGIT ZERO..NEWA DIGIT NINE +114D0..114D9 ; Number # Nd [10] TIRHUTA DIGIT ZERO..TIRHUTA DIGIT NINE +11650..11659 ; Number # Nd [10] MODI DIGIT ZERO..MODI DIGIT NINE +116C0..116C9 ; Number # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE +11730..11739 ; Number # Nd [10] AHOM DIGIT ZERO..AHOM DIGIT NINE +1173A..1173B ; Number # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY +11C50..11C59 ; Number # Nd [10] BHAIKSUKI DIGIT ZERO..BHAIKSUKI DIGIT NINE +11C5A..11C6C ; Number # No [19] BHAIKSUKI NUMBER ONE..BHAIKSUKI HUNDREDS UNIT MARK +11D50..11D59 ; Number # Nd [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE + +# ================================================ + +# Indic_Syllabic_Category=Brahmi_Joining_Number + +# Brahmi Joining Number (similar to Number in that in can be used as +# vowel-holders like Consonant_Placeholder, but may also be joined by +# a 
Number_Joiner of the same script, e.g. in Brahmi) + +# [Not derivable] + +11052..11065 ; Brahmi_Joining_Number # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND + +# EOF diff --git a/data/11.0.0-indic-positional-category.txt b/data/11.0.0-indic-positional-category.txt new file mode 100644 index 0000000..9c07cd9 --- /dev/null +++ b/data/11.0.0-indic-positional-category.txt @@ -0,0 +1,735 @@ +# IndicPositionalCategory-11.0.0.txt +# Date: 2018-02-05, 16:21:00 GMT [KW, RP] +# © 2018 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Positional_Category enumerated property +# +# Scope: This property is aimed at the problem of +# the specification of syllabic structure for Indic scripts. +# Because dependent vowels (matras), visible viramas, and other +# characters are placed in notional slots around the consonant (or +# consonant cluster) core of an Indic syllable, there may be +# cooccurrence constraints or other interactions. Also, it may be +# desirable, in cases where more than one such character may occur in +# sequence, as for example, in a top slot and a bottom slot, to +# specify preferred orders for spelling. As such, this property +# is designed primarily to supplement the Indic_Syllabic_Category +# property. +# +# Note that this property is *not* intended as +# a prescriptive property regarding display or font design, +# for a number of reasons. Good font design requires information +# that is outside the context of a character encoding standard, +# and is best handled in other venues. For Indic dependent +# vowels and similar characters, in particular: +# +# 1. Matra placement may vary somewhat based on typeface design. +# 2. 
Matra placement, even within a single script, may vary +# somewhat according to historic period or local conventions. +# 3. Matra placement may be changed by explicit orthographic reform +# decisions. +# 4. Matras may ligate in various ways with a consonant (or even +# other elements of a syllable) instead of occurring in a +# discrete location. +# 5. Matra display may be contextually determined. This is +# notable, for example, in the Tamil script, where the shape +# and placement of -u and -uu vowels depends strongly on +# which consonant they adjoin. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Positional_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. +# +# The scripts assessed as containing dependent vowels or similar characters +# in the structural sense used for the Indic_Positional_Category are the +# following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dogra, Grantha, Gujarati, Gunjala Gondi, +# Gurmukhi, Hanunoo, Javanese, Kaithi, Kannada, Kharoshthi, Khmer, +# Khojki, Khudawadi, Lao, Lepcha, Limbu, Makasar, Malayalam, Marchen, +# Masaram Gondi, Meetei Mayek, Modi, Myanmar, Newa, New Tai Lue, +# Oriya, Rejang, Saurashtra, Sharada, Siddham, Sinhala, Soyombo, +# Sundanese, Syloti Nagri, Tagalog, Tagbanwa, Tai Tham, Tai Viet, +# Takri, Tamil, Telugu, Thai, Tibetan, Tirhuta, and Zanabazar Square. +# +# All characters for all other scripts not in that list +# take the default value for this property. +# +# See IndicSyllabicCategory.txt for a slightly more extended +# list of Indic scripts, including those which do not have +# positional characters. 
Currently, those additional +# Indic scripts without positional characters are +# Kayah Li, Mahajani, Multani, Phags-pa, and Tai Le. +# +# Notes: +# +# 1. The following characters are all assigned the positional category Right, +# but may have different positions in some cases: +# * U+0BC1 TAMIL VOWEL SIGN U and U+0BC2 TAMIL VOWEL SIGN UU have +# contextually variable placement in Tamil. +# * U+0D41 MALAYALAM VOWEL SIGN U and U+0D42 MALAYALAM VOWEL SIGN UU form +# complex ligatures with consonants in older Malayalam orthography. +# * U+11341 GRANTHA VOWEL SIGN U and U+11342 GRANTHA VOWEL SIGN UU have +# contextually variable placement in Grantha. +# * U+11440 NEWA VOWEL SIGN O and U+11441 NEWA VOWEL SIGN AU have contextually +# variable placement in Newa. +# +# 2. The following characters are all assigned the positional category Top, +# but may have different positions in some cases: +# * U+1143E NEWA VOWEL SIGN E and U+1143F NEWA VOWEL SIGN AI have contextually +# variable placement in Newa. +# +# 3. The following characters are all assigned the positional category Bottom, +# but may have different positions in some cases: +# * U+102F MYANMAR VOWEL SIGN U and U+1030 MYANMAR VOWEL SIGN UU have +# contextually variable placement in Myanmar. + + +# ================================================ + +# Property: Indic_Positional_Category +# +# All code points not explicitly listed for Indic_Positional_Category +# have the value NA (not applicable). 
+# +# @missing: 0000..10FFFF; NA + +# ------------------------------------------------ + +# Indic_Positional_Category=Right + +0903 ; Right # Mc DEVANAGARI SIGN VISARGA +093B ; Right # Mc DEVANAGARI VOWEL SIGN OOE +093E ; Right # Mc DEVANAGARI VOWEL SIGN AA +0940 ; Right # Mc DEVANAGARI VOWEL SIGN II +0949..094C ; Right # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094F ; Right # Mc DEVANAGARI VOWEL SIGN AW +0982..0983 ; Right # Mc [2] BENGALI SIGN ANUSVARA..BENGALI SIGN VISARGA +09BE ; Right # Mc BENGALI VOWEL SIGN AA +09C0 ; Right # Mc BENGALI VOWEL SIGN II +09D7 ; Right # Mc BENGALI AU LENGTH MARK +0A03 ; Right # Mc GURMUKHI SIGN VISARGA +0A3E ; Right # Mc GURMUKHI VOWEL SIGN AA +0A40 ; Right # Mc GURMUKHI VOWEL SIGN II +0A83 ; Right # Mc GUJARATI SIGN VISARGA +0ABE ; Right # Mc GUJARATI VOWEL SIGN AA +0AC0 ; Right # Mc GUJARATI VOWEL SIGN II +0ACB..0ACC ; Right # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0B02..0B03 ; Right # Mc [2] ORIYA SIGN ANUSVARA..ORIYA SIGN VISARGA +0B3E ; Right # Mc ORIYA VOWEL SIGN AA +0B40 ; Right # Mc ORIYA VOWEL SIGN II +0BBE..0BBF ; Right # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC1..0BC2 ; Right # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BD7 ; Right # Mc TAMIL AU LENGTH MARK +0C01..0C03 ; Right # Mc [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN VISARGA +0C41..0C44 ; Right # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C82..0C83 ; Right # Mc [2] KANNADA SIGN ANUSVARA..KANNADA SIGN VISARGA +0CBE ; Right # Mc KANNADA VOWEL SIGN AA +0CC1..0CC4 ; Right # Mc [4] KANNADA VOWEL SIGN U..KANNADA VOWEL SIGN VOCALIC RR +0CD5..0CD6 ; Right # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0D02..0D03 ; Right # Mc [2] MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA +0D3E..0D40 ; Right # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D42 ; Right # Mn [2] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN UU +0D57 ; Right # Mc MALAYALAM AU LENGTH MARK +0D82..0D83 ; Right # 
Mc [2] SINHALA SIGN ANUSVARAYA..SINHALA SIGN VISARGAYA +0DCF..0DD1 ; Right # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD8 ; Right # Mc SINHALA VOWEL SIGN GAETTA-PILLA +0DDF ; Right # Mc SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Right # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Right # Lo THAI CHARACTER SARA A +0E32..0E33 ; Right # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E45 ; Right # Lo THAI CHARACTER LAKKHANGYAO +0EB0 ; Right # Lo LAO VOWEL SIGN A +0EB2..0EB3 ; Right # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0F3E ; Right # Mc TIBETAN SIGN YAR TSHES +0F7F ; Right # Mc TIBETAN SIGN RNAM BCAD +102B..102C ; Right # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +1038 ; Right # Mc MYANMAR SIGN VISARGA +103B ; Right # Mc MYANMAR CONSONANT SIGN MEDIAL YA +1056..1057 ; Right # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1062..1064 ; Right # Mc [3] MYANMAR VOWEL SIGN SGAW KAREN EU..MYANMAR TONE MARK SGAW KAREN KE PHO +1067..106D ; Right # Mc [7] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1083 ; Right # Mc MYANMAR VOWEL SIGN SHAN AA +1087..108C ; Right # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108F ; Right # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109C ; Right # Mc [3] MYANMAR SIGN KHAMTI TONE-1..MYANMAR VOWEL SIGN AITON A +17B6 ; Right # Mc KHMER VOWEL SIGN AA +17C7..17C8 ; Right # Mc [2] KHMER SIGN REAHMUK..KHMER SIGN YUUKALEAPINTU +1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI +1929..192B ; Right # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1930..1931 ; Right # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Right # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +19B0..19B4 ; Right # Lo [5] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN UU +19B8..19B9 ; Right # Lo [2] NEW TAI LUE VOWEL 
SIGN OA..NEW TAI LUE VOWEL SIGN UE +19BB..19C0 ; Right # Lo [6] NEW TAI LUE VOWEL SIGN AAY..NEW TAI LUE VOWEL SIGN IY +19C8..19C9 ; Right # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A1A ; Right # Mc BUGINESE VOWEL SIGN O +1A57 ; Right # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A61 ; Right # Mc TAI THAM VOWEL SIGN A +1A63..1A64 ; Right # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A6D ; Right # Mc TAI THAM VOWEL SIGN OY +1B04 ; Right # Mc BALINESE SIGN BISAH +1B35 ; Right # Mc BALINESE VOWEL SIGN TEDUNG +1B44 ; Right # Mc BALINESE ADEG ADEG +1B82 ; Right # Mc SUNDANESE SIGN PANGWISAD +1BA1 ; Right # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA7 ; Right # Mc SUNDANESE VOWEL SIGN PANOLONG +1BAA ; Right # Mc SUNDANESE SIGN PAMAAEH +1BE7 ; Right # Mc BATAK VOWEL SIGN E +1BEA..1BEC ; Right # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BEE ; Right # Mc BATAK VOWEL SIGN U +1BF2..1BF3 ; Right # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +1C24..1C26 ; Right # Mc [3] LEPCHA SUBJOINED LETTER YA..LEPCHA VOWEL SIGN AA +1C2A..1C2B ; Right # Mc [2] LEPCHA VOWEL SIGN U..LEPCHA VOWEL SIGN UU +1CE1 ; Right # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF7 ; Right # Mc VEDIC SIGN ATIKRAMA +A823..A824 ; Right # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A827 ; Right # Mc SYLOTI NAGRI VOWEL SIGN OO +A880..A881 ; Right # Mc [2] SAURASHTRA SIGN ANUSVARA..SAURASHTRA SIGN VISARGA +A8B4..A8C3 ; Right # Mc [16] SAURASHTRA CONSONANT SIGN HAARU..SAURASHTRA VOWEL SIGN AU +A952..A953 ; Right # Mc [2] REJANG CONSONANT SIGN H..REJANG VIRAMA +A983 ; Right # Mc JAVANESE SIGN WIGNYAN +A9B4..A9B5 ; Right # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9BD..A9BE ; Right # Mc [2] JAVANESE CONSONANT SIGN KERET..JAVANESE CONSONANT SIGN PENGKAL +AA33 ; Right # Mc CHAM CONSONANT SIGN YA +AA4D ; Right # Mc CHAM CONSONANT SIGN FINAL H +AA7B ; Right # Mc MYANMAR SIGN PAO KAREN TONE +AA7D ; Right # Mc MYANMAR SIGN TAI LAING TONE-5 +AAB1 ; 
Right # Lo TAI VIET VOWEL AA +AABA ; Right # Lo TAI VIET VOWEL UA +AABD ; Right # Lo TAI VIET VOWEL AN +AAEF ; Right # Mc MEETEI MAYEK VOWEL SIGN AAU +AAF5 ; Right # Mc MEETEI MAYEK VOWEL SIGN VISARGA +ABE3..ABE4 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE6..ABE7 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE9..ABEA ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +ABEC ; Right # Mc MEETEI MAYEK LUM IYEK +11000 ; Right # Mc BRAHMI SIGN CANDRABINDU +11002 ; Right # Mc BRAHMI SIGN VISARGA +11082 ; Right # Mc KAITHI SIGN VISARGA +110B0 ; Right # Mc KAITHI VOWEL SIGN AA +110B2 ; Right # Mc KAITHI VOWEL SIGN II +110B7..110B8 ; Right # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11145..11146 ; Right # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +11182 ; Right # Mc SHARADA SIGN VISARGA +111B3 ; Right # Mc SHARADA VOWEL SIGN AA +111B5 ; Right # Mc SHARADA VOWEL SIGN II +111C0 ; Right # Mc SHARADA SIGN VIRAMA +1122C..1122E ; Right # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +11235 ; Right # Mc KHOJKI SIGN VIRAMA +112E0 ; Right # Mc KHUDAWADI VOWEL SIGN AA +112E2 ; Right # Mc KHUDAWADI VOWEL SIGN II +11302..11303 ; Right # Mc [2] GRANTHA SIGN ANUSVARA..GRANTHA SIGN VISARGA +1133E..1133F ; Right # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11341..11344 ; Right # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +1134D ; Right # Mc GRANTHA SIGN VIRAMA +11357 ; Right # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Right # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435 ; Right # Mc NEWA VOWEL SIGN AA +11437 ; Right # Mc NEWA VOWEL SIGN II +11440..11441 ; Right # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +11445 ; Right # Mc NEWA SIGN VISARGA +114B0 ; Right # Mc TIRHUTA VOWEL SIGN AA +114B2 ; Right # Mc TIRHUTA VOWEL SIGN II +114BD ; Right # Mc TIRHUTA VOWEL SIGN SHORT O +114C1 ; Right # Mc TIRHUTA SIGN VISARGA 
+115AF ; Right # Mc SIDDHAM VOWEL SIGN AA +115B1 ; Right # Mc SIDDHAM VOWEL SIGN II +115BE ; Right # Mc SIDDHAM SIGN VISARGA +11630..11632 ; Right # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +1163B..1163C ; Right # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +1163E ; Right # Mc MODI SIGN VISARGA +116AC ; Right # Mc TAKRI SIGN VISARGA +116AF ; Right # Mc TAKRI VOWEL SIGN II +116B6 ; Right # Mc TAKRI SIGN VIRAMA +11720..11721 ; Right # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +1182C ; Right # Mc DOGRA VOWEL SIGN AA +1182E ; Right # Mc DOGRA VOWEL SIGN II +11838 ; Right # Mc DOGRA SIGN VISARGA +11A39 ; Right # Mc ZANABAZAR SQUARE SIGN VISARGA +11A57..11A58 ; Right # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A97 ; Right # Mc SOYOMBO SIGN VISARGA +11C2F ; Right # Mc BHAIKSUKI VOWEL SIGN AA +11C3E ; Right # Mc BHAIKSUKI SIGN VISARGA +11CA9 ; Right # Mc MARCHEN SUBJOINED LETTER YA +11CB4 ; Right # Mc MARCHEN VOWEL SIGN O +11D8A..11D8E ; Right # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D93..11D94 ; Right # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11D96 ; Right # Mc GUNJALA GONDI SIGN VISARGA +11EF6 ; Right # Mc MAKASAR VOWEL SIGN O + +# Indic_Positional_Category=Left + +093F ; Left # Mc DEVANAGARI VOWEL SIGN I +094E ; Left # Mc DEVANAGARI VOWEL SIGN PRISHTHAMATRA E +09BF ; Left # Mc BENGALI VOWEL SIGN I +09C7..09C8 ; Left # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +0A3F ; Left # Mc GURMUKHI VOWEL SIGN I +0ABF ; Left # Mc GUJARATI VOWEL SIGN I +0B47 ; Left # Mc ORIYA VOWEL SIGN E +0BC6..0BC8 ; Left # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0D46..0D48 ; Left # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0DD9 ; Left # Mc SINHALA VOWEL SIGN KOMBUVA +0DDB ; Left # Mc SINHALA VOWEL SIGN KOMBU DEKA +0F3F ; Left # Mc TIBETAN SIGN MAR TSHES +1031 ; Left # Mc MYANMAR VOWEL SIGN E +1084 ; Left # Mc MYANMAR VOWEL SIGN SHAN E +17C1..17C3 ; Left # Mc [3] KHMER VOWEL SIGN E..KHMER VOWEL 
SIGN AI +1A19 ; Left # Mc BUGINESE VOWEL SIGN E +1A55 ; Left # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A6E..1A72 ; Left # Mc [5] TAI THAM VOWEL SIGN E..TAI THAM VOWEL SIGN THAM AI +1B3E..1B3F ; Left # Mc [2] BALINESE VOWEL SIGN TALING..BALINESE VOWEL SIGN TALING REPA +1BA6 ; Left # Mc SUNDANESE VOWEL SIGN PANAELAENG +1C27..1C28 ; Left # Mc [2] LEPCHA VOWEL SIGN I..LEPCHA VOWEL SIGN O +1C34..1C35 ; Left # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A9BA..A9BB ; Left # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +AA2F..AA30 ; Left # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA34 ; Left # Mc CHAM CONSONANT SIGN RA +AAEB ; Left # Mc MEETEI MAYEK VOWEL SIGN II +AAEE ; Left # Mc MEETEI MAYEK VOWEL SIGN AU +110B1 ; Left # Mc KAITHI VOWEL SIGN I +1112C ; Left # Mc CHAKMA VOWEL SIGN E +111B4 ; Left # Mc SHARADA VOWEL SIGN I +112E1 ; Left # Mc KHUDAWADI VOWEL SIGN I +11347..11348 ; Left # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +11436 ; Left # Mc NEWA VOWEL SIGN I +114B1 ; Left # Mc TIRHUTA VOWEL SIGN I +114B9 ; Left # Mc TIRHUTA VOWEL SIGN E +115B0 ; Left # Mc SIDDHAM VOWEL SIGN I +115B8 ; Left # Mc SIDDHAM VOWEL SIGN E +116AE ; Left # Mc TAKRI VOWEL SIGN I +11726 ; Left # Mc AHOM VOWEL SIGN E +1182D ; Left # Mc DOGRA VOWEL SIGN I +11CB1 ; Left # Mc MARCHEN VOWEL SIGN I +11EF5 ; Left # Mc MAKASAR VOWEL SIGN E + +# Indic_Positional_Category=Visual_Order_Left + +# These are dependent vowels that occur to the left of the consonant +# letter in a syllable, but which occur in scripts using the visual order +# model, instead of the logical order model. Because of the different +# model, these left-side vowels occur first in the backing store (before +# the consonant letter) and are not reordered during text rendering. 
+# +# [Derivation: Logical_Order_Exception=Yes] + +0E40..0E44 ; Visual_Order_Left # Lo [5] THAI CHARACTER SARA E..THAI CHARACTER SARA AI MAIMALAI +0EC0..0EC4 ; Visual_Order_Left # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +19B5..19B7 ; Visual_Order_Left # Lo [3] NEW TAI LUE VOWEL SIGN E..NEW TAI LUE VOWEL SIGN O +19BA ; Visual_Order_Left # Lo NEW TAI LUE VOWEL SIGN AY +AAB5..AAB6 ; Visual_Order_Left # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB9 ; Visual_Order_Left # Lo TAI VIET VOWEL UEA +AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL AY + +# Indic_Positional_Category=Left_And_Right + +09CB..09CC ; Left_And_Right # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +0B4B ; Left_And_Right # Mc ORIYA VOWEL SIGN O +0BCA..0BCC ; Left_And_Right # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0D4A..0D4C ; Left_And_Right # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0DDC ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA +0DDE ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA +17C0 ; Left_And_Right # Mc KHMER VOWEL SIGN IE +17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU +1B40..1B41 ; Left_And_Right # Mc [2] BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1134B..1134C ; Left_And_Right # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +114BC ; Left_And_Right # Mc TIRHUTA VOWEL SIGN O +114BE ; Left_And_Right # Mc TIRHUTA VOWEL SIGN AU +115BA ; Left_And_Right # Mc SIDDHAM VOWEL SIGN O + +# Indic_Positional_Category=Top + +0900..0902 ; Top # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +093A ; Top # Mn DEVANAGARI VOWEL SIGN OE +0945..0948 ; Top # Mn [4] DEVANAGARI VOWEL SIGN CANDRA E..DEVANAGARI VOWEL SIGN AI +0951 ; Top # Mn DEVANAGARI STRESS SIGN UDATTA +0953..0955 ; Top # Mn [3] DEVANAGARI GRAVE ACCENT..DEVANAGARI VOWEL SIGN CANDRA LONG E +0981 ; Top # Mn BENGALI SIGN CANDRABINDU +09FE ; Top # Mn BENGALI SANDHI 
MARK +0A01..0A02 ; Top # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A47..0A48 ; Top # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Top # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0A70..0A71 ; Top # Mn [2] GURMUKHI TIPPI..GURMUKHI ADDAK +0A81..0A82 ; Top # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0AC5 ; Top # Mn GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Top # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AFA..0AFF ; Top # Mn [6] GUJARATI SIGN SUKUN..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B01 ; Top # Mn ORIYA SIGN CANDRABINDU +0B3F ; Top # Mn ORIYA VOWEL SIGN I +0B56 ; Top # Mn ORIYA AI LENGTH MARK +0B82 ; Top # Mn TAMIL SIGN ANUSVARA +0BC0 ; Top # Mn TAMIL VOWEL SIGN II +0BCD ; Top # Mn TAMIL SIGN VIRAMA +0C00 ; Top # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C04 ; Top # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C3E..0C40 ; Top # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C46..0C47 ; Top # Mn [2] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN EE +0C4A..0C4D ; Top # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA +0C55 ; Top # Mn TELUGU LENGTH MARK +0C81 ; Top # Mn KANNADA SIGN CANDRABINDU +0CBF ; Top # Mn KANNADA VOWEL SIGN I +0CC6 ; Top # Mn KANNADA VOWEL SIGN E +0CCC..0CCD ; Top # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA +0D00..0D01 ; Top # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D3B..0D3C ; Top # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0D4D ; Top # Mn MALAYALAM SIGN VIRAMA +0DCA ; Top # Mn SINHALA SIGN AL-LAKUNA +0DD2..0DD3 ; Top # Mn [2] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN DIGA IS-PILLA +0E31 ; Top # Mn THAI CHARACTER MAI HAN-AKAT +0E34..0E37 ; Top # Mn [4] THAI CHARACTER SARA I..THAI CHARACTER SARA UEE +0E47..0E4E ; Top # Mn [8] THAI CHARACTER MAITAIKHU..THAI CHARACTER YAMAKKAN +0EB1 ; Top # Mn LAO VOWEL SIGN MAI KAN +0EB4..0EB7 ; Top # Mn [4] LAO VOWEL SIGN I..LAO VOWEL SIGN YY +0EBB ; 
Top # Mn LAO VOWEL SIGN MAI KON +0EC8..0ECD ; Top # Mn [6] LAO TONE MAI EK..LAO NIGGAHITA +0F39 ; Top # Mn TIBETAN MARK TSA -PHRU +0F72 ; Top # Mn TIBETAN VOWEL SIGN I +0F7A..0F7E ; Top # Mn [5] TIBETAN VOWEL SIGN E..TIBETAN SIGN RJES SU NGA RO +0F80 ; Top # Mn TIBETAN VOWEL SIGN REVERSED I +0F82..0F83 ; Top # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +0F86..0F87 ; Top # Mn [2] TIBETAN SIGN LCI RTAGS..TIBETAN SIGN YANG RTAGS +102D..102E ; Top # Mn [2] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN II +1032..1036 ; Top # Mn [5] MYANMAR VOWEL SIGN AI..MYANMAR SIGN ANUSVARA +103A ; Top # Mn MYANMAR SIGN ASAT +1071..1074 ; Top # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1085..1086 ; Top # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109D ; Top # Mn MYANMAR VOWEL SIGN AITON AI +1712 ; Top # Mn TAGALOG VOWEL SIGN I +1732 ; Top # Mn HANUNOO VOWEL SIGN I +1752 ; Top # Mn BUHID VOWEL SIGN I +1772 ; Top # Mn TAGBANWA VOWEL SIGN I +17B7..17BA ; Top # Mn [4] KHMER VOWEL SIGN I..KHMER VOWEL SIGN YY +17C6 ; Top # Mn KHMER SIGN NIKAHIT +17C9..17D1 ; Top # Mn [9] KHMER SIGN MUUSIKATOAN..KHMER SIGN VIRIAM +17D3 ; Top # Mn KHMER SIGN BATHAMASAT +17DD ; Top # Mn KHMER SIGN ATTHACAN +1920..1921 ; Top # Mn [2] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN I +1927..1928 ; Top # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Top # Mn LIMBU SIGN KEMPHRENG +1A17 ; Top # Mn BUGINESE VOWEL SIGN I +1A1B ; Top # Mn BUGINESE VOWEL SIGN AE +1A58..1A5A ; Top # Mn [3] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN LOW PA +1A62 ; Top # Mn TAI THAM VOWEL SIGN MAI SAT +1A65..1A68 ; Top # Mn [4] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN UUE +1A6B ; Top # Mn TAI THAM VOWEL SIGN O +1A73..1A7C ; Top # Mn [10] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN KHUEN-LUE KARAN +1B00..1B03 ; Top # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG +1B34 ; Top # Mn BALINESE SIGN REREKAN +1B36..1B37 ; Top # Mn [2] BALINESE VOWEL SIGN 
ULU..BALINESE VOWEL SIGN ULU SARI +1B42 ; Top # Mn BALINESE VOWEL SIGN PEPET +1B6B ; Top # Mn BALINESE MUSICAL SYMBOL COMBINING TEGEH +1B6D..1B73 ; Top # Mn [7] BALINESE MUSICAL SYMBOL COMBINING KEMPUL..BALINESE MUSICAL SYMBOL COMBINING GONG +1B80..1B81 ; Top # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR +1BA4 ; Top # Mn SUNDANESE VOWEL SIGN PANGHULU +1BA8..1BA9 ; Top # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE6 ; Top # Mn BATAK SIGN TOMPI +1BE8..1BE9 ; Top # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BED ; Top # Mn BATAK VOWEL SIGN KARO O +1BEF..1BF1 ; Top # Mn [3] BATAK VOWEL SIGN U FOR SIMALUNGUN SA..BATAK CONSONANT SIGN H +1C2D..1C33 ; Top # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +1C36 ; Top # Mn LEPCHA SIGN RAN +1CD0..1CD2 ; Top # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CDA..1CDB ; Top # Mn [2] VEDIC TONE DOUBLE SVARITA..VEDIC TONE TRIPLE SVARITA +1CE0 ; Top # Mn VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CF4 ; Top # Mn VEDIC TONE CANDRA ABOVE +1DFB ; Top # Mn COMBINING DELETION MARK +A806 ; Top # Mn SYLOTI NAGRI SIGN HASANTA +A80B ; Top # Mn SYLOTI NAGRI SIGN ANUSVARA +A826 ; Top # Mn SYLOTI NAGRI VOWEL SIGN E +A8C5 ; Top # Mn SAURASHTRA SIGN CANDRABINDU +A8E0..A8F1 ; Top # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +A8FF ; Top # Mn DEVANAGARI VOWEL SIGN AY +A94A ; Top # Mn REJANG VOWEL SIGN AI +A94F..A951 ; Top # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A980..A982 ; Top # Mn [3] JAVANESE SIGN PANYANGGA..JAVANESE SIGN LAYAR +A9B3 ; Top # Mn JAVANESE SIGN CECAK TELU +A9B6..A9B7 ; Top # Mn [2] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN WULU MELIK +A9BC ; Top # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Top # Mn MYANMAR SIGN SHAN SAW +AA29..AA2C ; Top # Mn [4] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN EI +AA2E ; Top # Mn CHAM VOWEL SIGN OE +AA31 ; Top # Mn CHAM VOWEL SIGN AU +AA43 ; Top # Mn CHAM CONSONANT SIGN FINAL NG +AA4C ; Top 
# Mn CHAM CONSONANT SIGN FINAL M +AA7C ; Top # Mn MYANMAR SIGN TAI LAING TONE-2 +AAB0 ; Top # Mn TAI VIET MAI KANG +AAB2..AAB3 ; Top # Mn [2] TAI VIET VOWEL I..TAI VIET VOWEL UE +AAB7..AAB8 ; Top # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AABE..AABF ; Top # Mn [2] TAI VIET VOWEL AM..TAI VIET TONE MAI EK +AAC1 ; Top # Mn TAI VIET TONE MAI THO +AAED ; Top # Mn MEETEI MAYEK VOWEL SIGN AAI +ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP +10A05 ; Top # Mn KHAROSHTHI VOWEL SIGN E +10A0F ; Top # Mn KHAROSHTHI SIGN VISARGA +10A38 ; Top # Mn KHAROSHTHI SIGN BAR ABOVE +11001 ; Top # Mn BRAHMI SIGN ANUSVARA +11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II +11042..11046 ; Top # Mn [5] BRAHMI VOWEL SIGN E..BRAHMI VIRAMA +11080..11081 ; Top # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI VOWEL SIGN AI +11100..11102 ; Top # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA +11127..11129 ; Top # Mn [3] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN II +1112D ; Top # Mn CHAKMA VOWEL SIGN AI +11130 ; Top # Mn CHAKMA VOWEL SIGN OI +11134 ; Top # Mn CHAKMA MAAYYAA +11180..11181 ; Top # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +111BC..111BE ; Top # Mn [3] SHARADA VOWEL SIGN E..SHARADA VOWEL SIGN O +111CB ; Top # Mn SHARADA VOWEL MODIFIER MARK +11230..11231 ; Top # Mn [2] KHOJKI VOWEL SIGN E..KHOJKI VOWEL SIGN AI +11234 ; Top # Mn KHOJKI SIGN ANUSVARA +11236..11237 ; Top # Mn [2] KHOJKI SIGN NUKTA..KHOJKI SIGN SHADDA +1123E ; Top # Mn KHOJKI SIGN SUKUN +112DF ; Top # Mn KHUDAWADI SIGN ANUSVARA +112E5..112E8 ; Top # Mn [4] KHUDAWADI VOWEL SIGN E..KHUDAWADI VOWEL SIGN AU +11301 ; Top # Mn GRANTHA SIGN CANDRABINDU +11340 ; Top # Mn GRANTHA VOWEL SIGN II +11366..1136C ; Top # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Top # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA +1143E..1143F ; Top # Mn [2] NEWA VOWEL SIGN E..NEWA VOWEL SIGN AI 
+11443..11444 ; Top # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +1145E ; Top # Mn NEWA SANDHI MARK +114BA ; Top # Mn TIRHUTA VOWEL SIGN SHORT E +114BF..114C0 ; Top # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Top # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +11639..1163A ; Top # Mn [2] MODI VOWEL SIGN E..MODI VOWEL SIGN AI +1163D ; Top # Mn MODI SIGN ANUSVARA +11640 ; Top # Mn MODI SIGN ARDHACANDRA +116AB ; Top # Mn TAKRI SIGN ANUSVARA +116AD ; Top # Mn TAKRI VOWEL SIGN AA +116B2..116B5 ; Top # Mn [4] TAKRI VOWEL SIGN E..TAKRI VOWEL SIGN AU +1171F ; Top # Mn AHOM CONSONANT SIGN MEDIAL LIGATING RA +11722..11723 ; Top # Mn [2] AHOM VOWEL SIGN I..AHOM VOWEL SIGN II +11727 ; Top # Mn AHOM VOWEL SIGN AW +11729..1172B ; Top # Mn [3] AHOM VOWEL SIGN AI..AHOM SIGN KILLER +11833..11837 ; Top # Mn [5] DOGRA VOWEL SIGN E..DOGRA SIGN ANUSVARA +11A01 ; Top # Mn ZANABAZAR SQUARE VOWEL SIGN I +11A04..11A09 ; Top # Mn [6] ZANABAZAR SQUARE VOWEL SIGN E..ZANABAZAR SQUARE VOWEL SIGN REVERSED I +11A35..11A38 ; Top # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A51 ; Top # Mn SOYOMBO VOWEL SIGN I +11A54..11A56 ; Top # Mn [3] SOYOMBO VOWEL SIGN E..SOYOMBO VOWEL SIGN OE +11A96 ; Top # Mn SOYOMBO SIGN ANUSVARA +11A98 ; Top # Mn SOYOMBO GEMINATION MARK +11C30..11C31 ; Top # Mn [2] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN II +11C38..11C3D ; Top # Mn [6] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI SIGN ANUSVARA +11CB3 ; Top # Mn MARCHEN VOWEL SIGN E +11CB5..11CB6 ; Top # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D31..11D35 ; Top # Mn [5] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN UU +11D3A ; Top # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Top # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F..11D41 ; Top # Mn [3] MASARAM GONDI VOWEL SIGN AU..MASARAM GONDI SIGN VISARGA +11D43 ; Top # Mn MASARAM GONDI SIGN CANDRA +11D90..11D91 ; Top # Mn [2] GUNJALA GONDI VOWEL SIGN 
EE..GUNJALA GONDI VOWEL SIGN AI +11D95 ; Top # Mn GUNJALA GONDI SIGN ANUSVARA +11EF3 ; Top # Mn MAKASAR VOWEL SIGN I + +# Indic_Positional_Category=Bottom + +093C ; Bottom # Mn DEVANAGARI SIGN NUKTA +0941..0944 ; Bottom # Mn [4] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN VOCALIC RR +094D ; Bottom # Mn DEVANAGARI SIGN VIRAMA +0952 ; Bottom # Mn DEVANAGARI STRESS SIGN ANUDATTA +0956..0957 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN UE..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BC ; Bottom # Mn BENGALI SIGN NUKTA +09C1..09C4 ; Bottom # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09CD ; Bottom # Mn BENGALI SIGN VIRAMA +09E2..09E3 ; Bottom # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3C ; Bottom # Mn GURMUKHI SIGN NUKTA +0A41..0A42 ; Bottom # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A4D ; Bottom # Mn GURMUKHI SIGN VIRAMA +0A75 ; Bottom # Mn GURMUKHI SIGN YAKASH +0ABC ; Bottom # Mn GUJARATI SIGN NUKTA +0AC1..0AC4 ; Bottom # Mn [4] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN VOCALIC RR +0ACD ; Bottom # Mn GUJARATI SIGN VIRAMA +0AE2..0AE3 ; Bottom # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3C ; Bottom # Mn ORIYA SIGN NUKTA +0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B4D ; Bottom # Mn ORIYA SIGN VIRAMA +0B62..0B63 ; Bottom # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0C56 ; Bottom # Mn TELUGU AI LENGTH MARK +0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBC ; Bottom # Mn KANNADA SIGN NUKTA +0CE2..0CE3 ; Bottom # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D43..0D44 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC R..MALAYALAM VOWEL SIGN VOCALIC RR +0D62..0D63 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DD4 ; Bottom # Mn SINHALA VOWEL SIGN KETTI 
PAA-PILLA +0DD6 ; Bottom # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0E38..0E3A ; Bottom # Mn [3] THAI CHARACTER SARA U..THAI CHARACTER PHINTHU +0EB8..0EB9 ; Bottom # Mn [2] LAO VOWEL SIGN U..LAO VOWEL SIGN UU +0EBC ; Bottom # Mn LAO SEMIVOWEL SIGN LO +0F18..0F19 ; Bottom # Mn [2] TIBETAN ASTROLOGICAL SIGN -KHYUD PA..TIBETAN ASTROLOGICAL SIGN SDONG TSHUGS +0F35 ; Bottom # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Bottom # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0F71 ; Bottom # Mn TIBETAN VOWEL SIGN AA +0F74..0F75 ; Bottom # Mn [2] TIBETAN VOWEL SIGN U..TIBETAN VOWEL SIGN UU +0F84 ; Bottom # Mn TIBETAN MARK HALANTA +0F8D..0F97 ; Bottom # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Bottom # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +0FC6 ; Bottom # Mn TIBETAN SYMBOL PADMA GDAN +102F..1030 ; Bottom # Mn [2] MYANMAR VOWEL SIGN U..MYANMAR VOWEL SIGN UU +1037 ; Bottom # Mn MYANMAR SIGN DOT BELOW +103D..103E ; Bottom # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +1058..1059 ; Bottom # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +105E..1060 ; Bottom # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Bottom # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +108D ; Bottom # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +1713..1714 ; Bottom # Mn [2] TAGALOG VOWEL SIGN U..TAGALOG SIGN VIRAMA +1733..1734 ; Bottom # Mn [2] HANUNOO VOWEL SIGN U..HANUNOO SIGN PAMUDPOD +1753 ; Bottom # Mn BUHID VOWEL SIGN U +1773 ; Bottom # Mn TAGBANWA VOWEL SIGN U +17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA +1922 ; Bottom # Mn LIMBU VOWEL SIGN U +1932 ; Bottom # Mn LIMBU SMALL LETTER ANUSVARA +1939 ; Bottom # Mn LIMBU SIGN MUKPHRENG +193B ; Bottom # Mn LIMBU SIGN SA-I +1A18 ; Bottom # Mn BUGINESE VOWEL SIGN U +1A56 ; Bottom # Mn TAI THAM CONSONANT SIGN MEDIAL LA +1A5B..1A5E ; Bottom # Mn [4] TAI THAM CONSONANT SIGN 
HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1A69..1A6A ; Bottom # Mn [2] TAI THAM VOWEL SIGN U..TAI THAM VOWEL SIGN UU +1A6C ; Bottom # Mn TAI THAM VOWEL SIGN OA BELOW +1A7F ; Bottom # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1B38..1B3A ; Bottom # Mn [3] BALINESE VOWEL SIGN SUKU..BALINESE VOWEL SIGN RA REPA +1B6C ; Bottom # Mn BALINESE MUSICAL SYMBOL COMBINING ENDEP +1BA2..1BA3 ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BA5 ; Bottom # Mn SUNDANESE VOWEL SIGN PANYUKU +1BAC..1BAD ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C2C ; Bottom # Mn LEPCHA VOWEL SIGN E +1C37 ; Bottom # Mn LEPCHA SIGN NUKTA +1CD5..1CD9 ; Bottom # Mn [5] VEDIC TONE YAJURVEDIC AGGRAVATED INDEPENDENT SVARITA..VEDIC TONE YAJURVEDIC KATHAKA INDEPENDENT SVARITA SCHROEDER +1CDC..1CDF ; Bottom # Mn [4] VEDIC TONE KATHAKA ANUDATTA..VEDIC TONE THREE DOTS BELOW +1CED ; Bottom # Mn VEDIC SIGN TIRYAK +A825 ; Bottom # Mn SYLOTI NAGRI VOWEL SIGN U +A8C4 ; Bottom # Mn SAURASHTRA SIGN VIRAMA +A92B..A92D ; Bottom # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +A947..A949 ; Bottom # Mn [3] REJANG VOWEL SIGN I..REJANG VOWEL SIGN E +A94B..A94E ; Bottom # Mn [4] REJANG VOWEL SIGN O..REJANG VOWEL SIGN EA +A9B8..A9B9 ; Bottom # Mn [2] JAVANESE VOWEL SIGN SUKU..JAVANESE VOWEL SIGN SUKU MENDUT +AA2D ; Bottom # Mn CHAM VOWEL SIGN U +AA32 ; Bottom # Mn CHAM VOWEL SIGN UE +AA35..AA36 ; Bottom # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +AAB4 ; Bottom # Mn TAI VIET VOWEL U +AAEC ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UU +ABE8 ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK +10A02..10A03 ; Bottom # Mn [2] KHAROSHTHI VOWEL SIGN U..KHAROSHTHI VOWEL SIGN VOCALIC R +10A0C..10A0E ; Bottom # Mn [3] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN ANUSVARA +10A39..10A3A ; Bottom # Mn [2] KHAROSHTHI SIGN CAUDA..KHAROSHTHI SIGN DOT BELOW +1103C..11041 ; Bottom # Mn [6] BRAHMI 
VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL +110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU +110B9..110BA ; Bottom # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +1112A..1112B ; Bottom # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU +11131..11132 ; Bottom # Mn [2] CHAKMA O MARK..CHAKMA AU MARK +11173 ; Bottom # Mn MAHAJANI SIGN NUKTA +111B6..111BB ; Bottom # Mn [6] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN VOCALIC LL +111C9 ; Bottom # Mn SHARADA SANDHI MARK +111CC ; Bottom # Mn SHARADA EXTRA SHORT VOWEL MARK +1122F ; Bottom # Mn KHOJKI VOWEL SIGN U +112E3..112E4 ; Bottom # Mn [2] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN UU +112E9..112EA ; Bottom # Mn [2] KHUDAWADI SIGN NUKTA..KHUDAWADI SIGN VIRAMA +1133B..1133C ; Bottom # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +11438..1143D ; Bottom # Mn [6] NEWA VOWEL SIGN U..NEWA VOWEL SIGN VOCALIC LL +11442 ; Bottom # Mn NEWA SIGN VIRAMA +11446 ; Bottom # Mn NEWA SIGN NUKTA +114B3..114B8 ; Bottom # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114C2..114C3 ; Bottom # Mn [2] TIRHUTA SIGN VIRAMA..TIRHUTA SIGN NUKTA +115B2..115B5 ; Bottom # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115BF..115C0 ; Bottom # Mn [2] SIDDHAM SIGN VIRAMA..SIDDHAM SIGN NUKTA +115DC..115DD ; Bottom # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11633..11638 ; Bottom # Mn [6] MODI VOWEL SIGN U..MODI VOWEL SIGN VOCALIC LL +1163F ; Bottom # Mn MODI SIGN VIRAMA +116B0..116B1 ; Bottom # Mn [2] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN UU +116B7 ; Bottom # Mn TAKRI SIGN NUKTA +1171D ; Bottom # Mn AHOM CONSONANT SIGN MEDIAL LA +11724..11725 ; Bottom # Mn [2] AHOM VOWEL SIGN U..AHOM VOWEL SIGN UU +11728 ; Bottom # Mn AHOM VOWEL SIGN O +1182F..11832 ; Bottom # Mn [4] DOGRA VOWEL SIGN U..DOGRA VOWEL SIGN VOCALIC RR +11839..1183A ; Bottom # Mn [2] DOGRA SIGN VIRAMA..DOGRA SIGN NUKTA +11A02..11A03 ; Bottom # Mn [2] ZANABAZAR SQUARE VOWEL SIGN UE..ZANABAZAR SQUARE VOWEL SIGN 
U +11A0A ; Bottom # Mn ZANABAZAR SQUARE VOWEL LENGTH MARK +11A33..11A34 ; Bottom # Mn [2] ZANABAZAR SQUARE FINAL CONSONANT MARK..ZANABAZAR SQUARE SIGN VIRAMA +11A3B..11A3E ; Bottom # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11A52..11A53 ; Bottom # Mn [2] SOYOMBO VOWEL SIGN UE..SOYOMBO VOWEL SIGN U +11A59..11A5B ; Bottom # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11A8A..11A95 ; Bottom # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A +11C32..11C36 ; Bottom # Mn [5] BHAIKSUKI VOWEL SIGN U..BHAIKSUKI VOWEL SIGN VOCALIC L +11C3F ; Bottom # Mn BHAIKSUKI SIGN VIRAMA +11C92..11CA7 ; Bottom # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CAA..11CB0 ; Bottom # Mn [7] MARCHEN SUBJOINED LETTER RA..MARCHEN VOWEL SIGN AA +11CB2 ; Bottom # Mn MARCHEN VOWEL SIGN U +11D36 ; Bottom # Mn MASARAM GONDI VOWEL SIGN VOCALIC R +11D42 ; Bottom # Mn MASARAM GONDI SIGN NUKTA +11D44 ; Bottom # Mn MASARAM GONDI SIGN HALANTA +11D47 ; Bottom # Mn MASARAM GONDI RA-KARA +11EF4 ; Bottom # Mn MAKASAR VOWEL SIGN U + +# Indic_Positional_Category=Top_And_Bottom + +0C48 ; Top_And_Bottom # Mn TELUGU VOWEL SIGN AI +0F73 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN II +0F76..0F79 ; Top_And_Bottom # Mn [4] TIBETAN VOWEL SIGN VOCALIC R..TIBETAN VOWEL SIGN VOCALIC LL +0F81 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN REVERSED II +1B3C ; Top_And_Bottom # Mn BALINESE VOWEL SIGN LA LENGA +1112E..1112F ; Top_And_Bottom # Mn [2] CHAKMA VOWEL SIGN O..CHAKMA VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Right + +0AC9 ; Top_And_Right # Mc GUJARATI VOWEL SIGN CANDRA O +0B57 ; Top_And_Right # Mc ORIYA AU LENGTH MARK +0CC0 ; Top_And_Right # Mc KANNADA VOWEL SIGN II +0CC7..0CC8 ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +1925..1926 ; Top_And_Right # Mc [2] LIMBU VOWEL SIGN OO..LIMBU VOWEL SIGN AU 
+1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG +111BF ; Top_And_Right # Mc SHARADA VOWEL SIGN AU +11232..11233 ; Top_And_Right # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Left + +0B48 ; Top_And_Left # Mc ORIYA VOWEL SIGN AI +0DDA ; Top_And_Left # Mc SINHALA VOWEL SIGN DIGA KOMBUVA +17BE ; Top_And_Left # Mc KHMER VOWEL SIGN OE +1C29 ; Top_And_Left # Mc LEPCHA VOWEL SIGN OO +114BB ; Top_And_Left # Mc TIRHUTA VOWEL SIGN AI +115B9 ; Top_And_Left # Mc SIDDHAM VOWEL SIGN AI + +# Indic_Positional_Category=Top_And_Left_And_Right + +0B4C ; Top_And_Left_And_Right # Mc ORIYA VOWEL SIGN AU +0DDD ; Top_And_Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA +17BF ; Top_And_Left_And_Right # Mc KHMER VOWEL SIGN YA +115BB ; Top_And_Left_And_Right # Mc SIDDHAM VOWEL SIGN AU + +# Indic_Positional_Category=Bottom_And_Right + +1B3B ; Bottom_And_Right # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +A9C0 ; Bottom_And_Right # Mc JAVANESE PANGKON + +# Indic_Positional_Category=Bottom_And_Left + +A9BF ; Bottom_And_Left # Mc JAVANESE CONSONANT SIGN CAKRA + +# Indic_Positional_Category=Top_And_Bottom_And_Right + +1B3D ; Top_And_Bottom_And_Right # Mc BALINESE VOWEL SIGN LA LENGA TEDUNG + +# Indic_Positional_Category=Overstruck + +1CD4 ; Overstruck # Mn VEDIC SIGN YAJURVEDIC MIDLINE SVARITA +1CE2..1CE8 ; Overstruck # Mn [7] VEDIC SIGN VISARGA SVARITA..VEDIC SIGN VISARGA ANUDATTA WITH TAIL +10A01 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN I +10A06 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN O + +# EOF diff --git a/data/11.0.0-indic-syllabic-category.txt b/data/11.0.0-indic-syllabic-category.txt new file mode 100644 index 0000000..3d25284 --- /dev/null +++ b/data/11.0.0-indic-syllabic-category.txt @@ -0,0 +1,1273 @@ +# IndicSyllabicCategory-11.0.0.txt +# Date: 2018-05-21, 18:33:00 GMT [KW, RP] +# © 2018 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. 
+# For terms of use, see http://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Syllabic_Category enumerated property +# +# Scope: This property is aimed at two general problem +# areas involving the analysis and processing of Indic scripts: +# +# 1. Specification of syllabic structure. +# 2. Specification of segmentation rules. +# +# Both of these problem areas may benefit from having defined subtypes +# of Indic script characters which are relevant to how Indic +# syllables (or aksaras) are constructed. Note that rules for +# syllabic structure in Indic scripts may differ significantly +# from how phonological syllables are defined. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Syllabic_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. +# +# The scripts assessed as Indic in the structural sense used for the +# Indic_Syllabic_Category are the following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dogra, Grantha, Gujarati, Gunjala Gondi, +# Gurmukhi, Hanunoo, Javanese, Kaithi, Kannada, Kayah Li, Kharoshthi, +# Khmer, Khojki, Khudawadi, Lao, Lepcha, Limbu, Mahajani, Makasar, +# Malayalam, Marchen, Masaram Gondi, Meetei Mayek, Modi, Multani, +# Myanmar, Newa, New Tai Lue, Oriya, Phags-pa, Rejang, Saurashtra, +# Sharada, Siddham, Sinhala, Soyombo, Sundanese, Syloti Nagri, +# Tagalog, Tagbanwa, Tai Le, Tai Tham, Tai Viet, Takri, Tamil, +# Telugu, Thai, Tibetan, Tirhuta, and Zanabazar Square. 
+# +# All characters for all other scripts not in that list +# take the default value for this property, unless they +# are individually listed in this data file. +# + +# ================================================ + +# Property: Indic_Syllabic_Category +# +# All code points not explicitly listed for Indic_Syllabic_Category +# have the value Other. +# +# @missing: 0000..10FFFF; Other + +# ================================================ + +# Indic_Syllabic_Category=Bindu + +# Bindu/Anusvara (nasalization or -n) + +# [Not derivable] + +0900..0902 ; Bindu # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +0981 ; Bindu # Mn BENGALI SIGN CANDRABINDU +0982 ; Bindu # Mc BENGALI SIGN ANUSVARA +09FC ; Bindu # Lo BENGALI LETTER VEDIC ANUSVARA +0A01..0A02 ; Bindu # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A70 ; Bindu # Mn GURMUKHI TIPPI +0A81..0A82 ; Bindu # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0B01 ; Bindu # Mn ORIYA SIGN CANDRABINDU +0B02 ; Bindu # Mc ORIYA SIGN ANUSVARA +0B82 ; Bindu # Mn TAMIL SIGN ANUSVARA +0C00 ; Bindu # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C01..0C02 ; Bindu # Mc [2] TELUGU SIGN CANDRABINDU..TELUGU SIGN ANUSVARA +0C04 ; Bindu # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C81 ; Bindu # Mn KANNADA SIGN CANDRABINDU +0C82 ; Bindu # Mc KANNADA SIGN ANUSVARA +0D00..0D01 ; Bindu # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D02 ; Bindu # Mc MALAYALAM SIGN ANUSVARA +0D82 ; Bindu # Mc SINHALA SIGN ANUSVARAYA +0E4D ; Bindu # Mn THAI CHARACTER NIKHAHIT +0ECD ; Bindu # Mn LAO NIGGAHITA +0F7E ; Bindu # Mn TIBETAN SIGN RJES SU NGA RO +0F82..0F83 ; Bindu # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +1036 ; Bindu # Mn MYANMAR SIGN ANUSVARA +17C6 ; Bindu # Mn KHMER SIGN NIKAHIT +1932 ; Bindu # Mn LIMBU SMALL LETTER ANUSVARA +1A74 ; Bindu # Mn TAI THAM SIGN MAI KANG +1B00..1B02 ; Bindu # Mn [3] BALINESE SIGN ULU RICEM..BALINESE SIGN CECEK +1B80 ; Bindu # 
Mn SUNDANESE SIGN PANYECEK +1C34..1C35 ; Bindu # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A80B ; Bindu # Mn SYLOTI NAGRI SIGN ANUSVARA +A873 ; Bindu # Lo PHAGS-PA LETTER CANDRABINDU +A880 ; Bindu # Mc SAURASHTRA SIGN ANUSVARA +A8C5 ; Bindu # Mn SAURASHTRA SIGN CANDRABINDU +A8F2..A8F3 ; Bindu # Lo [2] DEVANAGARI SIGN SPACING CANDRABINDU..DEVANAGARI SIGN CANDRABINDU VIRAMA +A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK +10A0E ; Bindu # Mn KHAROSHTHI SIGN ANUSVARA +11000 ; Bindu # Mc BRAHMI SIGN CANDRABINDU +11001 ; Bindu # Mn BRAHMI SIGN ANUSVARA +11080..11081 ; Bindu # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +11100..11101 ; Bindu # Mn [2] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN ANUSVARA +11180..11181 ; Bindu # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +11234 ; Bindu # Mn KHOJKI SIGN ANUSVARA +112DF ; Bindu # Mn KHUDAWADI SIGN ANUSVARA +11300..11301 ; Bindu # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11302 ; Bindu # Mc GRANTHA SIGN ANUSVARA +1135E..1135F ; Bindu # Lo [2] GRANTHA LETTER VEDIC ANUSVARA..GRANTHA LETTER VEDIC DOUBLE ANUSVARA +11443..11444 ; Bindu # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +114BF..114C0 ; Bindu # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Bindu # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +1163D ; Bindu # Mn MODI SIGN ANUSVARA +116AB ; Bindu # Mn TAKRI SIGN ANUSVARA +11837 ; Bindu # Mn DOGRA SIGN ANUSVARA +11A35..11A38 ; Bindu # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A96 ; Bindu # Mn SOYOMBO SIGN ANUSVARA +11C3C..11C3D ; Bindu # Mn [2] BHAIKSUKI SIGN CANDRABINDU..BHAIKSUKI SIGN ANUSVARA +11CB5..11CB6 ; Bindu # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D40 ; Bindu # Mn MASARAM GONDI SIGN ANUSVARA +11D95 ; Bindu # Mn GUNJALA GONDI SIGN ANUSVARA + +# ================================================ + +# Indic_Syllabic_Category=Visarga + +# 
Visarga (-h) +# Includes specialized case for Sanskrit: ardhavisarga +# Excludes letters for jihvamuliya and upadhmaniya, which are +# related, but structured somewhat differently. + +# [Not derivable] + +0903 ; Visarga # Mc DEVANAGARI SIGN VISARGA +0983 ; Visarga # Mc BENGALI SIGN VISARGA +0A03 ; Visarga # Mc GURMUKHI SIGN VISARGA +0A83 ; Visarga # Mc GUJARATI SIGN VISARGA +0B03 ; Visarga # Mc ORIYA SIGN VISARGA +0C03 ; Visarga # Mc TELUGU SIGN VISARGA +0C83 ; Visarga # Mc KANNADA SIGN VISARGA +0D03 ; Visarga # Mc MALAYALAM SIGN VISARGA +0D83 ; Visarga # Mc SINHALA SIGN VISARGAYA +0F7F ; Visarga # Mc TIBETAN SIGN RNAM BCAD +1038 ; Visarga # Mc MYANMAR SIGN VISARGA +17C7 ; Visarga # Mc KHMER SIGN REAHMUK +1B04 ; Visarga # Mc BALINESE SIGN BISAH +1B82 ; Visarga # Mc SUNDANESE SIGN PANGWISAD +1CF2..1CF3 ; Visarga # Mc [2] VEDIC SIGN ARDHAVISARGA..VEDIC SIGN ROTATED ARDHAVISARGA +A881 ; Visarga # Mc SAURASHTRA SIGN VISARGA +A983 ; Visarga # Mc JAVANESE SIGN WIGNYAN +AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA +10A0F ; Visarga # Mn KHAROSHTHI SIGN VISARGA +11002 ; Visarga # Mc BRAHMI SIGN VISARGA +11082 ; Visarga # Mc KAITHI SIGN VISARGA +11102 ; Visarga # Mn CHAKMA SIGN VISARGA +11182 ; Visarga # Mc SHARADA SIGN VISARGA +11303 ; Visarga # Mc GRANTHA SIGN VISARGA +11445 ; Visarga # Mc NEWA SIGN VISARGA +114C1 ; Visarga # Mc TIRHUTA SIGN VISARGA +115BE ; Visarga # Mc SIDDHAM SIGN VISARGA +1163E ; Visarga # Mc MODI SIGN VISARGA +116AC ; Visarga # Mc TAKRI SIGN VISARGA +11838 ; Visarga # Mc DOGRA SIGN VISARGA +11A39 ; Visarga # Mc ZANABAZAR SQUARE SIGN VISARGA +11A97 ; Visarga # Mc SOYOMBO SIGN VISARGA +11C3E ; Visarga # Mc BHAIKSUKI SIGN VISARGA +11D41 ; Visarga # Mn MASARAM GONDI SIGN VISARGA +11D96 ; Visarga # Mc GUNJALA GONDI SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Avagraha + +# Avagraha (elision of initial a- in sandhi) + +# [Not derivable] + +093D ; Avagraha # Lo DEVANAGARI SIGN AVAGRAHA +09BD ; 
Avagraha # Lo BENGALI SIGN AVAGRAHA +0ABD ; Avagraha # Lo GUJARATI SIGN AVAGRAHA +0B3D ; Avagraha # Lo ORIYA SIGN AVAGRAHA +0C3D ; Avagraha # Lo TELUGU SIGN AVAGRAHA +0CBD ; Avagraha # Lo KANNADA SIGN AVAGRAHA +0D3D ; Avagraha # Lo MALAYALAM SIGN AVAGRAHA +0F85 ; Avagraha # Po TIBETAN MARK PALUTA +17DC ; Avagraha # Lo KHMER SIGN AVAKRAHASANYA +1BBA ; Avagraha # Lo SUNDANESE AVAGRAHA +111C1 ; Avagraha # Lo SHARADA SIGN AVAGRAHA +1133D ; Avagraha # Lo GRANTHA SIGN AVAGRAHA +11447 ; Avagraha # Lo NEWA SIGN AVAGRAHA +114C4 ; Avagraha # Lo TIRHUTA SIGN AVAGRAHA +11A9D ; Avagraha # Lo SOYOMBO MARK PLUTA +11C40 ; Avagraha # Lo BHAIKSUKI SIGN AVAGRAHA + +# ================================================ + +# Indic_Syllabic_Category=Nukta + +# Nukta (diacritic for borrowed consonants or other consonant +# modifications). Note that while the resulting sound is typically a +# consonant, the base letter a nukta follows may be an independent +# vowel. For example, is used to transcribe ARABIC LETTER +# AIN. 
+ +# [Not derivable] + +093C ; Nukta # Mn DEVANAGARI SIGN NUKTA +09BC ; Nukta # Mn BENGALI SIGN NUKTA +0A3C ; Nukta # Mn GURMUKHI SIGN NUKTA +0ABC ; Nukta # Mn GUJARATI SIGN NUKTA +0AFD..0AFF ; Nukta # Mn [3] GUJARATI SIGN THREE-DOT NUKTA ABOVE..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0CBC ; Nukta # Mn KANNADA SIGN NUKTA +0F39 ; Nukta # Mn TIBETAN MARK TSA -PHRU +1B34 ; Nukta # Mn BALINESE SIGN REREKAN +1BE6 ; Nukta # Mn BATAK SIGN TOMPI +1C37 ; Nukta # Mn LEPCHA SIGN NUKTA +A9B3 ; Nukta # Mn JAVANESE SIGN CECAK TELU +10A38..10A3A ; Nukta # Mn [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW +110BA ; Nukta # Mn KAITHI SIGN NUKTA +11173 ; Nukta # Mn MAHAJANI SIGN NUKTA +111CA ; Nukta # Mn SHARADA SIGN NUKTA +11236 ; Nukta # Mn KHOJKI SIGN NUKTA +112E9 ; Nukta # Mn KHUDAWADI SIGN NUKTA +1133B..1133C ; Nukta # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +11446 ; Nukta # Mn NEWA SIGN NUKTA +114C3 ; Nukta # Mn TIRHUTA SIGN NUKTA +115C0 ; Nukta # Mn SIDDHAM SIGN NUKTA +116B7 ; Nukta # Mn TAKRI SIGN NUKTA +1183A ; Nukta # Mn DOGRA SIGN NUKTA +11D42 ; Nukta # Mn MASARAM GONDI SIGN NUKTA + +# ================================================ + +# Indic_Syllabic_Category=Virama + +# Virama (killing of inherent vowel in consonant sequence +# or consonant stacker) +# Only includes characters that can act both as visible killer viramas +# and consonant stackers. Separate property values exist for characters +# that can only act as pure killers or only as consonant stackers. 
+ +# [Derivation: (ccc=9) - (InSC=Pure_Killer) - (InSC=Invisible_Stacker) +# - (InSC=Number_Joiner) - 2D7F] + +094D ; Virama # Mn DEVANAGARI SIGN VIRAMA +09CD ; Virama # Mn BENGALI SIGN VIRAMA +0A4D ; Virama # Mn GURMUKHI SIGN VIRAMA +0ACD ; Virama # Mn GUJARATI SIGN VIRAMA +0B4D ; Virama # Mn ORIYA SIGN VIRAMA +0BCD ; Virama # Mn TAMIL SIGN VIRAMA +0C4D ; Virama # Mn TELUGU SIGN VIRAMA +0CCD ; Virama # Mn KANNADA SIGN VIRAMA +0D4D ; Virama # Mn MALAYALAM SIGN VIRAMA +0DCA ; Virama # Mn SINHALA SIGN AL-LAKUNA +1B44 ; Virama # Mc BALINESE ADEG ADEG +A8C4 ; Virama # Mn SAURASHTRA SIGN VIRAMA +A9C0 ; Virama # Mc JAVANESE PANGKON +11046 ; Virama # Mn BRAHMI VIRAMA +110B9 ; Virama # Mn KAITHI SIGN VIRAMA +111C0 ; Virama # Mc SHARADA SIGN VIRAMA +11235 ; Virama # Mc KHOJKI SIGN VIRAMA +1134D ; Virama # Mc GRANTHA SIGN VIRAMA +11442 ; Virama # Mn NEWA SIGN VIRAMA +114C2 ; Virama # Mn TIRHUTA SIGN VIRAMA +115BF ; Virama # Mn SIDDHAM SIGN VIRAMA +1163F ; Virama # Mn MODI SIGN VIRAMA +116B6 ; Virama # Mc TAKRI SIGN VIRAMA +11839 ; Virama # Mn DOGRA SIGN VIRAMA +11C3F ; Virama # Mn BHAIKSUKI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Pure_Killer + +# Pure killer (killing of inherent vowel in consonant sequence, +# with no consonant stacking behavior) + +# [Not derivable] + +0D3B..0D3C ; Pure_Killer # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0E3A ; Pure_Killer # Mn THAI CHARACTER PHINTHU +0E4E ; Pure_Killer # Mn THAI CHARACTER YAMAKKAN +0F84 ; Pure_Killer # Mn TIBETAN MARK HALANTA +103A ; Pure_Killer # Mn MYANMAR SIGN ASAT +1714 ; Pure_Killer # Mn TAGALOG SIGN VIRAMA +1734 ; Pure_Killer # Mn HANUNOO SIGN PAMUDPOD +17D1 ; Pure_Killer # Mn KHMER SIGN VIRIAM +1A7A ; Pure_Killer # Mn TAI THAM SIGN RA HAAM +1BAA ; Pure_Killer # Mc SUNDANESE SIGN PAMAAEH +1BF2..1BF3 ; Pure_Killer # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +A806 ; Pure_Killer # Mn SYLOTI NAGRI SIGN HASANTA +A953 ; Pure_Killer # Mc 
REJANG VIRAMA +ABED ; Pure_Killer # Mn MEETEI MAYEK APUN IYEK +11134 ; Pure_Killer # Mn CHAKMA MAAYYAA +112EA ; Pure_Killer # Mn KHUDAWADI SIGN VIRAMA +1172B ; Pure_Killer # Mn AHOM SIGN KILLER +11A34 ; Pure_Killer # Mn ZANABAZAR SQUARE SIGN VIRAMA +11D44 ; Pure_Killer # Mn MASARAM GONDI SIGN HALANTA + +# ================================================ + +# Indic_Syllabic_Category=Invisible_Stacker + +# Invisible stacker (invisible consonant stacker virama). +# +# Note that in some scripts, such as Kharoshthi and Masaram Gondi, an invisible +# stacker may have a second function, changing the shape and/or location of the +# consonant preceding it, even when there is no consonant following the +# invisible stacker. + +# [Not derivable] + +1039 ; Invisible_Stacker # Mn MYANMAR SIGN VIRAMA +17D2 ; Invisible_Stacker # Mn KHMER SIGN COENG +1A60 ; Invisible_Stacker # Mn TAI THAM SIGN SAKOT +1BAB ; Invisible_Stacker # Mn SUNDANESE SIGN VIRAMA +AAF6 ; Invisible_Stacker # Mn MEETEI MAYEK VIRAMA +10A3F ; Invisible_Stacker # Mn KHAROSHTHI VIRAMA +11133 ; Invisible_Stacker # Mn CHAKMA VIRAMA +11A47 ; Invisible_Stacker # Mn ZANABAZAR SQUARE SUBJOINER +11A99 ; Invisible_Stacker # Mn SOYOMBO SUBJOINER +11D45 ; Invisible_Stacker # Mn MASARAM GONDI VIRAMA +11D97 ; Invisible_Stacker # Mn GUNJALA GONDI VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Independent + +# Independent Vowels (contrasted with matras) + +# [Not derivable] + +0904..0914 ; Vowel_Independent # Lo [17] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER AU +0960..0961 ; Vowel_Independent # Lo [2] DEVANAGARI LETTER VOCALIC RR..DEVANAGARI LETTER VOCALIC LL +0972..0977 ; Vowel_Independent # Lo [6] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER UUE +0985..098C ; Vowel_Independent # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L +098F..0990 ; Vowel_Independent # Lo [2] BENGALI LETTER E..BENGALI LETTER AI +0993..0994 ; Vowel_Independent # Lo [2] BENGALI LETTER O..BENGALI 
LETTER AU +09E0..09E1 ; Vowel_Independent # Lo [2] BENGALI LETTER VOCALIC RR..BENGALI LETTER VOCALIC LL +0A05..0A0A ; Vowel_Independent # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU +0A0F..0A10 ; Vowel_Independent # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI +0A13..0A14 ; Vowel_Independent # Lo [2] GURMUKHI LETTER OO..GURMUKHI LETTER AU +0A85..0A8D ; Vowel_Independent # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E +0A8F..0A91 ; Vowel_Independent # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O +0A93..0A94 ; Vowel_Independent # Lo [2] GUJARATI LETTER O..GUJARATI LETTER AU +0AE0..0AE1 ; Vowel_Independent # Lo [2] GUJARATI LETTER VOCALIC RR..GUJARATI LETTER VOCALIC LL +0B05..0B0C ; Vowel_Independent # Lo [8] ORIYA LETTER A..ORIYA LETTER VOCALIC L +0B0F..0B10 ; Vowel_Independent # Lo [2] ORIYA LETTER E..ORIYA LETTER AI +0B13..0B14 ; Vowel_Independent # Lo [2] ORIYA LETTER O..ORIYA LETTER AU +0B60..0B61 ; Vowel_Independent # Lo [2] ORIYA LETTER VOCALIC RR..ORIYA LETTER VOCALIC LL +0B85..0B8A ; Vowel_Independent # Lo [6] TAMIL LETTER A..TAMIL LETTER UU +0B8E..0B90 ; Vowel_Independent # Lo [3] TAMIL LETTER E..TAMIL LETTER AI +0B92..0B94 ; Vowel_Independent # Lo [3] TAMIL LETTER O..TAMIL LETTER AU +0C05..0C0C ; Vowel_Independent # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L +0C0E..0C10 ; Vowel_Independent # Lo [3] TELUGU LETTER E..TELUGU LETTER AI +0C12..0C14 ; Vowel_Independent # Lo [3] TELUGU LETTER O..TELUGU LETTER AU +0C60..0C61 ; Vowel_Independent # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL +0C85..0C8C ; Vowel_Independent # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L +0C8E..0C90 ; Vowel_Independent # Lo [3] KANNADA LETTER E..KANNADA LETTER AI +0C92..0C94 ; Vowel_Independent # Lo [3] KANNADA LETTER O..KANNADA LETTER AU +0CE0..0CE1 ; Vowel_Independent # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL +0D05..0D0C ; Vowel_Independent # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L +0D0E..0D10 ; Vowel_Independent # 
Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI +0D12..0D14 ; Vowel_Independent # Lo [3] MALAYALAM LETTER O..MALAYALAM LETTER AU +0D5F..0D61 ; Vowel_Independent # Lo [3] MALAYALAM LETTER ARCHAIC II..MALAYALAM LETTER VOCALIC LL +0D85..0D96 ; Vowel_Independent # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA +1021..102A ; Vowel_Independent # Lo [10] MYANMAR LETTER A..MYANMAR LETTER AU +1052..1055 ; Vowel_Independent # Lo [4] MYANMAR LETTER VOCALIC R..MYANMAR LETTER VOCALIC LL +1700..1702 ; Vowel_Independent # Lo [3] TAGALOG LETTER A..TAGALOG LETTER U +1720..1722 ; Vowel_Independent # Lo [3] HANUNOO LETTER A..HANUNOO LETTER U +1740..1742 ; Vowel_Independent # Lo [3] BUHID LETTER A..BUHID LETTER U +1760..1762 ; Vowel_Independent # Lo [3] TAGBANWA LETTER A..TAGBANWA LETTER U +17A3..17B3 ; Vowel_Independent # Lo [17] KHMER INDEPENDENT VOWEL QAQ..KHMER INDEPENDENT VOWEL QAU +1A4D..1A52 ; Vowel_Independent # Lo [6] TAI THAM LETTER I..TAI THAM LETTER OO +1B05..1B12 ; Vowel_Independent # Lo [14] BALINESE LETTER AKARA..BALINESE LETTER OKARA TEDUNG +1B83..1B89 ; Vowel_Independent # Lo [7] SUNDANESE LETTER A..SUNDANESE LETTER EU +1BE4..1BE5 ; Vowel_Independent # Lo [2] BATAK LETTER I..BATAK LETTER U +A800..A801 ; Vowel_Independent # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I +A803..A805 ; Vowel_Independent # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O +A882..A891 ; Vowel_Independent # Lo [16] SAURASHTRA LETTER A..SAURASHTRA LETTER AU +A8FE ; Vowel_Independent # Lo DEVANAGARI LETTER AY +A984..A988 ; Vowel_Independent # Lo [5] JAVANESE LETTER A..JAVANESE LETTER U +A98C..A98E ; Vowel_Independent # Lo [3] JAVANESE LETTER E..JAVANESE LETTER O +AA00..AA05 ; Vowel_Independent # Lo [6] CHAM LETTER A..CHAM LETTER O +AAE0..AAE1 ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER E..MEETEI MAYEK LETTER O +ABCE..ABCF ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER UN..MEETEI MAYEK LETTER I +ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA +11005..11012 ; 
Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU +11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER A..KAITHI LETTER AU +11103..11106 ; Vowel_Independent # Lo [4] CHAKMA LETTER AA..CHAKMA LETTER E +11183..11190 ; Vowel_Independent # Lo [14] SHARADA LETTER A..SHARADA LETTER AU +11200..11207 ; Vowel_Independent # Lo [8] KHOJKI LETTER A..KHOJKI LETTER AU +11280..11283 ; Vowel_Independent # Lo [4] MULTANI LETTER A..MULTANI LETTER E +112B0..112B9 ; Vowel_Independent # Lo [10] KHUDAWADI LETTER A..KHUDAWADI LETTER AU +11305..1130C ; Vowel_Independent # Lo [8] GRANTHA LETTER A..GRANTHA LETTER VOCALIC L +1130F..11310 ; Vowel_Independent # Lo [2] GRANTHA LETTER EE..GRANTHA LETTER AI +11313..11314 ; Vowel_Independent # Lo [2] GRANTHA LETTER OO..GRANTHA LETTER AU +11360..11361 ; Vowel_Independent # Lo [2] GRANTHA LETTER VOCALIC RR..GRANTHA LETTER VOCALIC LL +11400..1140D ; Vowel_Independent # Lo [14] NEWA LETTER A..NEWA LETTER AU +11481..1148E ; Vowel_Independent # Lo [14] TIRHUTA LETTER A..TIRHUTA LETTER AU +11580..1158D ; Vowel_Independent # Lo [14] SIDDHAM LETTER A..SIDDHAM LETTER AU +115D8..115DB ; Vowel_Independent # Lo [4] SIDDHAM LETTER THREE-CIRCLE ALTERNATE I..SIDDHAM LETTER ALTERNATE U +11600..1160D ; Vowel_Independent # Lo [14] MODI LETTER A..MODI LETTER AU +11680..11689 ; Vowel_Independent # Lo [10] TAKRI LETTER A..TAKRI LETTER AU +11800..11809 ; Vowel_Independent # Lo [10] DOGRA LETTER A..DOGRA LETTER AU +11A00 ; Vowel_Independent # Lo ZANABAZAR SQUARE LETTER A +11A50 ; Vowel_Independent # Lo SOYOMBO LETTER A +11C00..11C08 ; Vowel_Independent # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L +11C0A..11C0D ; Vowel_Independent # Lo [4] BHAIKSUKI LETTER E..BHAIKSUKI LETTER AU +11D00..11D06 ; Vowel_Independent # Lo [7] MASARAM GONDI LETTER A..MASARAM GONDI LETTER E +11D08..11D09 ; Vowel_Independent # Lo [2] MASARAM GONDI LETTER AI..MASARAM GONDI LETTER O +11D0B ; Vowel_Independent # Lo MASARAM GONDI LETTER AU +11D60..11D65 ; Vowel_Independent 
# Lo [6] GUNJALA GONDI LETTER A..GUNJALA GONDI LETTER UU +11D67..11D68 ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER EE..GUNJALA GONDI LETTER AI +11D6A..11D6B ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER OO..GUNJALA GONDI LETTER AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Dependent + +# Dependent Vowels (contrasted with independent vowels and/or with +# complex placement). Known as matras in Indic scripts. Also +# includes vowel modifiers that follow dependent (and sometimes +# independent) vowels. + +# [Not derivable] + +093A ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN OE +093B ; Vowel_Dependent # Mc DEVANAGARI VOWEL SIGN OOE +093E..0940 ; Vowel_Dependent # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II +0941..0948 ; Vowel_Dependent # Mn [8] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN AI +0949..094C ; Vowel_Dependent # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094E..094F ; Vowel_Dependent # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA E..DEVANAGARI VOWEL SIGN AW +0955..0957 ; Vowel_Dependent # Mn [3] DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Vowel_Dependent # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BE..09C0 ; Vowel_Dependent # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II +09C1..09C4 ; Vowel_Dependent # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09C7..09C8 ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +09CB..09CC ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +09D7 ; Vowel_Dependent # Mc BENGALI AU LENGTH MARK +09E2..09E3 ; Vowel_Dependent # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3E..0A40 ; Vowel_Dependent # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II +0A41..0A42 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A47..0A48 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN 
EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0ABE..0AC0 ; Vowel_Dependent # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL SIGN II +0AC1..0AC5 ; Vowel_Dependent # Mn [5] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AC9 ; Vowel_Dependent # Mc GUJARATI VOWEL SIGN CANDRA O +0ACB..0ACC ; Vowel_Dependent # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0AE2..0AE3 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3E ; Vowel_Dependent # Mc ORIYA VOWEL SIGN AA +0B3F ; Vowel_Dependent # Mn ORIYA VOWEL SIGN I +0B40 ; Vowel_Dependent # Mc ORIYA VOWEL SIGN II +0B41..0B44 ; Vowel_Dependent # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B47..0B48 ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI +0B4B..0B4C ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU +0B56 ; Vowel_Dependent # Mn ORIYA AI LENGTH MARK +0B57 ; Vowel_Dependent # Mc ORIYA AU LENGTH MARK +0B62..0B63 ; Vowel_Dependent # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BBE..0BBF ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC0 ; Vowel_Dependent # Mn TAMIL VOWEL SIGN II +0BC1..0BC2 ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BC6..0BC8 ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0BCA..0BCC ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0BD7 ; Vowel_Dependent # Mc TAMIL AU LENGTH MARK +0C3E..0C40 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C41..0C44 ; Vowel_Dependent # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C46..0C48 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI +0C4A..0C4C ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C55..0C56 ; Vowel_Dependent # Mn [2] TELUGU 
LENGTH MARK..TELUGU AI LENGTH MARK +0C62..0C63 ; Vowel_Dependent # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBE ; Vowel_Dependent # Mc KANNADA VOWEL SIGN AA +0CBF ; Vowel_Dependent # Mn KANNADA VOWEL SIGN I +0CC0..0CC4 ; Vowel_Dependent # Mc [5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN VOCALIC RR +0CC6 ; Vowel_Dependent # Mn KANNADA VOWEL SIGN E +0CC7..0CC8 ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +0CCC ; Vowel_Dependent # Mn KANNADA VOWEL SIGN AU +0CD5..0CD6 ; Vowel_Dependent # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CE2..0CE3 ; Vowel_Dependent # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D3E..0D40 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D44 ; Vowel_Dependent # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D46..0D48 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0D4A..0D4C ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0D57 ; Vowel_Dependent # Mc MALAYALAM AU LENGTH MARK +0D62..0D63 ; Vowel_Dependent # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DCF..0DD1 ; Vowel_Dependent # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD2..0DD4 ; Vowel_Dependent # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Vowel_Dependent # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0DD8..0DDF ; Vowel_Dependent # Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Vowel_Dependent # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Vowel_Dependent # Lo THAI CHARACTER SARA A +0E31 ; Vowel_Dependent # Mn THAI CHARACTER MAI HAN-AKAT +0E32..0E33 ; Vowel_Dependent # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E34..0E39 ; 
Vowel_Dependent # Mn [6] THAI CHARACTER SARA I..THAI CHARACTER SARA UU +0E40..0E45 ; Vowel_Dependent # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO +0E47 ; Vowel_Dependent # Mn THAI CHARACTER MAITAIKHU +0EB0 ; Vowel_Dependent # Lo LAO VOWEL SIGN A +0EB1 ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KAN +0EB2..0EB3 ; Vowel_Dependent # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0EB4..0EB9 ; Vowel_Dependent # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU +0EBB ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KON +0EC0..0EC4 ; Vowel_Dependent # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +0F71..0F7D ; Vowel_Dependent # Mn [13] TIBETAN VOWEL SIGN AA..TIBETAN VOWEL SIGN OO +0F80..0F81 ; Vowel_Dependent # Mn [2] TIBETAN VOWEL SIGN REVERSED I..TIBETAN VOWEL SIGN REVERSED II +102B..102C ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +102D..1030 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN UU +1031 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN E +1032..1035 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +1056..1057 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1058..1059 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1062 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1071..1074 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1083..1084 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E +1085..1086 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109C ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN AITON A +109D ; Vowel_Dependent # Mn MYANMAR VOWEL SIGN AITON AI +1712..1713 ; Vowel_Dependent # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U +1732..1733 ; Vowel_Dependent # Mn [2] 
HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1752..1753 ; Vowel_Dependent # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U +1772..1773 ; Vowel_Dependent # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U +17B6 ; Vowel_Dependent # Mc KHMER VOWEL SIGN AA +17B7..17BD ; Vowel_Dependent # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL SIGN UA +17BE..17C5 ; Vowel_Dependent # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU +17C8 ; Vowel_Dependent # Mc KHMER SIGN YUUKALEAPINTU +1920..1922 ; Vowel_Dependent # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U +1923..1926 ; Vowel_Dependent # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU +1927..1928 ; Vowel_Dependent # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Vowel_Dependent # Mn LIMBU SIGN KEMPHRENG +19B0..19C0 ; Vowel_Dependent # Lo [17] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN IY +1A17..1A18 ; Vowel_Dependent # Mn [2] BUGINESE VOWEL SIGN I..BUGINESE VOWEL SIGN U +1A19..1A1A ; Vowel_Dependent # Mc [2] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN O +1A1B ; Vowel_Dependent # Mn BUGINESE VOWEL SIGN AE +1A61 ; Vowel_Dependent # Mc TAI THAM VOWEL SIGN A +1A62 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN MAI SAT +1A63..1A64 ; Vowel_Dependent # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A65..1A6C ; Vowel_Dependent # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW +1A6D..1A72 ; Vowel_Dependent # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI +1A73 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN OA ABOVE +1B35 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN TEDUNG +1B36..1B3A ; Vowel_Dependent # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA +1B3B ; Vowel_Dependent # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +1B3C ; Vowel_Dependent # Mn BALINESE VOWEL SIGN LA LENGA +1B3D..1B41 ; Vowel_Dependent # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1B42 ; Vowel_Dependent # Mn BALINESE VOWEL SIGN PEPET +1B43 ; Vowel_Dependent # Mc BALINESE 
VOWEL SIGN PEPET TEDUNG +1BA4..1BA5 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PANGHULU..SUNDANESE VOWEL SIGN PANYUKU +1BA6..1BA7 ; Vowel_Dependent # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL SIGN PANOLONG +1BA8..1BA9 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE7 ; Vowel_Dependent # Mc BATAK VOWEL SIGN E +1BE8..1BE9 ; Vowel_Dependent # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BEA..1BEC ; Vowel_Dependent # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BED ; Vowel_Dependent # Mn BATAK VOWEL SIGN KARO O +1BEE ; Vowel_Dependent # Mc BATAK VOWEL SIGN U +1BEF ; Vowel_Dependent # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +1C26..1C2B ; Vowel_Dependent # Mc [6] LEPCHA VOWEL SIGN AA..LEPCHA VOWEL SIGN UU +1C2C ; Vowel_Dependent # Mn LEPCHA VOWEL SIGN E +A823..A824 ; Vowel_Dependent # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A825..A826 ; Vowel_Dependent # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E +A827 ; Vowel_Dependent # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Vowel_Dependent # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A8FF ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN AY +A947..A94E ; Vowel_Dependent # Mn [8] REJANG VOWEL SIGN I..REJANG VOWEL SIGN EA +A9B4..A9B5 ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9B6..A9B9 ; Vowel_Dependent # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BA..A9BB ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +A9BC ; Vowel_Dependent # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Vowel_Dependent # Mn MYANMAR SIGN SHAN SAW +AA29..AA2E ; Vowel_Dependent # Mn [6] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN OE +AA2F..AA30 ; Vowel_Dependent # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA31..AA32 ; Vowel_Dependent # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE +AAB0 ; Vowel_Dependent # Mn TAI VIET MAI KANG +AAB1 ; 
Vowel_Dependent # Lo TAI VIET VOWEL AA +AAB2..AAB4 ; Vowel_Dependent # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U +AAB5..AAB6 ; Vowel_Dependent # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB7..AAB8 ; Vowel_Dependent # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AAB9..AABD ; Vowel_Dependent # Lo [5] TAI VIET VOWEL UEA..TAI VIET VOWEL AN +AABE ; Vowel_Dependent # Mn TAI VIET VOWEL AM +AAEB ; Vowel_Dependent # Mc MEETEI MAYEK VOWEL SIGN II +AAEC..AAED ; Vowel_Dependent # Mn [2] MEETEI MAYEK VOWEL SIGN UU..MEETEI MAYEK VOWEL SIGN AAI +AAEE..AAEF ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN AU..MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE5 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN ANAP +ABE6..ABE7 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE8 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +10A01..10A03 ; Vowel_Dependent # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R +10A05..10A06 ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O +10A0C..10A0D ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN DOUBLE RING BELOW +11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +110B0..110B2 ; Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II +110B3..110B6 ; Vowel_Dependent # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI +110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11127..1112B ; Vowel_Dependent # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU +1112C ; Vowel_Dependent # Mc CHAKMA VOWEL SIGN E +1112D..11132 ; Vowel_Dependent # Mn [6] CHAKMA VOWEL SIGN AI..CHAKMA AU MARK +11145..11146 ; Vowel_Dependent # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +111B3..111B5 ; 
Vowel_Dependent # Mc [3] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN II +111B6..111BE ; Vowel_Dependent # Mn [9] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN O +111BF ; Vowel_Dependent # Mc SHARADA VOWEL SIGN AU +111CB..111CC ; Vowel_Dependent # Mn [2] SHARADA VOWEL MODIFIER MARK..SHARADA EXTRA SHORT VOWEL MARK +1122C..1122E ; Vowel_Dependent # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +1122F..11231 ; Vowel_Dependent # Mn [3] KHOJKI VOWEL SIGN U..KHOJKI VOWEL SIGN AI +11232..11233 ; Vowel_Dependent # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU +112E0..112E2 ; Vowel_Dependent # Mc [3] KHUDAWADI VOWEL SIGN AA..KHUDAWADI VOWEL SIGN II +112E3..112E8 ; Vowel_Dependent # Mn [6] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN AU +1133E..1133F ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11340 ; Vowel_Dependent # Mn GRANTHA VOWEL SIGN II +11341..11344 ; Vowel_Dependent # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +11347..11348 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +1134B..1134C ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +11357 ; Vowel_Dependent # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435..11437 ; Vowel_Dependent # Mc [3] NEWA VOWEL SIGN AA..NEWA VOWEL SIGN II +11438..1143F ; Vowel_Dependent # Mn [8] NEWA VOWEL SIGN U..NEWA VOWEL SIGN AI +11440..11441 ; Vowel_Dependent # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +114B0..114B2 ; Vowel_Dependent # Mc [3] TIRHUTA VOWEL SIGN AA..TIRHUTA VOWEL SIGN II +114B3..114B8 ; Vowel_Dependent # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114B9 ; Vowel_Dependent # Mc TIRHUTA VOWEL SIGN E +114BA ; Vowel_Dependent # Mn TIRHUTA VOWEL SIGN SHORT E +114BB..114BE ; Vowel_Dependent # Mc [4] TIRHUTA VOWEL SIGN AI..TIRHUTA VOWEL SIGN AU +115AF..115B1 ; Vowel_Dependent # Mc [3] SIDDHAM VOWEL SIGN AA..SIDDHAM VOWEL SIGN II 
+115B2..115B5 ; Vowel_Dependent # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115B8..115BB ; Vowel_Dependent # Mc [4] SIDDHAM VOWEL SIGN E..SIDDHAM VOWEL SIGN AU +115DC..115DD ; Vowel_Dependent # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11630..11632 ; Vowel_Dependent # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +11633..1163A ; Vowel_Dependent # Mn [8] MODI VOWEL SIGN U..MODI VOWEL SIGN AI +1163B..1163C ; Vowel_Dependent # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +11640 ; Vowel_Dependent # Mn MODI SIGN ARDHACANDRA +116AD ; Vowel_Dependent # Mn TAKRI VOWEL SIGN AA +116AE..116AF ; Vowel_Dependent # Mc [2] TAKRI VOWEL SIGN I..TAKRI VOWEL SIGN II +116B0..116B5 ; Vowel_Dependent # Mn [6] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN AU +11720..11721 ; Vowel_Dependent # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +11722..11725 ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN I..AHOM VOWEL SIGN UU +11726 ; Vowel_Dependent # Mc AHOM VOWEL SIGN E +11727..1172A ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN AW..AHOM VOWEL SIGN AM +1182C..1182E ; Vowel_Dependent # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II +1182F..11836 ; Vowel_Dependent # Mn [8] DOGRA VOWEL SIGN U..DOGRA VOWEL SIGN AU +11A01..11A0A ; Vowel_Dependent # Mn [10] ZANABAZAR SQUARE VOWEL SIGN I..ZANABAZAR SQUARE VOWEL LENGTH MARK +11A51..11A56 ; Vowel_Dependent # Mn [6] SOYOMBO VOWEL SIGN I..SOYOMBO VOWEL SIGN OE +11A57..11A58 ; Vowel_Dependent # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A59..11A5B ; Vowel_Dependent # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11C2F ; Vowel_Dependent # Mc BHAIKSUKI VOWEL SIGN AA +11C30..11C36 ; Vowel_Dependent # Mn [7] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN VOCALIC L +11C38..11C3B ; Vowel_Dependent # Mn [4] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI VOWEL SIGN AU +11CB0 ; Vowel_Dependent # Mn MARCHEN VOWEL SIGN AA +11CB1 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN I +11CB2..11CB3 ; Vowel_Dependent # Mn [2] 
MARCHEN VOWEL SIGN U..MARCHEN VOWEL SIGN E +11CB4 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN O +11D31..11D36 ; Vowel_Dependent # Mn [6] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN VOCALIC R +11D3A ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Vowel_Dependent # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN AU +11D43 ; Vowel_Dependent # Mn MASARAM GONDI SIGN CANDRA +11D8A..11D8E ; Vowel_Dependent # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D90..11D91 ; Vowel_Dependent # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI +11D93..11D94 ; Vowel_Dependent # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11EF3..11EF4 ; Vowel_Dependent # Mn [2] MAKASAR VOWEL SIGN I..MAKASAR VOWEL SIGN U +11EF5..11EF6 ; Vowel_Dependent # Mc [2] MAKASAR VOWEL SIGN E..MAKASAR VOWEL SIGN O + +# ================================================ + +# Indic_Syllabic_Category=Vowel + +# (Other) Vowels (reanalyzed as ordinary alphabetic letters or marks) + +# [Not derivable] + +1963..196D ; Vowel # Lo [11] TAI LE LETTER A..TAI LE LETTER AI +A85E..A861 ; Vowel # Lo [4] PHAGS-PA LETTER I..PHAGS-PA LETTER O +A866 ; Vowel # Lo PHAGS-PA LETTER EE +A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO +A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O +11150..11154 ; Vowel # Lo [5] MAHAJANI LETTER A..MAHAJANI LETTER O + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Placeholder + +# Consonant Placeholder +# This includes generic placeholders used for +# Indic script layout (NBSP and dotted circle), as well as a few script- +# specific vowel-holder characters which are not technically +# consonants, but serve instead as bases for placement of vowel marks. 
+ +# [Not derivable] + +002D ; Consonant_Placeholder # Pd HYPHEN-MINUS +00A0 ; Consonant_Placeholder # Zs NO-BREAK SPACE +00D7 ; Consonant_Placeholder # Sm MULTIPLICATION SIGN +0980 ; Consonant_Placeholder # Lo BENGALI ANJI +0A72..0A73 ; Consonant_Placeholder # Lo [2] GURMUKHI IRI..GURMUKHI URA +104B ; Consonant_Placeholder # Po MYANMAR SIGN SECTION +104E ; Consonant_Placeholder # Po MYANMAR SYMBOL AFOREMENTIONED +1900 ; Consonant_Placeholder # Lo LIMBU VOWEL-CARRIER LETTER +2010..2014 ; Consonant_Placeholder # Pd [5] HYPHEN..EM DASH +25CC ; Consonant_Placeholder # So DOTTED CIRCLE +AA74..AA76 ; Consonant_Placeholder # Lo [3] MYANMAR LOGOGRAM KHAMTI OAY..MYANMAR LOGOGRAM KHAMTI HM +11A3F ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL HEAD MARK +11A45 ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL DOUBLE-LINED HEAD MARK +11EF2 ; Consonant_Placeholder # Lo MAKASAR ANGKA + +# ================================================ + +# Indic_Syllabic_Category=Consonant + +# Consonant (ordinary abugida consonants, with inherent vowels) + +# [Not derivable] + +0915..0939 ; Consonant # Lo [37] DEVANAGARI LETTER KA..DEVANAGARI LETTER HA +0958..095F ; Consonant # Lo [8] DEVANAGARI LETTER QA..DEVANAGARI LETTER YYA +0978..097F ; Consonant # Lo [8] DEVANAGARI LETTER MARWARI DDA..DEVANAGARI LETTER BBA +0995..09A8 ; Consonant # Lo [20] BENGALI LETTER KA..BENGALI LETTER NA +09AA..09B0 ; Consonant # Lo [7] BENGALI LETTER PA..BENGALI LETTER RA +09B2 ; Consonant # Lo BENGALI LETTER LA +09B6..09B9 ; Consonant # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA +09DC..09DD ; Consonant # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA +09DF ; Consonant # Lo BENGALI LETTER YYA +09F0..09F1 ; Consonant # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH LOWER DIAGONAL +0A15..0A28 ; Consonant # Lo [20] GURMUKHI LETTER KA..GURMUKHI LETTER NA +0A2A..0A30 ; Consonant # Lo [7] GURMUKHI LETTER PA..GURMUKHI LETTER RA +0A32..0A33 ; Consonant # Lo [2] GURMUKHI LETTER 
LA..GURMUKHI LETTER LLA +0A35..0A36 ; Consonant # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA +0A38..0A39 ; Consonant # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA +0A59..0A5C ; Consonant # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA +0A5E ; Consonant # Lo GURMUKHI LETTER FA +0A95..0AA8 ; Consonant # Lo [20] GUJARATI LETTER KA..GUJARATI LETTER NA +0AAA..0AB0 ; Consonant # Lo [7] GUJARATI LETTER PA..GUJARATI LETTER RA +0AB2..0AB3 ; Consonant # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA +0AB5..0AB9 ; Consonant # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA +0AF9 ; Consonant # Lo GUJARATI LETTER ZHA +0B15..0B28 ; Consonant # Lo [20] ORIYA LETTER KA..ORIYA LETTER NA +0B2A..0B30 ; Consonant # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA +0B32..0B33 ; Consonant # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA +0B35..0B39 ; Consonant # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA +0B5C..0B5D ; Consonant # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA +0B5F ; Consonant # Lo ORIYA LETTER YYA +0B71 ; Consonant # Lo ORIYA LETTER WA +0B95 ; Consonant # Lo TAMIL LETTER KA +0B99..0B9A ; Consonant # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA +0B9C ; Consonant # Lo TAMIL LETTER JA +0B9E..0B9F ; Consonant # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA +0BA3..0BA4 ; Consonant # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA +0BA8..0BAA ; Consonant # Lo [3] TAMIL LETTER NA..TAMIL LETTER PA +0BAE..0BB9 ; Consonant # Lo [12] TAMIL LETTER MA..TAMIL LETTER HA +0C15..0C28 ; Consonant # Lo [20] TELUGU LETTER KA..TELUGU LETTER NA +0C2A..0C39 ; Consonant # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C58..0C5A ; Consonant # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C95..0CA8 ; Consonant # Lo [20] KANNADA LETTER KA..KANNADA LETTER NA +0CAA..0CB3 ; Consonant # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA +0CB5..0CB9 ; Consonant # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA +0CDE ; Consonant # Lo KANNADA LETTER FA +0D15..0D3A ; Consonant # Lo [38] MALAYALAM LETTER KA..MALAYALAM LETTER TTTA +0D9A..0DB1 ; 
Consonant # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA +0DB3..0DBB ; Consonant # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA +0DBD ; Consonant # Lo SINHALA LETTER DANTAJA LAYANNA +0DC0..0DC6 ; Consonant # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA +0E01..0E2E ; Consonant # Lo [46] THAI CHARACTER KO KAI..THAI CHARACTER HO NOKHUK +0E81..0E82 ; Consonant # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG +0E84 ; Consonant # Lo LAO LETTER KHO TAM +0E87..0E88 ; Consonant # Lo [2] LAO LETTER NGO..LAO LETTER CO +0E8A ; Consonant # Lo LAO LETTER SO TAM +0E8D ; Consonant # Lo LAO LETTER NYO +0E94..0E97 ; Consonant # Lo [4] LAO LETTER DO..LAO LETTER THO TAM +0E99..0E9F ; Consonant # Lo [7] LAO LETTER NO..LAO LETTER FO SUNG +0EA1..0EA3 ; Consonant # Lo [3] LAO LETTER MO..LAO LETTER LO LING +0EA5 ; Consonant # Lo LAO LETTER LO LOOT +0EA7 ; Consonant # Lo LAO LETTER WO +0EAA..0EAB ; Consonant # Lo [2] LAO LETTER SO SUNG..LAO LETTER HO SUNG +0EAD..0EAE ; Consonant # Lo [2] LAO LETTER O..LAO LETTER HO TAM +0EDC..0EDF ; Consonant # Lo [4] LAO HO NO..LAO LETTER KHMU NYO +0F40..0F47 ; Consonant # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA +0F49..0F6C ; Consonant # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA +1000..1020 ; Consonant # Lo [33] MYANMAR LETTER KA..MYANMAR LETTER LLA +103F ; Consonant # Lo MYANMAR LETTER GREAT SA +1050..1051 ; Consonant # Lo [2] MYANMAR LETTER SHA..MYANMAR LETTER SSA +105A..105D ; Consonant # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE +1061 ; Consonant # Lo MYANMAR LETTER SGAW KAREN SHA +1065..1066 ; Consonant # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER WESTERN PWO KAREN PWA +106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA +1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA +108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA +1703..170C ; Consonant # Lo [10] TAGALOG LETTER 
KA..TAGALOG LETTER YA +170E..1711 ; Consonant # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1723..1731 ; Consonant # Lo [15] HANUNOO LETTER KA..HANUNOO LETTER HA +1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA +1763..176C ; Consonant # Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA +176E..1770 ; Consonant # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA +1780..17A2 ; Consonant # Lo [35] KHMER LETTER KA..KHMER LETTER QA +1901..191E ; Consonant # Lo [30] LIMBU LETTER KA..LIMBU LETTER TRA +1950..1962 ; Consonant # Lo [19] TAI LE LETTER KA..TAI LE LETTER NA +1980..19AB ; Consonant # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI LUE LETTER LOW SUA +1A00..1A16 ; Consonant # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA +1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA +1A53..1A54 ; Consonant # Lo [2] TAI THAM LETTER LAE..TAI THAM LETTER GREAT SA +1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA +1B45..1B4B ; Consonant # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA +1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA +1BBB..1BBD ; Consonant # Lo [3] SUNDANESE LETTER REU..SUNDANESE LETTER BHA +1BC0..1BE3 ; Consonant # Lo [36] BATAK LETTER A..BATAK LETTER MBA +1C00..1C23 ; Consonant # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A +1C4D..1C4F ; Consonant # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA +A807..A80A ; Consonant # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO +A80C..A822 ; Consonant # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO +A840..A85D ; Consonant # Lo [30] PHAGS-PA LETTER KA..PHAGS-PA LETTER A +A862..A865 ; Consonant # Lo [4] PHAGS-PA LETTER QA..PHAGS-PA LETTER GGA +A869..A870 ; Consonant # Lo [8] PHAGS-PA LETTER TTA..PHAGS-PA LETTER ASPIRATED FA +A872 ; Consonant # Lo PHAGS-PA SUPERFIXED LETTER RA +A892..A8B3 ; Consonant # Lo [34] SAURASHTRA LETTER 
KA..SAURASHTRA LETTER LLA +A90A..A921 ; Consonant # Lo [24] KAYAH LI LETTER KA..KAYAH LI LETTER CA +A930..A946 ; Consonant # Lo [23] REJANG LETTER KA..REJANG LETTER A +A989..A98B ; Consonant # Lo [3] JAVANESE LETTER PA CEREK..JAVANESE LETTER NGA LELET RASWADI +A98F..A9B2 ; Consonant # Lo [36] JAVANESE LETTER KA..JAVANESE LETTER HA +A9E0..A9E4 ; Consonant # Lo [5] MYANMAR LETTER SHAN GHA..MYANMAR LETTER SHAN BHA +A9E7..A9EF ; Consonant # Lo [9] MYANMAR LETTER TAI LAING NYA..MYANMAR LETTER TAI LAING NNA +A9FA..A9FE ; Consonant # Lo [5] MYANMAR LETTER TAI LAING LLA..MYANMAR LETTER TAI LAING BHA +AA06..AA28 ; Consonant # Lo [35] CHAM LETTER KA..CHAM LETTER HA +AA60..AA6F ; Consonant # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA +AA71..AA73 ; Consonant # Lo [3] MYANMAR LETTER KHAMTI XA..MYANMAR LETTER KHAMTI RA +AA7A ; Consonant # Lo MYANMAR LETTER AITON RA +AA7E..AA7F ; Consonant # Lo [2] MYANMAR LETTER SHWE PALAUNG CHA..MYANMAR LETTER SHWE PALAUNG SHA +AA80..AAAF ; Consonant # Lo [48] TAI VIET LETTER LOW KO..TAI VIET LETTER HIGH O +AAE2..AAEA ; Consonant # Lo [9] MEETEI MAYEK LETTER CHA..MEETEI MAYEK LETTER SSA +ABC0..ABCD ; Consonant # Lo [14] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER HUK +ABD0 ; Consonant # Lo MEETEI MAYEK LETTER PHAM +ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTER BHAM +10A00 ; Consonant # Lo KHAROSHTHI LETTER A +10A10..10A13 ; Consonant # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA +10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA +10A19..10A35 ; Consonant # Lo [29] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER VHA +11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER OLD TAMIL NNNA +1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA +11107..11126 ; Consonant # Lo [32] CHAKMA LETTER KAA..CHAKMA LETTER HAA +11144 ; Consonant # Lo CHAKMA LETTER LHAA +11155..11172 ; Consonant # Lo [30] MAHAJANI LETTER KA..MAHAJANI LETTER RRA +11191..111B2 ; 
Consonant # Lo [34] SHARADA LETTER KA..SHARADA LETTER HA +11208..11211 ; Consonant # Lo [10] KHOJKI LETTER KA..KHOJKI LETTER JJA +11213..1122B ; Consonant # Lo [25] KHOJKI LETTER NYA..KHOJKI LETTER LLA +11284..11286 ; Consonant # Lo [3] MULTANI LETTER KA..MULTANI LETTER GA +11288 ; Consonant # Lo MULTANI LETTER GHA +1128A..1128D ; Consonant # Lo [4] MULTANI LETTER CA..MULTANI LETTER JJA +1128F..1129D ; Consonant # Lo [15] MULTANI LETTER NYA..MULTANI LETTER BA +1129F..112A8 ; Consonant # Lo [10] MULTANI LETTER BHA..MULTANI LETTER RHA +112BA..112DE ; Consonant # Lo [37] KHUDAWADI LETTER KA..KHUDAWADI LETTER HA +11315..11328 ; Consonant # Lo [20] GRANTHA LETTER KA..GRANTHA LETTER NA +1132A..11330 ; Consonant # Lo [7] GRANTHA LETTER PA..GRANTHA LETTER RA +11332..11333 ; Consonant # Lo [2] GRANTHA LETTER LA..GRANTHA LETTER LLA +11335..11339 ; Consonant # Lo [5] GRANTHA LETTER VA..GRANTHA LETTER HA +1140E..11434 ; Consonant # Lo [39] NEWA LETTER KA..NEWA LETTER HA +1148F..114AF ; Consonant # Lo [33] TIRHUTA LETTER KA..TIRHUTA LETTER HA +1158E..115AE ; Consonant # Lo [33] SIDDHAM LETTER KA..SIDDHAM LETTER HA +1160E..1162F ; Consonant # Lo [34] MODI LETTER KA..MODI LETTER LLA +1168A..116AA ; Consonant # Lo [33] TAKRI LETTER KA..TAKRI LETTER RRA +11700..1171A ; Consonant # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA +1180A..1182B ; Consonant # Lo [34] DOGRA LETTER KA..DOGRA LETTER RRA +11A0B..11A32 ; Consonant # Lo [40] ZANABAZAR SQUARE LETTER KA..ZANABAZAR SQUARE LETTER KSSA +11A5C..11A83 ; Consonant # Lo [40] SOYOMBO LETTER KA..SOYOMBO LETTER KSSA +11C0E..11C2E ; Consonant # Lo [33] BHAIKSUKI LETTER KA..BHAIKSUKI LETTER HA +11C72..11C8F ; Consonant # Lo [30] MARCHEN LETTER KA..MARCHEN LETTER A +11D0C..11D30 ; Consonant # Lo [37] MASARAM GONDI LETTER KA..MASARAM GONDI LETTER TRA +11D6C..11D89 ; Consonant # Lo [30] GUNJALA GONDI LETTER YA..GUNJALA GONDI LETTER SA +11EE0..11EF1 ; Consonant # Lo [18] MAKASAR LETTER KA..MAKASAR LETTER A + +# 
================================================ + +# Indic_Syllabic_Category=Consonant_Dead + +# Dead Consonant (special consonant with killed vowel) + +# [Not derivable] + +09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0D54..0D56 ; Consonant_Dead # Lo [3] MALAYALAM LETTER CHILLU M..MALAYALAM LETTER CHILLU LLL +0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K + +# ================================================ + +# Indic_Syllabic_Category=Consonant_With_Stacker + +# Consonants that may make stacked ligatures with the next consonant +# without the use of a virama + +# [Not derivable] + +0CF1..0CF2 ; Consonant_With_Stacker # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA +1CF5..1CF6 ; Consonant_With_Stacker # Lo [2] VEDIC SIGN JIHVAMULIYA..VEDIC SIGN UPADHMANIYA +11003..11004 ; Consonant_With_Stacker # Lo [2] BRAHMI SIGN JIHVAMULIYA..BRAHMI SIGN UPADHMANIYA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Prefixed + +# Cluster-initial consonants + +# [Not derivable] + +111C2..111C3 ; Consonant_Prefixed # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA +11A3A ; Consonant_Prefixed # Lo ZANABAZAR SQUARE CLUSTER-INITIAL LETTER RA +11A86..11A89 ; Consonant_Prefixed # Lo [4] SOYOMBO CLUSTER-INITIAL LETTER RA..SOYOMBO CLUSTER-INITIAL LETTER SA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Preceding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when preceding the main +# consonant. + +# [Not derivable] + +0D4E ; Consonant_Preceding_Repha # Lo MALAYALAM LETTER DOT REPH +11D46 ; Consonant_Preceding_Repha # Lo MASARAM GONDI REPHA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Initial_Postfixed + +# Consonants that succeed the main consonant in character sequences, but are +# pronounced before it. 
+ +# [Not derivable] + +1A5A ; Consonant_Initial_Postfixed # Mn TAI THAM CONSONANT SIGN LOW PA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Succeeding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when succeeding the main +# consonant. + +# [Not derivable] + +17CC ; Consonant_Succeeding_Repha # Mn KHMER SIGN ROBAT +1B03 ; Consonant_Succeeding_Repha # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Succeeding_Repha # Mn SUNDANESE SIGN PANGLAYAR +A982 ; Consonant_Succeeding_Repha # Mn JAVANESE SIGN LAYAR + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Subjoined + +# Subjoined Consonant (C2 form subtending a base consonant in Tibetan, etc.) + +# [Not derivable] + +0F8D..0F97 ; Consonant_Subjoined # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Consonant_Subjoined # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +1929..192B ; Consonant_Subjoined # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1A57 ; Consonant_Subjoined # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A5B..1A5E ; Consonant_Subjoined # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1BA1 ; Consonant_Subjoined # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA2..1BA3 ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BAC..1BAD ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C24..1C25 ; Consonant_Subjoined # Mc [2] LEPCHA SUBJOINED LETTER YA..LEPCHA SUBJOINED LETTER RA +A867..A868 ; Consonant_Subjoined # Lo [2] PHAGS-PA SUBJOINED LETTER WA..PHAGS-PA SUBJOINED LETTER YA +A871 ; Consonant_Subjoined # Lo PHAGS-PA SUBJOINED LETTER RA +A9BD ; Consonant_Subjoined # Mc JAVANESE CONSONANT SIGN KERET +11C92..11CA7 ; Consonant_Subjoined # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA 
+11CA9 ; Consonant_Subjoined # Mc MARCHEN SUBJOINED LETTER YA +11CAA..11CAF ; Consonant_Subjoined # Mn [6] MARCHEN SUBJOINED LETTER RA..MARCHEN SUBJOINED LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Medial + +# Medial Consonant (medial liquid, occurring in clusters) + +# [Not derivable] + +0A75 ; Consonant_Medial # Mn GURMUKHI SIGN YAKASH +0EBC ; Consonant_Medial # Mn LAO SEMIVOWEL SIGN LO +0EBD ; Consonant_Medial # Lo LAO SEMIVOWEL SIGN NYO +103B..103C ; Consonant_Medial # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA +103D..103E ; Consonant_Medial # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +105E..1060 ; Consonant_Medial # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Consonant_Medial # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +1A55 ; Consonant_Medial # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A56 ; Consonant_Medial # Mn TAI THAM CONSONANT SIGN MEDIAL LA +A8B4 ; Consonant_Medial # Mc SAURASHTRA CONSONANT SIGN HAARU +A9BE..A9BF ; Consonant_Medial # Mc [2] JAVANESE CONSONANT SIGN PENGKAL..JAVANESE CONSONANT SIGN CAKRA +AA33..AA34 ; Consonant_Medial # Mc [2] CHAM CONSONANT SIGN YA..CHAM CONSONANT SIGN RA +AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +1171D..1171F ; Consonant_Medial # Mn [3] AHOM CONSONANT SIGN MEDIAL LA..AHOM CONSONANT SIGN MEDIAL LIGATING RA +11A3B..11A3E ; Consonant_Medial # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11D47 ; Consonant_Medial # Mn MASARAM GONDI RA-KARA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Final + +# Final Consonant (special final forms which do not take vowels) + +# [Not derivable] + +1930..1931 ; Consonant_Final # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Consonant_Final # Mc [6] LIMBU SMALL LETTER TA..LIMBU 
SMALL LETTER LA +1939 ; Consonant_Final # Mn LIMBU SIGN MUKPHRENG +19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B +1A58..1A59 ; Consonant_Final # Mn [2] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN FINAL NGA +1BBE..1BBF ; Consonant_Final # Lo [2] SUNDANESE LETTER FINAL K..SUNDANESE LETTER FINAL M +1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H +1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +A94F..A951 ; Consonant_Final # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A952 ; Consonant_Final # Mc REJANG CONSONANT SIGN H +AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG +AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG +AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS +AA4C ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL M +AA4D ; Consonant_Final # Mc CHAM CONSONANT SIGN FINAL H +ABDB..ABE2 ; Consonant_Final # Lo [8] MEETEI MAYEK LETTER KOK LONSUM..MEETEI MAYEK LETTER I LONSUM +11A8A..11A95 ; Consonant_Final # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Head_Letter + +# Head Letter (Tibetan) + +# [Not derivable] + +0F88..0F8C ; Consonant_Head_Letter # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN + +# ================================================ + +# Indic_Syllabic_Category=Modifying_Letter + +# Reanalyzed letters not participating in the abugida structure, but +# serving to modify the sound of an adjacent vowel or consonant. +# Note that this is not the same as General_Category=Modifier_Letter. 
+ +# [Not derivable] + +0B83 ; Modifying_Letter # Lo TAMIL SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Tone_Letter + +# Tone Letter (spacing lexical tone mark with status as a letter) + +# [Not derivable] + +1970..1974 ; Tone_Letter # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6 +AAC0 ; Tone_Letter # Lo TAI VIET TONE MAI NUENG +AAC2 ; Tone_Letter # Lo TAI VIET TONE MAI SONG + +# ================================================ + +# Indic_Syllabic_Category=Tone_Mark + +# Tone Mark (nonspacing or spacing lexical tone mark) + +# [Not derivable] + +0E48..0E4B ; Tone_Mark # Mn [4] THAI CHARACTER MAI EK..THAI CHARACTER MAI CHATTAWA +0EC8..0ECB ; Tone_Mark # Mn [4] LAO TONE MAI EK..LAO TONE MAI CATAWA +1037 ; Tone_Mark # Mn MYANMAR SIGN DOT BELOW +1063..1064 ; Tone_Mark # Mc [2] MYANMAR TONE MARK SGAW KAREN HATHI..MYANMAR TONE MARK SGAW KAREN KE PHO +1069..106D ; Tone_Mark # Mc [5] MYANMAR SIGN WESTERN PWO KAREN TONE-1..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1087..108C ; Tone_Mark # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108D ; Tone_Mark # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +108F ; Tone_Mark # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109B ; Tone_Mark # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 +19C8..19C9 ; Tone_Mark # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A75..1A79 ; Tone_Mark # Mn [5] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN TONE-5 +A92B..A92D ; Tone_Mark # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +AA7B ; Tone_Mark # Mc MYANMAR SIGN PAO KAREN TONE +AA7C ; Tone_Mark # Mn MYANMAR SIGN TAI LAING TONE-2 +AA7D ; Tone_Mark # Mc MYANMAR SIGN TAI LAING TONE-5 +AABF ; Tone_Mark # Mn TAI VIET TONE MAI EK +AAC1 ; Tone_Mark # Mn TAI VIET TONE MAI THO +ABEC ; Tone_Mark # Mc MEETEI MAYEK LUM IYEK + +# ================================================ + +# Indic_Syllabic_Category=Gemination_Mark + +# Gemination Mark (doubling of the 
preceding or following consonant) + +# [Not derivable] + +0A71 ; Gemination_Mark # Mn GURMUKHI ADDAK +11237 ; Gemination_Mark # Mn KHOJKI SIGN SHADDA +11A98 ; Gemination_Mark # Mn SOYOMBO GEMINATION MARK + +# ================================================ + +# Indic_Syllabic_Category=Cantillation_Mark + +# Cantillation Mark (recitation marks, such as svara markers for the Samaveda) + +# [Not derivable] + +0951..0952 ; Cantillation_Mark # Mn [2] DEVANAGARI STRESS SIGN UDATTA..DEVANAGARI STRESS SIGN ANUDATTA +0A51 ; Cantillation_Mark # Mn GURMUKHI SIGN UDAAT +0AFA..0AFC ; Cantillation_Mark # Mn [3] GUJARATI SIGN SUKUN..GUJARATI SIGN MADDAH +1CD0..1CD2 ; Cantillation_Mark # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CD4..1CE0 ; Cantillation_Mark # Mn [13] VEDIC SIGN YAJURVEDIC MIDLINE SVARITA..VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CE1 ; Cantillation_Mark # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF4 ; Cantillation_Mark # Mn VEDIC TONE CANDRA ABOVE +1CF7 ; Cantillation_Mark # Mc VEDIC SIGN ATIKRAMA +1CF8..1CF9 ; Cantillation_Mark # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE +A8E0..A8F1 ; Cantillation_Mark # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +1123E ; Cantillation_Mark # Mn KHOJKI SIGN SUKUN +11366..1136C ; Cantillation_Mark # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Cantillation_Mark # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA + +# ================================================ + +# Indic_Syllabic_Category=Register_Shifter + +# Register Shifter (shifts register for consonants, akin to a tone mark) + +# [Not derivable] + +17C9..17CA ; Register_Shifter # Mn [2] KHMER SIGN MUUSIKATOAN..KHMER SIGN TRIISAP + +# ================================================ + +# Indic_Syllabic_Category=Syllable_Modifier + +# Syllable Modifier (miscellaneous combining characters that modify +# something in the orthographic syllable they 
succeed) + +# [Not derivable] + +00B2..00B3 ; Syllable_Modifier # No [2] SUPERSCRIPT TWO..SUPERSCRIPT THREE +09FE ; Syllable_Modifier # Mn BENGALI SANDHI MARK +0F35 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0FC6 ; Syllable_Modifier # Mn TIBETAN SYMBOL PADMA GDAN +17CB ; Syllable_Modifier # Mn KHMER SIGN BANTOC +17CE..17D0 ; Syllable_Modifier # Mn [3] KHMER SIGN KAKABAT..KHMER SIGN SAMYOK SANNYA +17D3 ; Syllable_Modifier # Mn KHMER SIGN BATHAMASAT +17DD ; Syllable_Modifier # Mn KHMER SIGN ATTHACAN +193B ; Syllable_Modifier # Mn LIMBU SIGN SA-I +1A7B..1A7C ; Syllable_Modifier # Mn [2] TAI THAM SIGN MAI SAM..TAI THAM SIGN KHUEN-LUE KARAN +1A7F ; Syllable_Modifier # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1C36 ; Syllable_Modifier # Mn LEPCHA SIGN RAN +1DFB ; Syllable_Modifier # Mn COMBINING DELETION MARK +2074 ; Syllable_Modifier # No SUPERSCRIPT FOUR +2082..2084 ; Syllable_Modifier # No [3] SUBSCRIPT TWO..SUBSCRIPT FOUR +111C9 ; Syllable_Modifier # Mn SHARADA SANDHI MARK +1145E ; Syllable_Modifier # Mn NEWA SANDHI MARK +11A33 ; Syllable_Modifier # Mn ZANABAZAR SQUARE FINAL CONSONANT MARK + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Killer + +# Consonant Killer (signifies that the previous consonant or consonants are +# not pronounced) + +# [Not derivable] + +0E4C ; Consonant_Killer # Mn THAI CHARACTER THANTHAKHAT +17CD ; Consonant_Killer # Mn KHMER SIGN TOANDAKHIAT + +# ================================================ + +# Indic_Syllabic_Category=Non_Joiner + +# Non_Joiner (Zero Width Non-Joiner) + +# [Not derivable] + +200C ; Non_Joiner # Cf ZERO WIDTH NON-JOINER + +# ================================================ + +# Indic_Syllabic_Category=Joiner + +# Joiner (Zero Width Joiner) + +# [Not derivable] + +200D ; Joiner # Cf ZERO WIDTH JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number_Joiner 
+ +# Number_Joiner (forms ligatures between numbers for multiplication) + +# [Not derivable] + +1107F ; Number_Joiner # Mn BRAHMI NUMBER JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number + +# Number (can be used as vowel-holders like consonant placeholders) +# Note: A number may even hold subjoined consonants which may in turn +# have been formed using a virama or a stacker, e.g. the sequence +# where THAI THAM LETTER LOW TA is subjoined to +# TAI THAM THAM DIGIT THREE using an invisible stacker. + +# [Not derivable] + +0030..0039 ; Number # Nd [10] DIGIT ZERO..DIGIT NINE +0966..096F ; Number # Nd [10] DEVANAGARI DIGIT ZERO..DEVANAGARI DIGIT NINE +09E6..09EF ; Number # Nd [10] BENGALI DIGIT ZERO..BENGALI DIGIT NINE +0A66..0A6F ; Number # Nd [10] GURMUKHI DIGIT ZERO..GURMUKHI DIGIT NINE +0AE6..0AEF ; Number # Nd [10] GUJARATI DIGIT ZERO..GUJARATI DIGIT NINE +0B66..0B6F ; Number # Nd [10] ORIYA DIGIT ZERO..ORIYA DIGIT NINE +0BE6..0BEF ; Number # Nd [10] TAMIL DIGIT ZERO..TAMIL DIGIT NINE +0C66..0C6F ; Number # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE +0CE6..0CEF ; Number # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE +0D66..0D6F ; Number # Nd [10] MALAYALAM DIGIT ZERO..MALAYALAM DIGIT NINE +0DE6..0DEF ; Number # Nd [10] SINHALA LITH DIGIT ZERO..SINHALA LITH DIGIT NINE +0E50..0E59 ; Number # Nd [10] THAI DIGIT ZERO..THAI DIGIT NINE +0ED0..0ED9 ; Number # Nd [10] LAO DIGIT ZERO..LAO DIGIT NINE +0F20..0F29 ; Number # Nd [10] TIBETAN DIGIT ZERO..TIBETAN DIGIT NINE +0F2A..0F33 ; Number # No [10] TIBETAN DIGIT HALF ONE..TIBETAN DIGIT HALF ZERO +1040..1049 ; Number # Nd [10] MYANMAR DIGIT ZERO..MYANMAR DIGIT NINE +1090..1099 ; Number # Nd [10] MYANMAR SHAN DIGIT ZERO..MYANMAR SHAN DIGIT NINE +17E0..17E9 ; Number # Nd [10] KHMER DIGIT ZERO..KHMER DIGIT NINE +1946..194F ; Number # Nd [10] LIMBU DIGIT ZERO..LIMBU DIGIT NINE +19D0..19D9 ; Number # Nd [10] NEW TAI LUE DIGIT ZERO..NEW TAI LUE DIGIT NINE +1A80..1A89 ; Number # 
Nd [10] TAI THAM HORA DIGIT ZERO..TAI THAM HORA DIGIT NINE +1A90..1A99 ; Number # Nd [10] TAI THAM THAM DIGIT ZERO..TAI THAM THAM DIGIT NINE +1B50..1B59 ; Number # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE +1BB0..1BB9 ; Number # Nd [10] SUNDANESE DIGIT ZERO..SUNDANESE DIGIT NINE +1C40..1C49 ; Number # Nd [10] LEPCHA DIGIT ZERO..LEPCHA DIGIT NINE +A8D0..A8D9 ; Number # Nd [10] SAURASHTRA DIGIT ZERO..SAURASHTRA DIGIT NINE +A900..A909 ; Number # Nd [10] KAYAH LI DIGIT ZERO..KAYAH LI DIGIT NINE +A9D0..A9D9 ; Number # Nd [10] JAVANESE DIGIT ZERO..JAVANESE DIGIT NINE +A9F0..A9F9 ; Number # Nd [10] MYANMAR TAI LAING DIGIT ZERO..MYANMAR TAI LAING DIGIT NINE +AA50..AA59 ; Number # Nd [10] CHAM DIGIT ZERO..CHAM DIGIT NINE +ABF0..ABF9 ; Number # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE +10A40..10A48 ; Number # No [9] KHAROSHTHI DIGIT ONE..KHAROSHTHI FRACTION ONE HALF +11066..1106F ; Number # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11136..1113F ; Number # Nd [10] CHAKMA DIGIT ZERO..CHAKMA DIGIT NINE +111D0..111D9 ; Number # Nd [10] SHARADA DIGIT ZERO..SHARADA DIGIT NINE +111E1..111F4 ; Number # No [20] SINHALA ARCHAIC DIGIT ONE..SINHALA ARCHAIC NUMBER ONE THOUSAND +112F0..112F9 ; Number # Nd [10] KHUDAWADI DIGIT ZERO..KHUDAWADI DIGIT NINE +11450..11459 ; Number # Nd [10] NEWA DIGIT ZERO..NEWA DIGIT NINE +114D0..114D9 ; Number # Nd [10] TIRHUTA DIGIT ZERO..TIRHUTA DIGIT NINE +11650..11659 ; Number # Nd [10] MODI DIGIT ZERO..MODI DIGIT NINE +116C0..116C9 ; Number # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE +11730..11739 ; Number # Nd [10] AHOM DIGIT ZERO..AHOM DIGIT NINE +1173A..1173B ; Number # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY +11C50..11C59 ; Number # Nd [10] BHAIKSUKI DIGIT ZERO..BHAIKSUKI DIGIT NINE +11C5A..11C6C ; Number # No [19] BHAIKSUKI NUMBER ONE..BHAIKSUKI HUNDREDS UNIT MARK +11D50..11D59 ; Number # Nd [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE +11DA0..11DA9 ; Number # Nd [10] GUNJALA GONDI DIGIT ZERO..GUNJALA GONDI 
DIGIT NINE + +# ================================================ + +# Indic_Syllabic_Category=Brahmi_Joining_Number + +# Brahmi Joining Number (similar to Number in that in can be used as +# vowel-holders like Consonant_Placeholder, but may also be joined by +# a Number_Joiner of the same script, e.g. in Brahmi) + +# [Not derivable] + +11052..11065 ; Brahmi_Joining_Number # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND + +# EOF diff --git a/data/12.0.0-indic-positional-category.txt b/data/12.0.0-indic-positional-category.txt new file mode 100644 index 0000000..d4224a8 --- /dev/null +++ b/data/12.0.0-indic-positional-category.txt @@ -0,0 +1,755 @@ +# IndicPositionalCategory-12.0.0.txt +# Date: 2019-01-31, 02:26:00 GMT [KW, RP] +# © 2019 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Positional_Category enumerated property +# +# Scope: This property is aimed at the problem of +# the specification of syllabic structure for Indic scripts. +# Because dependent vowels (matras), visible viramas, and other +# characters are placed in notional slots around the consonant (or +# consonant cluster) core of an Indic syllable, there may be +# cooccurrence constraints or other interactions. Also, it may be +# desirable, in cases where more than one such character may occur in +# sequence, as for example, in a top slot and a bottom slot, to +# specify preferred orders for spelling. As such, this property +# is designed primarily to supplement the Indic_Syllabic_Category +# property. +# +# Note that this property is *not* intended as +# a prescriptive property regarding display or font design, +# for a number of reasons. 
Good font design requires information +# that is outside the context of a character encoding standard, +# and is best handled in other venues. For Indic dependent +# vowels and similar characters, in particular: +# +# 1. Matra placement may vary somewhat based on typeface design. +# 2. Matra placement, even within a single script, may vary +# somewhat according to historic period or local conventions. +# 3. Matra placement may be changed by explicit orthographic reform +# decisions. +# 4. Matras may ligate in various ways with a consonant (or even +# other elements of a syllable) instead of occurring in a +# discrete location. +# 5. Matra display may be contextually determined. This is +# notable, for example, in the Tamil script, where the shape +# and placement of -u and -uu vowels depends strongly on +# which consonant they adjoin. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Positional_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. +# +# The scripts assessed as containing dependent vowels or similar characters +# in the structural sense used for the Indic_Positional_Category are the +# following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dogra, Grantha, Gujarati, Gunjala Gondi, +# Gurmukhi, Hanunoo, Javanese, Kaithi, Kannada, Kharoshthi, Khmer, +# Khojki, Khudawadi, Lao, Lepcha, Limbu, Makasar, Malayalam, Marchen, +# Masaram Gondi, Meetei Mayek, Modi, Myanmar, Nandinagari, Newa, +# New Tai Lue, Oriya, Rejang, Saurashtra, Sharada, Siddham, Sinhala, +# Soyombo, Sundanese, Syloti Nagri, Tagalog, Tagbanwa, Tai Tham, Tai +# Viet, Takri, Tamil, Telugu, Thai, Tibetan, Tirhuta, and Zanabazar +# Square. 
+# +# All characters for all other scripts not in that list +# take the default value for this property. +# +# See IndicSyllabicCategory.txt for a slightly more extended +# list of Indic scripts, including those which do not have +# positional characters. Currently, those additional +# Indic scripts without positional characters are +# Kayah Li, Mahajani, Multani, Phags-pa, and Tai Le. +# +# Notes: +# +# 1. The following characters are all assigned the positional category Right, +# but may have different positions in some cases: +# * U+0BC1 TAMIL VOWEL SIGN U and U+0BC2 TAMIL VOWEL SIGN UU have +# contextually variable placement in Tamil. +# * U+0D41 MALAYALAM VOWEL SIGN U and U+0D42 MALAYALAM VOWEL SIGN UU form +# complex ligatures with consonants in older Malayalam orthography. +# * U+11341 GRANTHA VOWEL SIGN U and U+11342 GRANTHA VOWEL SIGN UU have +# contextually variable placement in Grantha. +# * U+11440 NEWA VOWEL SIGN O and U+11441 NEWA VOWEL SIGN AU have contextually +# variable placement in Newa. +# +# 2. The following characters are all assigned the positional category Top, +# but may have different positions in some cases: +# * U+1143E NEWA VOWEL SIGN E and U+1143F NEWA VOWEL SIGN AI have contextually +# variable placement in Newa. +# +# 3. The following characters are all assigned the positional category Bottom, +# but may have different positions in some cases: +# * U+102F MYANMAR VOWEL SIGN U and U+1030 MYANMAR VOWEL SIGN UU have +# contextually variable placement in Myanmar. +# * U+1A69 TAI THAM VOWEL SIGN U and U+1A6A TAI THAM VOWEL SIGN UU have +# contextually variable placement in Tai Tham. +# +# 4. The following character is assigned the positional category Left, but +# may have different positions in different styles: +# * U+119D2 NANDINAGARI VOWEL SIGN I has stylistically variable placement +# in Nandinagari. 
+ + +# ================================================ + +# Property: Indic_Positional_Category +# +# All code points not explicitly listed for Indic_Positional_Category +# have the value NA (not applicable). +# +# @missing: 0000..10FFFF; NA + +# ------------------------------------------------ + +# Indic_Positional_Category=Right + +0903 ; Right # Mc DEVANAGARI SIGN VISARGA +093B ; Right # Mc DEVANAGARI VOWEL SIGN OOE +093E ; Right # Mc DEVANAGARI VOWEL SIGN AA +0940 ; Right # Mc DEVANAGARI VOWEL SIGN II +0949..094C ; Right # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094F ; Right # Mc DEVANAGARI VOWEL SIGN AW +0982..0983 ; Right # Mc [2] BENGALI SIGN ANUSVARA..BENGALI SIGN VISARGA +09BE ; Right # Mc BENGALI VOWEL SIGN AA +09C0 ; Right # Mc BENGALI VOWEL SIGN II +09D7 ; Right # Mc BENGALI AU LENGTH MARK +0A03 ; Right # Mc GURMUKHI SIGN VISARGA +0A3E ; Right # Mc GURMUKHI VOWEL SIGN AA +0A40 ; Right # Mc GURMUKHI VOWEL SIGN II +0A83 ; Right # Mc GUJARATI SIGN VISARGA +0ABE ; Right # Mc GUJARATI VOWEL SIGN AA +0AC0 ; Right # Mc GUJARATI VOWEL SIGN II +0ACB..0ACC ; Right # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0B02..0B03 ; Right # Mc [2] ORIYA SIGN ANUSVARA..ORIYA SIGN VISARGA +0B3E ; Right # Mc ORIYA VOWEL SIGN AA +0B40 ; Right # Mc ORIYA VOWEL SIGN II +0BBE..0BBF ; Right # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC1..0BC2 ; Right # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BD7 ; Right # Mc TAMIL AU LENGTH MARK +0C01..0C03 ; Right # Mc [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN VISARGA +0C41..0C44 ; Right # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C82..0C83 ; Right # Mc [2] KANNADA SIGN ANUSVARA..KANNADA SIGN VISARGA +0CBE ; Right # Mc KANNADA VOWEL SIGN AA +0CC1..0CC4 ; Right # Mc [4] KANNADA VOWEL SIGN U..KANNADA VOWEL SIGN VOCALIC RR +0CD5..0CD6 ; Right # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0D02..0D03 ; Right # Mc [2] MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA +0D3E..0D40 
; Right # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D42 ; Right # Mn [2] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN UU +0D57 ; Right # Mc MALAYALAM AU LENGTH MARK +0D82..0D83 ; Right # Mc [2] SINHALA SIGN ANUSVARAYA..SINHALA SIGN VISARGAYA +0DCF..0DD1 ; Right # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD8 ; Right # Mc SINHALA VOWEL SIGN GAETTA-PILLA +0DDF ; Right # Mc SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Right # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Right # Lo THAI CHARACTER SARA A +0E32..0E33 ; Right # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E45 ; Right # Lo THAI CHARACTER LAKKHANGYAO +0EB0 ; Right # Lo LAO VOWEL SIGN A +0EB2..0EB3 ; Right # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0F3E ; Right # Mc TIBETAN SIGN YAR TSHES +0F7F ; Right # Mc TIBETAN SIGN RNAM BCAD +102B..102C ; Right # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +1038 ; Right # Mc MYANMAR SIGN VISARGA +103B ; Right # Mc MYANMAR CONSONANT SIGN MEDIAL YA +1056..1057 ; Right # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1062..1064 ; Right # Mc [3] MYANMAR VOWEL SIGN SGAW KAREN EU..MYANMAR TONE MARK SGAW KAREN KE PHO +1067..106D ; Right # Mc [7] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1083 ; Right # Mc MYANMAR VOWEL SIGN SHAN AA +1087..108C ; Right # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108F ; Right # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109C ; Right # Mc [3] MYANMAR SIGN KHAMTI TONE-1..MYANMAR VOWEL SIGN AITON A +17B6 ; Right # Mc KHMER VOWEL SIGN AA +17C7..17C8 ; Right # Mc [2] KHMER SIGN REAHMUK..KHMER SIGN YUUKALEAPINTU +1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI +1929..192B ; Right # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1930..1931 ; Right # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA 
+1933..1938 ; Right # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +19B0..19B4 ; Right # Lo [5] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN UU +19B8..19B9 ; Right # Lo [2] NEW TAI LUE VOWEL SIGN OA..NEW TAI LUE VOWEL SIGN UE +19BB..19C0 ; Right # Lo [6] NEW TAI LUE VOWEL SIGN AAY..NEW TAI LUE VOWEL SIGN IY +19C8..19C9 ; Right # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A1A ; Right # Mc BUGINESE VOWEL SIGN O +1A57 ; Right # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A61 ; Right # Mc TAI THAM VOWEL SIGN A +1A63..1A64 ; Right # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A6D ; Right # Mc TAI THAM VOWEL SIGN OY +1B04 ; Right # Mc BALINESE SIGN BISAH +1B35 ; Right # Mc BALINESE VOWEL SIGN TEDUNG +1B44 ; Right # Mc BALINESE ADEG ADEG +1B82 ; Right # Mc SUNDANESE SIGN PANGWISAD +1BA1 ; Right # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA7 ; Right # Mc SUNDANESE VOWEL SIGN PANOLONG +1BAA ; Right # Mc SUNDANESE SIGN PAMAAEH +1BE7 ; Right # Mc BATAK VOWEL SIGN E +1BEA..1BEC ; Right # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BEE ; Right # Mc BATAK VOWEL SIGN U +1BF2..1BF3 ; Right # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +1C24..1C26 ; Right # Mc [3] LEPCHA SUBJOINED LETTER YA..LEPCHA VOWEL SIGN AA +1C2A..1C2B ; Right # Mc [2] LEPCHA VOWEL SIGN U..LEPCHA VOWEL SIGN UU +1CE1 ; Right # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF7 ; Right # Mc VEDIC SIGN ATIKRAMA +A823..A824 ; Right # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A827 ; Right # Mc SYLOTI NAGRI VOWEL SIGN OO +A880..A881 ; Right # Mc [2] SAURASHTRA SIGN ANUSVARA..SAURASHTRA SIGN VISARGA +A8B4..A8C3 ; Right # Mc [16] SAURASHTRA CONSONANT SIGN HAARU..SAURASHTRA VOWEL SIGN AU +A952..A953 ; Right # Mc [2] REJANG CONSONANT SIGN H..REJANG VIRAMA +A983 ; Right # Mc JAVANESE SIGN WIGNYAN +A9B4..A9B5 ; Right # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9BE ; Right # Mc JAVANESE CONSONANT SIGN PENGKAL +AA33 ; Right # Mc 
CHAM CONSONANT SIGN YA +AA4D ; Right # Mc CHAM CONSONANT SIGN FINAL H +AA7B ; Right # Mc MYANMAR SIGN PAO KAREN TONE +AA7D ; Right # Mc MYANMAR SIGN TAI LAING TONE-5 +AAB1 ; Right # Lo TAI VIET VOWEL AA +AABA ; Right # Lo TAI VIET VOWEL UA +AABD ; Right # Lo TAI VIET VOWEL AN +AAEF ; Right # Mc MEETEI MAYEK VOWEL SIGN AAU +AAF5 ; Right # Mc MEETEI MAYEK VOWEL SIGN VISARGA +ABE3..ABE4 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE6..ABE7 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE9..ABEA ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +ABEC ; Right # Mc MEETEI MAYEK LUM IYEK +11000 ; Right # Mc BRAHMI SIGN CANDRABINDU +11002 ; Right # Mc BRAHMI SIGN VISARGA +11082 ; Right # Mc KAITHI SIGN VISARGA +110B0 ; Right # Mc KAITHI VOWEL SIGN AA +110B2 ; Right # Mc KAITHI VOWEL SIGN II +110B7..110B8 ; Right # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11145..11146 ; Right # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +11182 ; Right # Mc SHARADA SIGN VISARGA +111B3 ; Right # Mc SHARADA VOWEL SIGN AA +111B5 ; Right # Mc SHARADA VOWEL SIGN II +111C0 ; Right # Mc SHARADA SIGN VIRAMA +1122C..1122E ; Right # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +11235 ; Right # Mc KHOJKI SIGN VIRAMA +112E0 ; Right # Mc KHUDAWADI VOWEL SIGN AA +112E2 ; Right # Mc KHUDAWADI VOWEL SIGN II +11302..11303 ; Right # Mc [2] GRANTHA SIGN ANUSVARA..GRANTHA SIGN VISARGA +1133E..1133F ; Right # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11341..11344 ; Right # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +1134D ; Right # Mc GRANTHA SIGN VIRAMA +11357 ; Right # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Right # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435 ; Right # Mc NEWA VOWEL SIGN AA +11437 ; Right # Mc NEWA VOWEL SIGN II +11440..11441 ; Right # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +11445 ; Right # Mc NEWA SIGN VISARGA 
+114B0 ; Right # Mc TIRHUTA VOWEL SIGN AA +114B2 ; Right # Mc TIRHUTA VOWEL SIGN II +114BD ; Right # Mc TIRHUTA VOWEL SIGN SHORT O +114C1 ; Right # Mc TIRHUTA SIGN VISARGA +115AF ; Right # Mc SIDDHAM VOWEL SIGN AA +115B1 ; Right # Mc SIDDHAM VOWEL SIGN II +115BE ; Right # Mc SIDDHAM SIGN VISARGA +11630..11632 ; Right # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +1163B..1163C ; Right # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +1163E ; Right # Mc MODI SIGN VISARGA +116AC ; Right # Mc TAKRI SIGN VISARGA +116AF ; Right # Mc TAKRI VOWEL SIGN II +116B6 ; Right # Mc TAKRI SIGN VIRAMA +11720..11721 ; Right # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +1182C ; Right # Mc DOGRA VOWEL SIGN AA +1182E ; Right # Mc DOGRA VOWEL SIGN II +11838 ; Right # Mc DOGRA SIGN VISARGA +119D1 ; Right # Mc NANDINAGARI VOWEL SIGN AA +119D3 ; Right # Mc NANDINAGARI VOWEL SIGN II +119DC..119DF ; Right # Mc [4] NANDINAGARI VOWEL SIGN O..NANDINAGARI SIGN VISARGA +11A39 ; Right # Mc ZANABAZAR SQUARE SIGN VISARGA +11A57..11A58 ; Right # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A97 ; Right # Mc SOYOMBO SIGN VISARGA +11C2F ; Right # Mc BHAIKSUKI VOWEL SIGN AA +11C3E ; Right # Mc BHAIKSUKI SIGN VISARGA +11CA9 ; Right # Mc MARCHEN SUBJOINED LETTER YA +11CB4 ; Right # Mc MARCHEN VOWEL SIGN O +11D8A..11D8E ; Right # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D93..11D94 ; Right # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11D96 ; Right # Mc GUNJALA GONDI SIGN VISARGA +11EF6 ; Right # Mc MAKASAR VOWEL SIGN O + +# Indic_Positional_Category=Left + +093F ; Left # Mc DEVANAGARI VOWEL SIGN I +094E ; Left # Mc DEVANAGARI VOWEL SIGN PRISHTHAMATRA E +09BF ; Left # Mc BENGALI VOWEL SIGN I +09C7..09C8 ; Left # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +0A3F ; Left # Mc GURMUKHI VOWEL SIGN I +0ABF ; Left # Mc GUJARATI VOWEL SIGN I +0B47 ; Left # Mc ORIYA VOWEL SIGN E +0BC6..0BC8 ; Left # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI 
+0D46..0D48 ; Left # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0DD9 ; Left # Mc SINHALA VOWEL SIGN KOMBUVA +0DDB ; Left # Mc SINHALA VOWEL SIGN KOMBU DEKA +0F3F ; Left # Mc TIBETAN SIGN MAR TSHES +1031 ; Left # Mc MYANMAR VOWEL SIGN E +1084 ; Left # Mc MYANMAR VOWEL SIGN SHAN E +17C1..17C3 ; Left # Mc [3] KHMER VOWEL SIGN E..KHMER VOWEL SIGN AI +1A19 ; Left # Mc BUGINESE VOWEL SIGN E +1A55 ; Left # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A6E..1A72 ; Left # Mc [5] TAI THAM VOWEL SIGN E..TAI THAM VOWEL SIGN THAM AI +1B3E..1B3F ; Left # Mc [2] BALINESE VOWEL SIGN TALING..BALINESE VOWEL SIGN TALING REPA +1BA6 ; Left # Mc SUNDANESE VOWEL SIGN PANAELAENG +1C27..1C28 ; Left # Mc [2] LEPCHA VOWEL SIGN I..LEPCHA VOWEL SIGN O +1C34..1C35 ; Left # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A9BA..A9BB ; Left # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +AA2F..AA30 ; Left # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA34 ; Left # Mc CHAM CONSONANT SIGN RA +AAEB ; Left # Mc MEETEI MAYEK VOWEL SIGN II +AAEE ; Left # Mc MEETEI MAYEK VOWEL SIGN AU +110B1 ; Left # Mc KAITHI VOWEL SIGN I +1112C ; Left # Mc CHAKMA VOWEL SIGN E +111B4 ; Left # Mc SHARADA VOWEL SIGN I +112E1 ; Left # Mc KHUDAWADI VOWEL SIGN I +11347..11348 ; Left # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +11436 ; Left # Mc NEWA VOWEL SIGN I +114B1 ; Left # Mc TIRHUTA VOWEL SIGN I +114B9 ; Left # Mc TIRHUTA VOWEL SIGN E +115B0 ; Left # Mc SIDDHAM VOWEL SIGN I +115B8 ; Left # Mc SIDDHAM VOWEL SIGN E +116AE ; Left # Mc TAKRI VOWEL SIGN I +11726 ; Left # Mc AHOM VOWEL SIGN E +1182D ; Left # Mc DOGRA VOWEL SIGN I +119D2 ; Left # Mc NANDINAGARI VOWEL SIGN I +119E4 ; Left # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E +11CB1 ; Left # Mc MARCHEN VOWEL SIGN I +11EF5 ; Left # Mc MAKASAR VOWEL SIGN E + +# Indic_Positional_Category=Visual_Order_Left + +# These are dependent vowels that occur to the left of the consonant +# letter in a syllable, but which occur 
in scripts using the visual order +# model, instead of the logical order model. Because of the different +# model, these left-side vowels occur first in the backing store (before +# the consonant letter) and are not reordered during text rendering. +# +# [Derivation: Logical_Order_Exception=Yes] + +0E40..0E44 ; Visual_Order_Left # Lo [5] THAI CHARACTER SARA E..THAI CHARACTER SARA AI MAIMALAI +0EC0..0EC4 ; Visual_Order_Left # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +19B5..19B7 ; Visual_Order_Left # Lo [3] NEW TAI LUE VOWEL SIGN E..NEW TAI LUE VOWEL SIGN O +19BA ; Visual_Order_Left # Lo NEW TAI LUE VOWEL SIGN AY +AAB5..AAB6 ; Visual_Order_Left # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB9 ; Visual_Order_Left # Lo TAI VIET VOWEL UEA +AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL AY + +# Indic_Positional_Category=Left_And_Right + +09CB..09CC ; Left_And_Right # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +0B4B ; Left_And_Right # Mc ORIYA VOWEL SIGN O +0BCA..0BCC ; Left_And_Right # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0D4A..0D4C ; Left_And_Right # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0DDC ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA +0DDE ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA +17C0 ; Left_And_Right # Mc KHMER VOWEL SIGN IE +17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU +1B40..1B41 ; Left_And_Right # Mc [2] BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1134B..1134C ; Left_And_Right # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +114BC ; Left_And_Right # Mc TIRHUTA VOWEL SIGN O +114BE ; Left_And_Right # Mc TIRHUTA VOWEL SIGN AU +115BA ; Left_And_Right # Mc SIDDHAM VOWEL SIGN O + +# Indic_Positional_Category=Top + +0900..0902 ; Top # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +093A ; Top # Mn DEVANAGARI VOWEL SIGN OE +0945..0948 ; Top # Mn [4] DEVANAGARI VOWEL 
SIGN CANDRA E..DEVANAGARI VOWEL SIGN AI +0951 ; Top # Mn DEVANAGARI STRESS SIGN UDATTA +0953..0955 ; Top # Mn [3] DEVANAGARI GRAVE ACCENT..DEVANAGARI VOWEL SIGN CANDRA LONG E +0981 ; Top # Mn BENGALI SIGN CANDRABINDU +09FE ; Top # Mn BENGALI SANDHI MARK +0A01..0A02 ; Top # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A47..0A48 ; Top # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Top # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0A70..0A71 ; Top # Mn [2] GURMUKHI TIPPI..GURMUKHI ADDAK +0A81..0A82 ; Top # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0AC5 ; Top # Mn GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Top # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AFA..0AFF ; Top # Mn [6] GUJARATI SIGN SUKUN..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B01 ; Top # Mn ORIYA SIGN CANDRABINDU +0B3F ; Top # Mn ORIYA VOWEL SIGN I +0B56 ; Top # Mn ORIYA AI LENGTH MARK +0B82 ; Top # Mn TAMIL SIGN ANUSVARA +0BC0 ; Top # Mn TAMIL VOWEL SIGN II +0BCD ; Top # Mn TAMIL SIGN VIRAMA +0C00 ; Top # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C04 ; Top # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C3E..0C40 ; Top # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C46..0C47 ; Top # Mn [2] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN EE +0C4A..0C4D ; Top # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA +0C55 ; Top # Mn TELUGU LENGTH MARK +0C81 ; Top # Mn KANNADA SIGN CANDRABINDU +0CBF ; Top # Mn KANNADA VOWEL SIGN I +0CC6 ; Top # Mn KANNADA VOWEL SIGN E +0CCC..0CCD ; Top # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA +0D00..0D01 ; Top # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D3B..0D3C ; Top # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0D4D ; Top # Mn MALAYALAM SIGN VIRAMA +0DCA ; Top # Mn SINHALA SIGN AL-LAKUNA +0DD2..0DD3 ; Top # Mn [2] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN DIGA IS-PILLA +0E31 ; Top # Mn THAI CHARACTER MAI HAN-AKAT +0E34..0E37 ; 
Top # Mn [4] THAI CHARACTER SARA I..THAI CHARACTER SARA UEE +0E47..0E4E ; Top # Mn [8] THAI CHARACTER MAITAIKHU..THAI CHARACTER YAMAKKAN +0EB1 ; Top # Mn LAO VOWEL SIGN MAI KAN +0EB4..0EB7 ; Top # Mn [4] LAO VOWEL SIGN I..LAO VOWEL SIGN YY +0EBB ; Top # Mn LAO VOWEL SIGN MAI KON +0EC8..0ECD ; Top # Mn [6] LAO TONE MAI EK..LAO NIGGAHITA +0F39 ; Top # Mn TIBETAN MARK TSA -PHRU +0F72 ; Top # Mn TIBETAN VOWEL SIGN I +0F7A..0F7E ; Top # Mn [5] TIBETAN VOWEL SIGN E..TIBETAN SIGN RJES SU NGA RO +0F80 ; Top # Mn TIBETAN VOWEL SIGN REVERSED I +0F82..0F83 ; Top # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +0F86..0F87 ; Top # Mn [2] TIBETAN SIGN LCI RTAGS..TIBETAN SIGN YANG RTAGS +102D..102E ; Top # Mn [2] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN II +1032..1036 ; Top # Mn [5] MYANMAR VOWEL SIGN AI..MYANMAR SIGN ANUSVARA +103A ; Top # Mn MYANMAR SIGN ASAT +1071..1074 ; Top # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1085..1086 ; Top # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109D ; Top # Mn MYANMAR VOWEL SIGN AITON AI +1712 ; Top # Mn TAGALOG VOWEL SIGN I +1732 ; Top # Mn HANUNOO VOWEL SIGN I +1752 ; Top # Mn BUHID VOWEL SIGN I +1772 ; Top # Mn TAGBANWA VOWEL SIGN I +17B7..17BA ; Top # Mn [4] KHMER VOWEL SIGN I..KHMER VOWEL SIGN YY +17C6 ; Top # Mn KHMER SIGN NIKAHIT +17C9..17D1 ; Top # Mn [9] KHMER SIGN MUUSIKATOAN..KHMER SIGN VIRIAM +17D3 ; Top # Mn KHMER SIGN BATHAMASAT +17DD ; Top # Mn KHMER SIGN ATTHACAN +1920..1921 ; Top # Mn [2] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN I +1927..1928 ; Top # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Top # Mn LIMBU SIGN KEMPHRENG +1A17 ; Top # Mn BUGINESE VOWEL SIGN I +1A1B ; Top # Mn BUGINESE VOWEL SIGN AE +1A58..1A5A ; Top # Mn [3] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN LOW PA +1A62 ; Top # Mn TAI THAM VOWEL SIGN MAI SAT +1A65..1A68 ; Top # Mn [4] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN UUE +1A6B ; Top # Mn TAI THAM VOWEL SIGN O +1A73..1A7C 
; Top # Mn [10] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN KHUEN-LUE KARAN +1B00..1B03 ; Top # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG +1B34 ; Top # Mn BALINESE SIGN REREKAN +1B36..1B37 ; Top # Mn [2] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN ULU SARI +1B42 ; Top # Mn BALINESE VOWEL SIGN PEPET +1B6B ; Top # Mn BALINESE MUSICAL SYMBOL COMBINING TEGEH +1B6D..1B73 ; Top # Mn [7] BALINESE MUSICAL SYMBOL COMBINING KEMPUL..BALINESE MUSICAL SYMBOL COMBINING GONG +1B80..1B81 ; Top # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR +1BA4 ; Top # Mn SUNDANESE VOWEL SIGN PANGHULU +1BA8..1BA9 ; Top # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE6 ; Top # Mn BATAK SIGN TOMPI +1BE8..1BE9 ; Top # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BED ; Top # Mn BATAK VOWEL SIGN KARO O +1BEF..1BF1 ; Top # Mn [3] BATAK VOWEL SIGN U FOR SIMALUNGUN SA..BATAK CONSONANT SIGN H +1C2D..1C33 ; Top # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +1C36 ; Top # Mn LEPCHA SIGN RAN +1CD0..1CD2 ; Top # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CDA..1CDB ; Top # Mn [2] VEDIC TONE DOUBLE SVARITA..VEDIC TONE TRIPLE SVARITA +1CE0 ; Top # Mn VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CF4 ; Top # Mn VEDIC TONE CANDRA ABOVE +1DFB ; Top # Mn COMBINING DELETION MARK +20F0 ; Top # Mn COMBINING ASTERISK ABOVE +A802 ; Top # Mn SYLOTI NAGRI SIGN DVISVARA +A806 ; Top # Mn SYLOTI NAGRI SIGN HASANTA +A80B ; Top # Mn SYLOTI NAGRI SIGN ANUSVARA +A826 ; Top # Mn SYLOTI NAGRI VOWEL SIGN E +A8C5 ; Top # Mn SAURASHTRA SIGN CANDRABINDU +A8E0..A8F1 ; Top # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +A8FF ; Top # Mn DEVANAGARI VOWEL SIGN AY +A94A ; Top # Mn REJANG VOWEL SIGN AI +A94F..A951 ; Top # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A980..A982 ; Top # Mn [3] JAVANESE SIGN PANYANGGA..JAVANESE SIGN LAYAR +A9B3 ; Top # Mn JAVANESE SIGN CECAK TELU +A9B6..A9B7 ; Top # Mn [2] JAVANESE 
VOWEL SIGN WULU..JAVANESE VOWEL SIGN WULU MELIK +A9BC ; Top # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Top # Mn MYANMAR SIGN SHAN SAW +AA29..AA2C ; Top # Mn [4] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN EI +AA2E ; Top # Mn CHAM VOWEL SIGN OE +AA31 ; Top # Mn CHAM VOWEL SIGN AU +AA43 ; Top # Mn CHAM CONSONANT SIGN FINAL NG +AA4C ; Top # Mn CHAM CONSONANT SIGN FINAL M +AA7C ; Top # Mn MYANMAR SIGN TAI LAING TONE-2 +AAB0 ; Top # Mn TAI VIET MAI KANG +AAB2..AAB3 ; Top # Mn [2] TAI VIET VOWEL I..TAI VIET VOWEL UE +AAB7..AAB8 ; Top # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AABE..AABF ; Top # Mn [2] TAI VIET VOWEL AM..TAI VIET TONE MAI EK +AAC1 ; Top # Mn TAI VIET TONE MAI THO +AAED ; Top # Mn MEETEI MAYEK VOWEL SIGN AAI +ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP +10A05 ; Top # Mn KHAROSHTHI VOWEL SIGN E +10A0F ; Top # Mn KHAROSHTHI SIGN VISARGA +10A38 ; Top # Mn KHAROSHTHI SIGN BAR ABOVE +11001 ; Top # Mn BRAHMI SIGN ANUSVARA +11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II +11042..11046 ; Top # Mn [5] BRAHMI VOWEL SIGN E..BRAHMI VIRAMA +11080..11081 ; Top # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI VOWEL SIGN AI +11100..11102 ; Top # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA +11127..11129 ; Top # Mn [3] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN II +1112D ; Top # Mn CHAKMA VOWEL SIGN AI +11130 ; Top # Mn CHAKMA VOWEL SIGN OI +11134 ; Top # Mn CHAKMA MAAYYAA +11180..11181 ; Top # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +111BC..111BE ; Top # Mn [3] SHARADA VOWEL SIGN E..SHARADA VOWEL SIGN O +111CB ; Top # Mn SHARADA VOWEL MODIFIER MARK +11230..11231 ; Top # Mn [2] KHOJKI VOWEL SIGN E..KHOJKI VOWEL SIGN AI +11234 ; Top # Mn KHOJKI SIGN ANUSVARA +11236..11237 ; Top # Mn [2] KHOJKI SIGN NUKTA..KHOJKI SIGN SHADDA +1123E ; Top # Mn KHOJKI SIGN SUKUN +112DF ; Top # Mn KHUDAWADI SIGN ANUSVARA +112E5..112E8 ; Top # Mn [4] KHUDAWADI VOWEL SIGN E..KHUDAWADI VOWEL SIGN AU 
+11300..11301 ; Top # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11340 ; Top # Mn GRANTHA VOWEL SIGN II +11366..1136C ; Top # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Top # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA +1143E..1143F ; Top # Mn [2] NEWA VOWEL SIGN E..NEWA VOWEL SIGN AI +11443..11444 ; Top # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +1145E ; Top # Mn NEWA SANDHI MARK +114BA ; Top # Mn TIRHUTA VOWEL SIGN SHORT E +114BF..114C0 ; Top # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Top # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +11639..1163A ; Top # Mn [2] MODI VOWEL SIGN E..MODI VOWEL SIGN AI +1163D ; Top # Mn MODI SIGN ANUSVARA +11640 ; Top # Mn MODI SIGN ARDHACANDRA +116AB ; Top # Mn TAKRI SIGN ANUSVARA +116AD ; Top # Mn TAKRI VOWEL SIGN AA +116B2..116B5 ; Top # Mn [4] TAKRI VOWEL SIGN E..TAKRI VOWEL SIGN AU +1171F ; Top # Mn AHOM CONSONANT SIGN MEDIAL LIGATING RA +11722..11723 ; Top # Mn [2] AHOM VOWEL SIGN I..AHOM VOWEL SIGN II +11727 ; Top # Mn AHOM VOWEL SIGN AW +11729..1172B ; Top # Mn [3] AHOM VOWEL SIGN AI..AHOM SIGN KILLER +11833..11837 ; Top # Mn [5] DOGRA VOWEL SIGN E..DOGRA SIGN ANUSVARA +119DA..119DB ; Top # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI +11A01 ; Top # Mn ZANABAZAR SQUARE VOWEL SIGN I +11A04..11A09 ; Top # Mn [6] ZANABAZAR SQUARE VOWEL SIGN E..ZANABAZAR SQUARE VOWEL SIGN REVERSED I +11A35..11A38 ; Top # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A51 ; Top # Mn SOYOMBO VOWEL SIGN I +11A54..11A56 ; Top # Mn [3] SOYOMBO VOWEL SIGN E..SOYOMBO VOWEL SIGN OE +11A96 ; Top # Mn SOYOMBO SIGN ANUSVARA +11A98 ; Top # Mn SOYOMBO GEMINATION MARK +11C30..11C31 ; Top # Mn [2] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN II +11C38..11C3D ; Top # Mn [6] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI SIGN ANUSVARA +11CB3 ; Top # Mn MARCHEN VOWEL SIGN E +11CB5..11CB6 ; Top # Mn 
[2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D31..11D35 ; Top # Mn [5] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN UU +11D3A ; Top # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Top # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F..11D41 ; Top # Mn [3] MASARAM GONDI VOWEL SIGN AU..MASARAM GONDI SIGN VISARGA +11D43 ; Top # Mn MASARAM GONDI SIGN CANDRA +11D90..11D91 ; Top # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI +11D95 ; Top # Mn GUNJALA GONDI SIGN ANUSVARA +11EF3 ; Top # Mn MAKASAR VOWEL SIGN I + +# Indic_Positional_Category=Bottom + +093C ; Bottom # Mn DEVANAGARI SIGN NUKTA +0941..0944 ; Bottom # Mn [4] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN VOCALIC RR +094D ; Bottom # Mn DEVANAGARI SIGN VIRAMA +0952 ; Bottom # Mn DEVANAGARI STRESS SIGN ANUDATTA +0956..0957 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN UE..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BC ; Bottom # Mn BENGALI SIGN NUKTA +09C1..09C4 ; Bottom # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09CD ; Bottom # Mn BENGALI SIGN VIRAMA +09E2..09E3 ; Bottom # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3C ; Bottom # Mn GURMUKHI SIGN NUKTA +0A41..0A42 ; Bottom # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A4D ; Bottom # Mn GURMUKHI SIGN VIRAMA +0A51 ; Bottom # Mn GURMUKHI SIGN UDAAT +0A75 ; Bottom # Mn GURMUKHI SIGN YAKASH +0ABC ; Bottom # Mn GUJARATI SIGN NUKTA +0AC1..0AC4 ; Bottom # Mn [4] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN VOCALIC RR +0ACD ; Bottom # Mn GUJARATI SIGN VIRAMA +0AE2..0AE3 ; Bottom # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3C ; Bottom # Mn ORIYA SIGN NUKTA +0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B4D ; Bottom # Mn ORIYA SIGN VIRAMA +0B62..0B63 ; Bottom # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL 
+0C56 ; Bottom # Mn TELUGU AI LENGTH MARK +0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBC ; Bottom # Mn KANNADA SIGN NUKTA +0CE2..0CE3 ; Bottom # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D43..0D44 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC R..MALAYALAM VOWEL SIGN VOCALIC RR +0D62..0D63 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DD4 ; Bottom # Mn SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Bottom # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0E38..0E3A ; Bottom # Mn [3] THAI CHARACTER SARA U..THAI CHARACTER PHINTHU +0EB8..0EBA ; Bottom # Mn [3] LAO VOWEL SIGN U..LAO SIGN PALI VIRAMA +0EBC ; Bottom # Mn LAO SEMIVOWEL SIGN LO +0F18..0F19 ; Bottom # Mn [2] TIBETAN ASTROLOGICAL SIGN -KHYUD PA..TIBETAN ASTROLOGICAL SIGN SDONG TSHUGS +0F35 ; Bottom # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Bottom # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0F71 ; Bottom # Mn TIBETAN VOWEL SIGN AA +0F74..0F75 ; Bottom # Mn [2] TIBETAN VOWEL SIGN U..TIBETAN VOWEL SIGN UU +0F84 ; Bottom # Mn TIBETAN MARK HALANTA +0F8D..0F97 ; Bottom # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Bottom # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +0FC6 ; Bottom # Mn TIBETAN SYMBOL PADMA GDAN +102F..1030 ; Bottom # Mn [2] MYANMAR VOWEL SIGN U..MYANMAR VOWEL SIGN UU +1037 ; Bottom # Mn MYANMAR SIGN DOT BELOW +103D..103E ; Bottom # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +1058..1059 ; Bottom # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +105E..1060 ; Bottom # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Bottom # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +108D ; Bottom # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +1713..1714 ; Bottom # Mn [2] TAGALOG VOWEL SIGN U..TAGALOG SIGN VIRAMA +1733..1734 ; Bottom # Mn [2] HANUNOO VOWEL 
SIGN U..HANUNOO SIGN PAMUDPOD +1753 ; Bottom # Mn BUHID VOWEL SIGN U +1773 ; Bottom # Mn TAGBANWA VOWEL SIGN U +17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA +1922 ; Bottom # Mn LIMBU VOWEL SIGN U +1932 ; Bottom # Mn LIMBU SMALL LETTER ANUSVARA +1939 ; Bottom # Mn LIMBU SIGN MUKPHRENG +193B ; Bottom # Mn LIMBU SIGN SA-I +1A18 ; Bottom # Mn BUGINESE VOWEL SIGN U +1A56 ; Bottom # Mn TAI THAM CONSONANT SIGN MEDIAL LA +1A5B..1A5E ; Bottom # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1A69..1A6A ; Bottom # Mn [2] TAI THAM VOWEL SIGN U..TAI THAM VOWEL SIGN UU +1A6C ; Bottom # Mn TAI THAM VOWEL SIGN OA BELOW +1A7F ; Bottom # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1B38..1B3A ; Bottom # Mn [3] BALINESE VOWEL SIGN SUKU..BALINESE VOWEL SIGN RA REPA +1B6C ; Bottom # Mn BALINESE MUSICAL SYMBOL COMBINING ENDEP +1BA2..1BA3 ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BA5 ; Bottom # Mn SUNDANESE VOWEL SIGN PANYUKU +1BAC..1BAD ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C2C ; Bottom # Mn LEPCHA VOWEL SIGN E +1C37 ; Bottom # Mn LEPCHA SIGN NUKTA +1CD5..1CD9 ; Bottom # Mn [5] VEDIC TONE YAJURVEDIC AGGRAVATED INDEPENDENT SVARITA..VEDIC TONE YAJURVEDIC KATHAKA INDEPENDENT SVARITA SCHROEDER +1CDC..1CDF ; Bottom # Mn [4] VEDIC TONE KATHAKA ANUDATTA..VEDIC TONE THREE DOTS BELOW +1CED ; Bottom # Mn VEDIC SIGN TIRYAK +A825 ; Bottom # Mn SYLOTI NAGRI VOWEL SIGN U +A8C4 ; Bottom # Mn SAURASHTRA SIGN VIRAMA +A92B..A92D ; Bottom # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +A947..A949 ; Bottom # Mn [3] REJANG VOWEL SIGN I..REJANG VOWEL SIGN E +A94B..A94E ; Bottom # Mn [4] REJANG VOWEL SIGN O..REJANG VOWEL SIGN EA +A9B8..A9B9 ; Bottom # Mn [2] JAVANESE VOWEL SIGN SUKU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BD ; Bottom # Mn JAVANESE CONSONANT SIGN KERET +AA2D ; Bottom # Mn CHAM VOWEL SIGN U +AA32 ; Bottom # Mn CHAM VOWEL SIGN UE 
+AA35..AA36 ; Bottom # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +AAB4 ; Bottom # Mn TAI VIET VOWEL U +AAEC ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UU +ABE8 ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK +10A02..10A03 ; Bottom # Mn [2] KHAROSHTHI VOWEL SIGN U..KHAROSHTHI VOWEL SIGN VOCALIC R +10A0C..10A0E ; Bottom # Mn [3] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN ANUSVARA +10A39..10A3A ; Bottom # Mn [2] KHAROSHTHI SIGN CAUDA..KHAROSHTHI SIGN DOT BELOW +1103C..11041 ; Bottom # Mn [6] BRAHMI VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL +110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU +110B9..110BA ; Bottom # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +1112A..1112B ; Bottom # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU +11131..11132 ; Bottom # Mn [2] CHAKMA O MARK..CHAKMA AU MARK +11173 ; Bottom # Mn MAHAJANI SIGN NUKTA +111B6..111BB ; Bottom # Mn [6] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN VOCALIC LL +111C9..111CA ; Bottom # Mn [2] SHARADA SANDHI MARK..SHARADA SIGN NUKTA +111CC ; Bottom # Mn SHARADA EXTRA SHORT VOWEL MARK +1122F ; Bottom # Mn KHOJKI VOWEL SIGN U +112E3..112E4 ; Bottom # Mn [2] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN UU +112E9..112EA ; Bottom # Mn [2] KHUDAWADI SIGN NUKTA..KHUDAWADI SIGN VIRAMA +1133B..1133C ; Bottom # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +11438..1143D ; Bottom # Mn [6] NEWA VOWEL SIGN U..NEWA VOWEL SIGN VOCALIC LL +11442 ; Bottom # Mn NEWA SIGN VIRAMA +11446 ; Bottom # Mn NEWA SIGN NUKTA +114B3..114B8 ; Bottom # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114C2..114C3 ; Bottom # Mn [2] TIRHUTA SIGN VIRAMA..TIRHUTA SIGN NUKTA +115B2..115B5 ; Bottom # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115BF..115C0 ; Bottom # Mn [2] SIDDHAM SIGN VIRAMA..SIDDHAM SIGN NUKTA +115DC..115DD ; Bottom # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11633..11638 ; Bottom # Mn [6] MODI VOWEL 
SIGN U..MODI VOWEL SIGN VOCALIC LL +1163F ; Bottom # Mn MODI SIGN VIRAMA +116B0..116B1 ; Bottom # Mn [2] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN UU +116B7 ; Bottom # Mn TAKRI SIGN NUKTA +1171D ; Bottom # Mn AHOM CONSONANT SIGN MEDIAL LA +11724..11725 ; Bottom # Mn [2] AHOM VOWEL SIGN U..AHOM VOWEL SIGN UU +11728 ; Bottom # Mn AHOM VOWEL SIGN O +1182F..11832 ; Bottom # Mn [4] DOGRA VOWEL SIGN U..DOGRA VOWEL SIGN VOCALIC RR +11839..1183A ; Bottom # Mn [2] DOGRA SIGN VIRAMA..DOGRA SIGN NUKTA +119D4..119D7 ; Bottom # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR +119E0 ; Bottom # Mn NANDINAGARI SIGN VIRAMA +11A02..11A03 ; Bottom # Mn [2] ZANABAZAR SQUARE VOWEL SIGN UE..ZANABAZAR SQUARE VOWEL SIGN U +11A0A ; Bottom # Mn ZANABAZAR SQUARE VOWEL LENGTH MARK +11A33..11A34 ; Bottom # Mn [2] ZANABAZAR SQUARE FINAL CONSONANT MARK..ZANABAZAR SQUARE SIGN VIRAMA +11A3B..11A3E ; Bottom # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11A52..11A53 ; Bottom # Mn [2] SOYOMBO VOWEL SIGN UE..SOYOMBO VOWEL SIGN U +11A59..11A5B ; Bottom # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11A8A..11A95 ; Bottom # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A +11C32..11C36 ; Bottom # Mn [5] BHAIKSUKI VOWEL SIGN U..BHAIKSUKI VOWEL SIGN VOCALIC L +11C3F ; Bottom # Mn BHAIKSUKI SIGN VIRAMA +11C92..11CA7 ; Bottom # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CAA..11CB0 ; Bottom # Mn [7] MARCHEN SUBJOINED LETTER RA..MARCHEN VOWEL SIGN AA +11CB2 ; Bottom # Mn MARCHEN VOWEL SIGN U +11D36 ; Bottom # Mn MASARAM GONDI VOWEL SIGN VOCALIC R +11D42 ; Bottom # Mn MASARAM GONDI SIGN NUKTA +11D44 ; Bottom # Mn MASARAM GONDI SIGN HALANTA +11D47 ; Bottom # Mn MASARAM GONDI RA-KARA +11EF4 ; Bottom # Mn MAKASAR VOWEL SIGN U + +# Indic_Positional_Category=Top_And_Bottom + +0C48 ; Top_And_Bottom # Mn TELUGU VOWEL SIGN AI +0F73 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN II +0F76..0F79 ; 
Top_And_Bottom # Mn [4] TIBETAN VOWEL SIGN VOCALIC R..TIBETAN VOWEL SIGN VOCALIC LL +0F81 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN REVERSED II +1B3C ; Top_And_Bottom # Mn BALINESE VOWEL SIGN LA LENGA +1112E..1112F ; Top_And_Bottom # Mn [2] CHAKMA VOWEL SIGN O..CHAKMA VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Right + +0AC9 ; Top_And_Right # Mc GUJARATI VOWEL SIGN CANDRA O +0B57 ; Top_And_Right # Mc ORIYA AU LENGTH MARK +0CC0 ; Top_And_Right # Mc KANNADA VOWEL SIGN II +0CC7..0CC8 ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +1925..1926 ; Top_And_Right # Mc [2] LIMBU VOWEL SIGN OO..LIMBU VOWEL SIGN AU +1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG +111BF ; Top_And_Right # Mc SHARADA VOWEL SIGN AU +11232..11233 ; Top_And_Right # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Left + +0B48 ; Top_And_Left # Mc ORIYA VOWEL SIGN AI +0DDA ; Top_And_Left # Mc SINHALA VOWEL SIGN DIGA KOMBUVA +17BE ; Top_And_Left # Mc KHMER VOWEL SIGN OE +1C29 ; Top_And_Left # Mc LEPCHA VOWEL SIGN OO +114BB ; Top_And_Left # Mc TIRHUTA VOWEL SIGN AI +115B9 ; Top_And_Left # Mc SIDDHAM VOWEL SIGN AI + +# Indic_Positional_Category=Top_And_Left_And_Right + +0B4C ; Top_And_Left_And_Right # Mc ORIYA VOWEL SIGN AU +0DDD ; Top_And_Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA +17BF ; Top_And_Left_And_Right # Mc KHMER VOWEL SIGN YA +115BB ; Top_And_Left_And_Right # Mc SIDDHAM VOWEL SIGN AU + +# Indic_Positional_Category=Bottom_And_Right + +1B3B ; Bottom_And_Right # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +A9C0 ; Bottom_And_Right # Mc JAVANESE PANGKON + +# Indic_Positional_Category=Bottom_And_Left + +A9BF ; Bottom_And_Left # Mc JAVANESE CONSONANT SIGN CAKRA + +# Indic_Positional_Category=Top_And_Bottom_And_Right + +1B3D ; Top_And_Bottom_And_Right # Mc BALINESE VOWEL SIGN LA LENGA TEDUNG + +# 
Indic_Positional_Category=Overstruck + +1CD4 ; Overstruck # Mn VEDIC SIGN YAJURVEDIC MIDLINE SVARITA +1CE2..1CE8 ; Overstruck # Mn [7] VEDIC SIGN VISARGA SVARITA..VEDIC SIGN VISARGA ANUDATTA WITH TAIL +10A01 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN I +10A06 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN O + +# EOF diff --git a/data/12.0.0-indic-syllabic-category.txt b/data/12.0.0-indic-syllabic-category.txt new file mode 100644 index 0000000..723a669 --- /dev/null +++ b/data/12.0.0-indic-syllabic-category.txt @@ -0,0 +1,1286 @@ +# IndicSyllabicCategory-12.0.0.txt +# Date: 2019-01-31, 02:26:00 GMT [KW, RP] +# © 2019 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Syllabic_Category enumerated property +# +# Scope: This property is aimed at two general problem +# areas involving the analysis and processing of Indic scripts: +# +# 1. Specification of syllabic structure. +# 2. Specification of segmentation rules. +# +# Both of these problem areas may benefit from having defined subtypes +# of Indic script characters which are relevant to how Indic +# syllables (or aksaras) are constructed. Note that rules for +# syllabic structure in Indic scripts may differ significantly +# from how phonological syllables are defined. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Syllabic_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. 
+# +# The scripts assessed as Indic in the structural sense used for the +# Indic_Syllabic_Category are the following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dogra, Grantha, Gujarati, Gunjala Gondi, +# Gurmukhi, Hanunoo, Javanese, Kaithi, Kannada, Kayah Li, Kharoshthi, +# Khmer, Khojki, Khudawadi, Lao, Lepcha, Limbu, Mahajani, Makasar, +# Malayalam, Marchen, Masaram Gondi, Meetei Mayek, Modi, Multani, +# Myanmar, Nandinagari, Newa, New Tai Lue, Oriya, Phags-pa, Rejang, +# Saurashtra, Sharada, Siddham, Sinhala, Soyombo, Sundanese, Syloti +# Nagri, Tagalog, Tagbanwa, Tai Le, Tai Tham, Tai Viet, Takri, Tamil, +# Telugu, Thai, Tibetan, Tirhuta, and Zanabazar Square. +# +# All characters for all other scripts not in that list +# take the default value for this property, unless they +# are individually listed in this data file. +# + +# ================================================ + +# Property: Indic_Syllabic_Category +# +# All code points not explicitly listed for Indic_Syllabic_Category +# have the value Other. 
+# +# @missing: 0000..10FFFF; Other + +# ================================================ + +# Indic_Syllabic_Category=Bindu + +# Bindu/Anusvara (nasalization or -n) + +# [Not derivable] + +0900..0902 ; Bindu # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +0981 ; Bindu # Mn BENGALI SIGN CANDRABINDU +0982 ; Bindu # Mc BENGALI SIGN ANUSVARA +09FC ; Bindu # Lo BENGALI LETTER VEDIC ANUSVARA +0A01..0A02 ; Bindu # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A70 ; Bindu # Mn GURMUKHI TIPPI +0A81..0A82 ; Bindu # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0B01 ; Bindu # Mn ORIYA SIGN CANDRABINDU +0B02 ; Bindu # Mc ORIYA SIGN ANUSVARA +0B82 ; Bindu # Mn TAMIL SIGN ANUSVARA +0C00 ; Bindu # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C01..0C02 ; Bindu # Mc [2] TELUGU SIGN CANDRABINDU..TELUGU SIGN ANUSVARA +0C04 ; Bindu # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C80 ; Bindu # Lo KANNADA SIGN SPACING CANDRABINDU +0C81 ; Bindu # Mn KANNADA SIGN CANDRABINDU +0C82 ; Bindu # Mc KANNADA SIGN ANUSVARA +0D00..0D01 ; Bindu # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D02 ; Bindu # Mc MALAYALAM SIGN ANUSVARA +0D82 ; Bindu # Mc SINHALA SIGN ANUSVARAYA +0E4D ; Bindu # Mn THAI CHARACTER NIKHAHIT +0ECD ; Bindu # Mn LAO NIGGAHITA +0F7E ; Bindu # Mn TIBETAN SIGN RJES SU NGA RO +0F82..0F83 ; Bindu # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +1036 ; Bindu # Mn MYANMAR SIGN ANUSVARA +17C6 ; Bindu # Mn KHMER SIGN NIKAHIT +1932 ; Bindu # Mn LIMBU SMALL LETTER ANUSVARA +1A74 ; Bindu # Mn TAI THAM SIGN MAI KANG +1B00..1B02 ; Bindu # Mn [3] BALINESE SIGN ULU RICEM..BALINESE SIGN CECEK +1B80 ; Bindu # Mn SUNDANESE SIGN PANYECEK +1C34..1C35 ; Bindu # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A80B ; Bindu # Mn SYLOTI NAGRI SIGN ANUSVARA +A873 ; Bindu # Lo PHAGS-PA LETTER CANDRABINDU +A880 ; Bindu # Mc SAURASHTRA SIGN ANUSVARA +A8C5 ; Bindu # Mn SAURASHTRA SIGN CANDRABINDU 
+A8F2..A8F3 ; Bindu # Lo [2] DEVANAGARI SIGN SPACING CANDRABINDU..DEVANAGARI SIGN CANDRABINDU VIRAMA +A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK +10A0E ; Bindu # Mn KHAROSHTHI SIGN ANUSVARA +11000 ; Bindu # Mc BRAHMI SIGN CANDRABINDU +11001 ; Bindu # Mn BRAHMI SIGN ANUSVARA +11080..11081 ; Bindu # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +11100..11101 ; Bindu # Mn [2] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN ANUSVARA +11180..11181 ; Bindu # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +11234 ; Bindu # Mn KHOJKI SIGN ANUSVARA +112DF ; Bindu # Mn KHUDAWADI SIGN ANUSVARA +11300..11301 ; Bindu # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11302 ; Bindu # Mc GRANTHA SIGN ANUSVARA +1135E..1135F ; Bindu # Lo [2] GRANTHA LETTER VEDIC ANUSVARA..GRANTHA LETTER VEDIC DOUBLE ANUSVARA +11443..11444 ; Bindu # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +1145F ; Bindu # Lo NEWA LETTER VEDIC ANUSVARA +114BF..114C0 ; Bindu # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Bindu # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +1163D ; Bindu # Mn MODI SIGN ANUSVARA +116AB ; Bindu # Mn TAKRI SIGN ANUSVARA +11837 ; Bindu # Mn DOGRA SIGN ANUSVARA +119DE ; Bindu # Mc NANDINAGARI SIGN ANUSVARA +11A35..11A38 ; Bindu # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A96 ; Bindu # Mn SOYOMBO SIGN ANUSVARA +11C3C..11C3D ; Bindu # Mn [2] BHAIKSUKI SIGN CANDRABINDU..BHAIKSUKI SIGN ANUSVARA +11CB5..11CB6 ; Bindu # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D40 ; Bindu # Mn MASARAM GONDI SIGN ANUSVARA +11D95 ; Bindu # Mn GUNJALA GONDI SIGN ANUSVARA + +# ================================================ + +# Indic_Syllabic_Category=Visarga + +# Visarga (-h) +# Excludes letters for jihvamuliya and upadhmaniya, which are +# related, but structured somewhat differently. 
+ +# [Not derivable] + +0903 ; Visarga # Mc DEVANAGARI SIGN VISARGA +0983 ; Visarga # Mc BENGALI SIGN VISARGA +0A03 ; Visarga # Mc GURMUKHI SIGN VISARGA +0A83 ; Visarga # Mc GUJARATI SIGN VISARGA +0B03 ; Visarga # Mc ORIYA SIGN VISARGA +0C03 ; Visarga # Mc TELUGU SIGN VISARGA +0C83 ; Visarga # Mc KANNADA SIGN VISARGA +0D03 ; Visarga # Mc MALAYALAM SIGN VISARGA +0D83 ; Visarga # Mc SINHALA SIGN VISARGAYA +0F7F ; Visarga # Mc TIBETAN SIGN RNAM BCAD +1038 ; Visarga # Mc MYANMAR SIGN VISARGA +17C7 ; Visarga # Mc KHMER SIGN REAHMUK +1B04 ; Visarga # Mc BALINESE SIGN BISAH +1B82 ; Visarga # Mc SUNDANESE SIGN PANGWISAD +A881 ; Visarga # Mc SAURASHTRA SIGN VISARGA +A983 ; Visarga # Mc JAVANESE SIGN WIGNYAN +AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA +10A0F ; Visarga # Mn KHAROSHTHI SIGN VISARGA +11002 ; Visarga # Mc BRAHMI SIGN VISARGA +11082 ; Visarga # Mc KAITHI SIGN VISARGA +11102 ; Visarga # Mn CHAKMA SIGN VISARGA +11182 ; Visarga # Mc SHARADA SIGN VISARGA +11303 ; Visarga # Mc GRANTHA SIGN VISARGA +11445 ; Visarga # Mc NEWA SIGN VISARGA +114C1 ; Visarga # Mc TIRHUTA SIGN VISARGA +115BE ; Visarga # Mc SIDDHAM SIGN VISARGA +1163E ; Visarga # Mc MODI SIGN VISARGA +116AC ; Visarga # Mc TAKRI SIGN VISARGA +11838 ; Visarga # Mc DOGRA SIGN VISARGA +119DF ; Visarga # Mc NANDINAGARI SIGN VISARGA +11A39 ; Visarga # Mc ZANABAZAR SQUARE SIGN VISARGA +11A97 ; Visarga # Mc SOYOMBO SIGN VISARGA +11C3E ; Visarga # Mc BHAIKSUKI SIGN VISARGA +11D41 ; Visarga # Mn MASARAM GONDI SIGN VISARGA +11D96 ; Visarga # Mc GUNJALA GONDI SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Avagraha + +# Avagraha (elision of initial a- in sandhi) + +# [Not derivable] + +093D ; Avagraha # Lo DEVANAGARI SIGN AVAGRAHA +09BD ; Avagraha # Lo BENGALI SIGN AVAGRAHA +0ABD ; Avagraha # Lo GUJARATI SIGN AVAGRAHA +0B3D ; Avagraha # Lo ORIYA SIGN AVAGRAHA +0C3D ; Avagraha # Lo TELUGU SIGN AVAGRAHA +0CBD ; Avagraha # Lo KANNADA SIGN AVAGRAHA +0D3D ; Avagraha # 
Lo MALAYALAM SIGN AVAGRAHA +0F85 ; Avagraha # Po TIBETAN MARK PALUTA +17DC ; Avagraha # Lo KHMER SIGN AVAKRAHASANYA +1BBA ; Avagraha # Lo SUNDANESE AVAGRAHA +111C1 ; Avagraha # Lo SHARADA SIGN AVAGRAHA +1133D ; Avagraha # Lo GRANTHA SIGN AVAGRAHA +11447 ; Avagraha # Lo NEWA SIGN AVAGRAHA +114C4 ; Avagraha # Lo TIRHUTA SIGN AVAGRAHA +119E1 ; Avagraha # Lo NANDINAGARI SIGN AVAGRAHA +11A9D ; Avagraha # Lo SOYOMBO MARK PLUTA +11C40 ; Avagraha # Lo BHAIKSUKI SIGN AVAGRAHA + +# ================================================ + +# Indic_Syllabic_Category=Nukta + +# Nukta (diacritic for borrowed consonants or other consonant +# modifications). Note that while the resulting sound is typically a +# consonant, the base letter a nukta follows may be an independent +# vowel. For example, is used to transcribe ARABIC LETTER +# AIN. + +# [Not derivable] + +093C ; Nukta # Mn DEVANAGARI SIGN NUKTA +09BC ; Nukta # Mn BENGALI SIGN NUKTA +0A3C ; Nukta # Mn GURMUKHI SIGN NUKTA +0ABC ; Nukta # Mn GUJARATI SIGN NUKTA +0AFD..0AFF ; Nukta # Mn [3] GUJARATI SIGN THREE-DOT NUKTA ABOVE..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0CBC ; Nukta # Mn KANNADA SIGN NUKTA +0F39 ; Nukta # Mn TIBETAN MARK TSA -PHRU +1B34 ; Nukta # Mn BALINESE SIGN REREKAN +1BE6 ; Nukta # Mn BATAK SIGN TOMPI +1C37 ; Nukta # Mn LEPCHA SIGN NUKTA +A9B3 ; Nukta # Mn JAVANESE SIGN CECAK TELU +10A38..10A3A ; Nukta # Mn [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW +110BA ; Nukta # Mn KAITHI SIGN NUKTA +11173 ; Nukta # Mn MAHAJANI SIGN NUKTA +111CA ; Nukta # Mn SHARADA SIGN NUKTA +11236 ; Nukta # Mn KHOJKI SIGN NUKTA +112E9 ; Nukta # Mn KHUDAWADI SIGN NUKTA +1133B..1133C ; Nukta # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +11446 ; Nukta # Mn NEWA SIGN NUKTA +114C3 ; Nukta # Mn TIRHUTA SIGN NUKTA +115C0 ; Nukta # Mn SIDDHAM SIGN NUKTA +116B7 ; Nukta # Mn TAKRI SIGN NUKTA +1183A ; Nukta # Mn DOGRA SIGN NUKTA +11D42 ; Nukta # Mn MASARAM GONDI SIGN NUKTA + +# 
================================================ + +# Indic_Syllabic_Category=Virama + +# Virama (killing of inherent vowel in consonant sequence +# or consonant stacker) +# Only includes characters that can act both as visible killer viramas +# and consonant stackers. Separate property values exist for characters +# that can only act as pure killers or only as consonant stackers. + +# [Derivation: (ccc=9) - (InSC=Pure_Killer) - (InSC=Invisible_Stacker) +# - (InSC=Number_Joiner) - 2D7F] + +094D ; Virama # Mn DEVANAGARI SIGN VIRAMA +09CD ; Virama # Mn BENGALI SIGN VIRAMA +0A4D ; Virama # Mn GURMUKHI SIGN VIRAMA +0ACD ; Virama # Mn GUJARATI SIGN VIRAMA +0B4D ; Virama # Mn ORIYA SIGN VIRAMA +0BCD ; Virama # Mn TAMIL SIGN VIRAMA +0C4D ; Virama # Mn TELUGU SIGN VIRAMA +0CCD ; Virama # Mn KANNADA SIGN VIRAMA +0D4D ; Virama # Mn MALAYALAM SIGN VIRAMA +0DCA ; Virama # Mn SINHALA SIGN AL-LAKUNA +1B44 ; Virama # Mc BALINESE ADEG ADEG +A806 ; Virama # Mn SYLOTI NAGRI SIGN HASANTA +A8C4 ; Virama # Mn SAURASHTRA SIGN VIRAMA +A9C0 ; Virama # Mc JAVANESE PANGKON +11046 ; Virama # Mn BRAHMI VIRAMA +110B9 ; Virama # Mn KAITHI SIGN VIRAMA +111C0 ; Virama # Mc SHARADA SIGN VIRAMA +11235 ; Virama # Mc KHOJKI SIGN VIRAMA +1134D ; Virama # Mc GRANTHA SIGN VIRAMA +11442 ; Virama # Mn NEWA SIGN VIRAMA +114C2 ; Virama # Mn TIRHUTA SIGN VIRAMA +115BF ; Virama # Mn SIDDHAM SIGN VIRAMA +1163F ; Virama # Mn MODI SIGN VIRAMA +116B6 ; Virama # Mc TAKRI SIGN VIRAMA +11839 ; Virama # Mn DOGRA SIGN VIRAMA +119E0 ; Virama # Mn NANDINAGARI SIGN VIRAMA +11C3F ; Virama # Mn BHAIKSUKI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Pure_Killer + +# Pure killer (killing of inherent vowel in consonant sequence, +# with no consonant stacking behavior) + +# [Not derivable] + +0D3B..0D3C ; Pure_Killer # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0E3A ; Pure_Killer # Mn THAI CHARACTER PHINTHU +0E4E ; Pure_Killer # Mn THAI CHARACTER 
YAMAKKAN +0EBA ; Pure_Killer # Mn LAO SIGN PALI VIRAMA +0F84 ; Pure_Killer # Mn TIBETAN MARK HALANTA +103A ; Pure_Killer # Mn MYANMAR SIGN ASAT +1714 ; Pure_Killer # Mn TAGALOG SIGN VIRAMA +1734 ; Pure_Killer # Mn HANUNOO SIGN PAMUDPOD +17D1 ; Pure_Killer # Mn KHMER SIGN VIRIAM +1A7A ; Pure_Killer # Mn TAI THAM SIGN RA HAAM +1BAA ; Pure_Killer # Mc SUNDANESE SIGN PAMAAEH +1BF2..1BF3 ; Pure_Killer # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +A953 ; Pure_Killer # Mc REJANG VIRAMA +ABED ; Pure_Killer # Mn MEETEI MAYEK APUN IYEK +11134 ; Pure_Killer # Mn CHAKMA MAAYYAA +112EA ; Pure_Killer # Mn KHUDAWADI SIGN VIRAMA +1172B ; Pure_Killer # Mn AHOM SIGN KILLER +11A34 ; Pure_Killer # Mn ZANABAZAR SQUARE SIGN VIRAMA +11D44 ; Pure_Killer # Mn MASARAM GONDI SIGN HALANTA + +# ================================================ + +# Indic_Syllabic_Category=Invisible_Stacker + +# Invisible stacker (invisible consonant stacker virama). +# +# Note that in some scripts, such as Kharoshthi and Masaram Gondi, an invisible +# stacker may have a second function, changing the shape and/or location of the +# consonant preceding it, even when there is no consonant following the +# invisible stacker. 
+ +# [Not derivable] + +1039 ; Invisible_Stacker # Mn MYANMAR SIGN VIRAMA +17D2 ; Invisible_Stacker # Mn KHMER SIGN COENG +1A60 ; Invisible_Stacker # Mn TAI THAM SIGN SAKOT +1BAB ; Invisible_Stacker # Mn SUNDANESE SIGN VIRAMA +AAF6 ; Invisible_Stacker # Mn MEETEI MAYEK VIRAMA +10A3F ; Invisible_Stacker # Mn KHAROSHTHI VIRAMA +11133 ; Invisible_Stacker # Mn CHAKMA VIRAMA +11A47 ; Invisible_Stacker # Mn ZANABAZAR SQUARE SUBJOINER +11A99 ; Invisible_Stacker # Mn SOYOMBO SUBJOINER +11D45 ; Invisible_Stacker # Mn MASARAM GONDI VIRAMA +11D97 ; Invisible_Stacker # Mn GUNJALA GONDI VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Independent + +# Independent Vowels (contrasted with matras) + +# [Not derivable] + +0904..0914 ; Vowel_Independent # Lo [17] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER AU +0960..0961 ; Vowel_Independent # Lo [2] DEVANAGARI LETTER VOCALIC RR..DEVANAGARI LETTER VOCALIC LL +0972..0977 ; Vowel_Independent # Lo [6] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER UUE +0985..098C ; Vowel_Independent # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L +098F..0990 ; Vowel_Independent # Lo [2] BENGALI LETTER E..BENGALI LETTER AI +0993..0994 ; Vowel_Independent # Lo [2] BENGALI LETTER O..BENGALI LETTER AU +09E0..09E1 ; Vowel_Independent # Lo [2] BENGALI LETTER VOCALIC RR..BENGALI LETTER VOCALIC LL +0A05..0A0A ; Vowel_Independent # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU +0A0F..0A10 ; Vowel_Independent # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI +0A13..0A14 ; Vowel_Independent # Lo [2] GURMUKHI LETTER OO..GURMUKHI LETTER AU +0A85..0A8D ; Vowel_Independent # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E +0A8F..0A91 ; Vowel_Independent # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O +0A93..0A94 ; Vowel_Independent # Lo [2] GUJARATI LETTER O..GUJARATI LETTER AU +0AE0..0AE1 ; Vowel_Independent # Lo [2] GUJARATI LETTER VOCALIC RR..GUJARATI LETTER VOCALIC LL +0B05..0B0C ; Vowel_Independent # Lo [8] 
ORIYA LETTER A..ORIYA LETTER VOCALIC L +0B0F..0B10 ; Vowel_Independent # Lo [2] ORIYA LETTER E..ORIYA LETTER AI +0B13..0B14 ; Vowel_Independent # Lo [2] ORIYA LETTER O..ORIYA LETTER AU +0B60..0B61 ; Vowel_Independent # Lo [2] ORIYA LETTER VOCALIC RR..ORIYA LETTER VOCALIC LL +0B85..0B8A ; Vowel_Independent # Lo [6] TAMIL LETTER A..TAMIL LETTER UU +0B8E..0B90 ; Vowel_Independent # Lo [3] TAMIL LETTER E..TAMIL LETTER AI +0B92..0B94 ; Vowel_Independent # Lo [3] TAMIL LETTER O..TAMIL LETTER AU +0C05..0C0C ; Vowel_Independent # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L +0C0E..0C10 ; Vowel_Independent # Lo [3] TELUGU LETTER E..TELUGU LETTER AI +0C12..0C14 ; Vowel_Independent # Lo [3] TELUGU LETTER O..TELUGU LETTER AU +0C60..0C61 ; Vowel_Independent # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL +0C85..0C8C ; Vowel_Independent # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L +0C8E..0C90 ; Vowel_Independent # Lo [3] KANNADA LETTER E..KANNADA LETTER AI +0C92..0C94 ; Vowel_Independent # Lo [3] KANNADA LETTER O..KANNADA LETTER AU +0CE0..0CE1 ; Vowel_Independent # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL +0D05..0D0C ; Vowel_Independent # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L +0D0E..0D10 ; Vowel_Independent # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI +0D12..0D14 ; Vowel_Independent # Lo [3] MALAYALAM LETTER O..MALAYALAM LETTER AU +0D5F..0D61 ; Vowel_Independent # Lo [3] MALAYALAM LETTER ARCHAIC II..MALAYALAM LETTER VOCALIC LL +0D85..0D96 ; Vowel_Independent # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA +1021..102A ; Vowel_Independent # Lo [10] MYANMAR LETTER A..MYANMAR LETTER AU +1052..1055 ; Vowel_Independent # Lo [4] MYANMAR LETTER VOCALIC R..MYANMAR LETTER VOCALIC LL +1700..1702 ; Vowel_Independent # Lo [3] TAGALOG LETTER A..TAGALOG LETTER U +1720..1722 ; Vowel_Independent # Lo [3] HANUNOO LETTER A..HANUNOO LETTER U +1740..1742 ; Vowel_Independent # Lo [3] BUHID LETTER A..BUHID LETTER U +1760..1762 ; 
Vowel_Independent # Lo [3] TAGBANWA LETTER A..TAGBANWA LETTER U +17A3..17B3 ; Vowel_Independent # Lo [17] KHMER INDEPENDENT VOWEL QAQ..KHMER INDEPENDENT VOWEL QAU +1A4D..1A52 ; Vowel_Independent # Lo [6] TAI THAM LETTER I..TAI THAM LETTER OO +1B05..1B12 ; Vowel_Independent # Lo [14] BALINESE LETTER AKARA..BALINESE LETTER OKARA TEDUNG +1B83..1B89 ; Vowel_Independent # Lo [7] SUNDANESE LETTER A..SUNDANESE LETTER EU +1BE4..1BE5 ; Vowel_Independent # Lo [2] BATAK LETTER I..BATAK LETTER U +A800..A801 ; Vowel_Independent # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I +A803..A805 ; Vowel_Independent # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O +A882..A891 ; Vowel_Independent # Lo [16] SAURASHTRA LETTER A..SAURASHTRA LETTER AU +A8FE ; Vowel_Independent # Lo DEVANAGARI LETTER AY +A984..A988 ; Vowel_Independent # Lo [5] JAVANESE LETTER A..JAVANESE LETTER U +A98C..A98E ; Vowel_Independent # Lo [3] JAVANESE LETTER E..JAVANESE LETTER O +AA00..AA05 ; Vowel_Independent # Lo [6] CHAM LETTER A..CHAM LETTER O +AAE0..AAE1 ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER E..MEETEI MAYEK LETTER O +ABCE..ABCF ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER UN..MEETEI MAYEK LETTER I +ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA +11005..11012 ; Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU +11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER A..KAITHI LETTER AU +11103..11106 ; Vowel_Independent # Lo [4] CHAKMA LETTER AA..CHAKMA LETTER E +11183..11190 ; Vowel_Independent # Lo [14] SHARADA LETTER A..SHARADA LETTER AU +11200..11207 ; Vowel_Independent # Lo [8] KHOJKI LETTER A..KHOJKI LETTER AU +11280..11283 ; Vowel_Independent # Lo [4] MULTANI LETTER A..MULTANI LETTER E +112B0..112B9 ; Vowel_Independent # Lo [10] KHUDAWADI LETTER A..KHUDAWADI LETTER AU +11305..1130C ; Vowel_Independent # Lo [8] GRANTHA LETTER A..GRANTHA LETTER VOCALIC L +1130F..11310 ; Vowel_Independent # Lo [2] GRANTHA LETTER EE..GRANTHA LETTER AI +11313..11314 ; 
Vowel_Independent # Lo [2] GRANTHA LETTER OO..GRANTHA LETTER AU +11360..11361 ; Vowel_Independent # Lo [2] GRANTHA LETTER VOCALIC RR..GRANTHA LETTER VOCALIC LL +11400..1140D ; Vowel_Independent # Lo [14] NEWA LETTER A..NEWA LETTER AU +11481..1148E ; Vowel_Independent # Lo [14] TIRHUTA LETTER A..TIRHUTA LETTER AU +11580..1158D ; Vowel_Independent # Lo [14] SIDDHAM LETTER A..SIDDHAM LETTER AU +115D8..115DB ; Vowel_Independent # Lo [4] SIDDHAM LETTER THREE-CIRCLE ALTERNATE I..SIDDHAM LETTER ALTERNATE U +11600..1160D ; Vowel_Independent # Lo [14] MODI LETTER A..MODI LETTER AU +11680..11689 ; Vowel_Independent # Lo [10] TAKRI LETTER A..TAKRI LETTER AU +11800..11809 ; Vowel_Independent # Lo [10] DOGRA LETTER A..DOGRA LETTER AU +119A0..119A7 ; Vowel_Independent # Lo [8] NANDINAGARI LETTER A..NANDINAGARI LETTER VOCALIC RR +119AA..119AD ; Vowel_Independent # Lo [4] NANDINAGARI LETTER E..NANDINAGARI LETTER AU +11A00 ; Vowel_Independent # Lo ZANABAZAR SQUARE LETTER A +11A50 ; Vowel_Independent # Lo SOYOMBO LETTER A +11C00..11C08 ; Vowel_Independent # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L +11C0A..11C0D ; Vowel_Independent # Lo [4] BHAIKSUKI LETTER E..BHAIKSUKI LETTER AU +11D00..11D06 ; Vowel_Independent # Lo [7] MASARAM GONDI LETTER A..MASARAM GONDI LETTER E +11D08..11D09 ; Vowel_Independent # Lo [2] MASARAM GONDI LETTER AI..MASARAM GONDI LETTER O +11D0B ; Vowel_Independent # Lo MASARAM GONDI LETTER AU +11D60..11D65 ; Vowel_Independent # Lo [6] GUNJALA GONDI LETTER A..GUNJALA GONDI LETTER UU +11D67..11D68 ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER EE..GUNJALA GONDI LETTER AI +11D6A..11D6B ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER OO..GUNJALA GONDI LETTER AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Dependent + +# Dependent Vowels (contrasted with independent vowels and/or with +# complex placement). Known as matras in Indic scripts. 
Also +# includes vowel modifiers that follow dependent (and sometimes +# independent) vowels. + +# [Not derivable] + +093A ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN OE +093B ; Vowel_Dependent # Mc DEVANAGARI VOWEL SIGN OOE +093E..0940 ; Vowel_Dependent # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II +0941..0948 ; Vowel_Dependent # Mn [8] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN AI +0949..094C ; Vowel_Dependent # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094E..094F ; Vowel_Dependent # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA E..DEVANAGARI VOWEL SIGN AW +0955..0957 ; Vowel_Dependent # Mn [3] DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Vowel_Dependent # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BE..09C0 ; Vowel_Dependent # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II +09C1..09C4 ; Vowel_Dependent # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09C7..09C8 ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +09CB..09CC ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +09D7 ; Vowel_Dependent # Mc BENGALI AU LENGTH MARK +09E2..09E3 ; Vowel_Dependent # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3E..0A40 ; Vowel_Dependent # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II +0A41..0A42 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A47..0A48 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0ABE..0AC0 ; Vowel_Dependent # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL SIGN II +0AC1..0AC5 ; Vowel_Dependent # Mn [5] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AC9 ; Vowel_Dependent # Mc GUJARATI VOWEL SIGN CANDRA O +0ACB..0ACC ; Vowel_Dependent # 
Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0AE2..0AE3 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3E ; Vowel_Dependent # Mc ORIYA VOWEL SIGN AA +0B3F ; Vowel_Dependent # Mn ORIYA VOWEL SIGN I +0B40 ; Vowel_Dependent # Mc ORIYA VOWEL SIGN II +0B41..0B44 ; Vowel_Dependent # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B47..0B48 ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI +0B4B..0B4C ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU +0B56 ; Vowel_Dependent # Mn ORIYA AI LENGTH MARK +0B57 ; Vowel_Dependent # Mc ORIYA AU LENGTH MARK +0B62..0B63 ; Vowel_Dependent # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BBE..0BBF ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC0 ; Vowel_Dependent # Mn TAMIL VOWEL SIGN II +0BC1..0BC2 ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BC6..0BC8 ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0BCA..0BCC ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0BD7 ; Vowel_Dependent # Mc TAMIL AU LENGTH MARK +0C3E..0C40 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C41..0C44 ; Vowel_Dependent # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C46..0C48 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI +0C4A..0C4C ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C55..0C56 ; Vowel_Dependent # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK +0C62..0C63 ; Vowel_Dependent # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBE ; Vowel_Dependent # Mc KANNADA VOWEL SIGN AA +0CBF ; Vowel_Dependent # Mn KANNADA VOWEL SIGN I +0CC0..0CC4 ; Vowel_Dependent # Mc [5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN VOCALIC RR +0CC6 ; Vowel_Dependent # Mn KANNADA VOWEL SIGN E +0CC7..0CC8 ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI 
+0CCA..0CCB ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +0CCC ; Vowel_Dependent # Mn KANNADA VOWEL SIGN AU +0CD5..0CD6 ; Vowel_Dependent # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CE2..0CE3 ; Vowel_Dependent # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D3E..0D40 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D44 ; Vowel_Dependent # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D46..0D48 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0D4A..0D4C ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0D57 ; Vowel_Dependent # Mc MALAYALAM AU LENGTH MARK +0D62..0D63 ; Vowel_Dependent # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DCF..0DD1 ; Vowel_Dependent # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD2..0DD4 ; Vowel_Dependent # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Vowel_Dependent # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0DD8..0DDF ; Vowel_Dependent # Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Vowel_Dependent # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Vowel_Dependent # Lo THAI CHARACTER SARA A +0E31 ; Vowel_Dependent # Mn THAI CHARACTER MAI HAN-AKAT +0E32..0E33 ; Vowel_Dependent # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E34..0E39 ; Vowel_Dependent # Mn [6] THAI CHARACTER SARA I..THAI CHARACTER SARA UU +0E40..0E45 ; Vowel_Dependent # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO +0E47 ; Vowel_Dependent # Mn THAI CHARACTER MAITAIKHU +0EB0 ; Vowel_Dependent # Lo LAO VOWEL SIGN A +0EB1 ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KAN +0EB2..0EB3 ; Vowel_Dependent # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0EB4..0EB9 ; Vowel_Dependent # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU +0EBB 
; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KON +0EC0..0EC4 ; Vowel_Dependent # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +0F71..0F7D ; Vowel_Dependent # Mn [13] TIBETAN VOWEL SIGN AA..TIBETAN VOWEL SIGN OO +0F80..0F81 ; Vowel_Dependent # Mn [2] TIBETAN VOWEL SIGN REVERSED I..TIBETAN VOWEL SIGN REVERSED II +102B..102C ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +102D..1030 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN UU +1031 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN E +1032..1035 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +1056..1057 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1058..1059 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1062 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1071..1074 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1083..1084 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E +1085..1086 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109C ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN AITON A +109D ; Vowel_Dependent # Mn MYANMAR VOWEL SIGN AITON AI +1712..1713 ; Vowel_Dependent # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U +1732..1733 ; Vowel_Dependent # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1752..1753 ; Vowel_Dependent # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U +1772..1773 ; Vowel_Dependent # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U +17B6 ; Vowel_Dependent # Mc KHMER VOWEL SIGN AA +17B7..17BD ; Vowel_Dependent # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL SIGN UA +17BE..17C5 ; Vowel_Dependent # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU +17C8 ; Vowel_Dependent # Mc KHMER SIGN YUUKALEAPINTU 
+1920..1922 ; Vowel_Dependent # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U +1923..1926 ; Vowel_Dependent # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU +1927..1928 ; Vowel_Dependent # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Vowel_Dependent # Mn LIMBU SIGN KEMPHRENG +19B0..19C0 ; Vowel_Dependent # Lo [17] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN IY +1A17..1A18 ; Vowel_Dependent # Mn [2] BUGINESE VOWEL SIGN I..BUGINESE VOWEL SIGN U +1A19..1A1A ; Vowel_Dependent # Mc [2] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN O +1A1B ; Vowel_Dependent # Mn BUGINESE VOWEL SIGN AE +1A61 ; Vowel_Dependent # Mc TAI THAM VOWEL SIGN A +1A62 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN MAI SAT +1A63..1A64 ; Vowel_Dependent # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A65..1A6C ; Vowel_Dependent # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW +1A6D..1A72 ; Vowel_Dependent # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI +1A73 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN OA ABOVE +1B35 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN TEDUNG +1B36..1B3A ; Vowel_Dependent # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA +1B3B ; Vowel_Dependent # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +1B3C ; Vowel_Dependent # Mn BALINESE VOWEL SIGN LA LENGA +1B3D..1B41 ; Vowel_Dependent # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1B42 ; Vowel_Dependent # Mn BALINESE VOWEL SIGN PEPET +1B43 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN PEPET TEDUNG +1BA4..1BA5 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PANGHULU..SUNDANESE VOWEL SIGN PANYUKU +1BA6..1BA7 ; Vowel_Dependent # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL SIGN PANOLONG +1BA8..1BA9 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE7 ; Vowel_Dependent # Mc BATAK VOWEL SIGN E +1BE8..1BE9 ; Vowel_Dependent # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE 
+1BEA..1BEC ; Vowel_Dependent # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BED ; Vowel_Dependent # Mn BATAK VOWEL SIGN KARO O +1BEE ; Vowel_Dependent # Mc BATAK VOWEL SIGN U +1BEF ; Vowel_Dependent # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +1C26..1C2B ; Vowel_Dependent # Mc [6] LEPCHA VOWEL SIGN AA..LEPCHA VOWEL SIGN UU +1C2C ; Vowel_Dependent # Mn LEPCHA VOWEL SIGN E +A802 ; Vowel_Dependent # Mn SYLOTI NAGRI SIGN DVISVARA +A823..A824 ; Vowel_Dependent # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A825..A826 ; Vowel_Dependent # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E +A827 ; Vowel_Dependent # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Vowel_Dependent # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A8FF ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN AY +A947..A94E ; Vowel_Dependent # Mn [8] REJANG VOWEL SIGN I..REJANG VOWEL SIGN EA +A9B4..A9B5 ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9B6..A9B9 ; Vowel_Dependent # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BA..A9BB ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +A9BC ; Vowel_Dependent # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Vowel_Dependent # Mn MYANMAR SIGN SHAN SAW +AA29..AA2E ; Vowel_Dependent # Mn [6] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN OE +AA2F..AA30 ; Vowel_Dependent # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA31..AA32 ; Vowel_Dependent # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE +AAB0 ; Vowel_Dependent # Mn TAI VIET MAI KANG +AAB1 ; Vowel_Dependent # Lo TAI VIET VOWEL AA +AAB2..AAB4 ; Vowel_Dependent # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U +AAB5..AAB6 ; Vowel_Dependent # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB7..AAB8 ; Vowel_Dependent # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AAB9..AABD ; Vowel_Dependent # Lo [5] TAI VIET VOWEL UEA..TAI VIET VOWEL AN +AABE ; Vowel_Dependent # Mn TAI VIET VOWEL AM +AAEB ; Vowel_Dependent # Mc 
MEETEI MAYEK VOWEL SIGN II +AAEC..AAED ; Vowel_Dependent # Mn [2] MEETEI MAYEK VOWEL SIGN UU..MEETEI MAYEK VOWEL SIGN AAI +AAEE..AAEF ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN AU..MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE5 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN ANAP +ABE6..ABE7 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE8 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +10A01..10A03 ; Vowel_Dependent # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R +10A05..10A06 ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O +10A0C..10A0D ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN DOUBLE RING BELOW +11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +110B0..110B2 ; Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II +110B3..110B6 ; Vowel_Dependent # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI +110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11127..1112B ; Vowel_Dependent # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU +1112C ; Vowel_Dependent # Mc CHAKMA VOWEL SIGN E +1112D..11132 ; Vowel_Dependent # Mn [6] CHAKMA VOWEL SIGN AI..CHAKMA AU MARK +11145..11146 ; Vowel_Dependent # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +111B3..111B5 ; Vowel_Dependent # Mc [3] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN II +111B6..111BE ; Vowel_Dependent # Mn [9] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN O +111BF ; Vowel_Dependent # Mc SHARADA VOWEL SIGN AU +111CB..111CC ; Vowel_Dependent # Mn [2] SHARADA VOWEL MODIFIER MARK..SHARADA EXTRA SHORT VOWEL MARK +1122C..1122E ; Vowel_Dependent # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +1122F..11231 ; Vowel_Dependent # Mn 
[3] KHOJKI VOWEL SIGN U..KHOJKI VOWEL SIGN AI +11232..11233 ; Vowel_Dependent # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU +112E0..112E2 ; Vowel_Dependent # Mc [3] KHUDAWADI VOWEL SIGN AA..KHUDAWADI VOWEL SIGN II +112E3..112E8 ; Vowel_Dependent # Mn [6] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN AU +1133E..1133F ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11340 ; Vowel_Dependent # Mn GRANTHA VOWEL SIGN II +11341..11344 ; Vowel_Dependent # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +11347..11348 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +1134B..1134C ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +11357 ; Vowel_Dependent # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435..11437 ; Vowel_Dependent # Mc [3] NEWA VOWEL SIGN AA..NEWA VOWEL SIGN II +11438..1143F ; Vowel_Dependent # Mn [8] NEWA VOWEL SIGN U..NEWA VOWEL SIGN AI +11440..11441 ; Vowel_Dependent # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +114B0..114B2 ; Vowel_Dependent # Mc [3] TIRHUTA VOWEL SIGN AA..TIRHUTA VOWEL SIGN II +114B3..114B8 ; Vowel_Dependent # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114B9 ; Vowel_Dependent # Mc TIRHUTA VOWEL SIGN E +114BA ; Vowel_Dependent # Mn TIRHUTA VOWEL SIGN SHORT E +114BB..114BE ; Vowel_Dependent # Mc [4] TIRHUTA VOWEL SIGN AI..TIRHUTA VOWEL SIGN AU +115AF..115B1 ; Vowel_Dependent # Mc [3] SIDDHAM VOWEL SIGN AA..SIDDHAM VOWEL SIGN II +115B2..115B5 ; Vowel_Dependent # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115B8..115BB ; Vowel_Dependent # Mc [4] SIDDHAM VOWEL SIGN E..SIDDHAM VOWEL SIGN AU +115DC..115DD ; Vowel_Dependent # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11630..11632 ; Vowel_Dependent # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +11633..1163A ; Vowel_Dependent # Mn [8] MODI VOWEL SIGN U..MODI VOWEL SIGN 
AI +1163B..1163C ; Vowel_Dependent # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +11640 ; Vowel_Dependent # Mn MODI SIGN ARDHACANDRA +116AD ; Vowel_Dependent # Mn TAKRI VOWEL SIGN AA +116AE..116AF ; Vowel_Dependent # Mc [2] TAKRI VOWEL SIGN I..TAKRI VOWEL SIGN II +116B0..116B5 ; Vowel_Dependent # Mn [6] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN AU +11720..11721 ; Vowel_Dependent # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +11722..11725 ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN I..AHOM VOWEL SIGN UU +11726 ; Vowel_Dependent # Mc AHOM VOWEL SIGN E +11727..1172A ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN AW..AHOM VOWEL SIGN AM +1182C..1182E ; Vowel_Dependent # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II +1182F..11836 ; Vowel_Dependent # Mn [8] DOGRA VOWEL SIGN U..DOGRA VOWEL SIGN AU +119D1..119D3 ; Vowel_Dependent # Mc [3] NANDINAGARI VOWEL SIGN AA..NANDINAGARI VOWEL SIGN II +119D4..119D7 ; Vowel_Dependent # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR +119DA..119DB ; Vowel_Dependent # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI +119DC..119DD ; Vowel_Dependent # Mc [2] NANDINAGARI VOWEL SIGN O..NANDINAGARI VOWEL SIGN AU +119E4 ; Vowel_Dependent # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E +11A01..11A0A ; Vowel_Dependent # Mn [10] ZANABAZAR SQUARE VOWEL SIGN I..ZANABAZAR SQUARE VOWEL LENGTH MARK +11A51..11A56 ; Vowel_Dependent # Mn [6] SOYOMBO VOWEL SIGN I..SOYOMBO VOWEL SIGN OE +11A57..11A58 ; Vowel_Dependent # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A59..11A5B ; Vowel_Dependent # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11C2F ; Vowel_Dependent # Mc BHAIKSUKI VOWEL SIGN AA +11C30..11C36 ; Vowel_Dependent # Mn [7] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN VOCALIC L +11C38..11C3B ; Vowel_Dependent # Mn [4] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI VOWEL SIGN AU +11CB0 ; Vowel_Dependent # Mn MARCHEN VOWEL SIGN AA +11CB1 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN I +11CB2..11CB3 ; Vowel_Dependent # Mn 
[2] MARCHEN VOWEL SIGN U..MARCHEN VOWEL SIGN E +11CB4 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN O +11D31..11D36 ; Vowel_Dependent # Mn [6] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN VOCALIC R +11D3A ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Vowel_Dependent # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN AU +11D43 ; Vowel_Dependent # Mn MASARAM GONDI SIGN CANDRA +11D8A..11D8E ; Vowel_Dependent # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D90..11D91 ; Vowel_Dependent # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI +11D93..11D94 ; Vowel_Dependent # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11EF3..11EF4 ; Vowel_Dependent # Mn [2] MAKASAR VOWEL SIGN I..MAKASAR VOWEL SIGN U +11EF5..11EF6 ; Vowel_Dependent # Mc [2] MAKASAR VOWEL SIGN E..MAKASAR VOWEL SIGN O + +# ================================================ + +# Indic_Syllabic_Category=Vowel + +# (Other) Vowels (reanalyzed as ordinary alphabetic letters or marks) + +# [Not derivable] + +1963..196D ; Vowel # Lo [11] TAI LE LETTER A..TAI LE LETTER AI +A85E..A861 ; Vowel # Lo [4] PHAGS-PA LETTER I..PHAGS-PA LETTER O +A866 ; Vowel # Lo PHAGS-PA LETTER EE +A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO +A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O +11150..11154 ; Vowel # Lo [5] MAHAJANI LETTER A..MAHAJANI LETTER O + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Placeholder + +# Consonant Placeholder +# This includes generic placeholders used for +# Indic script layout (NBSP and dotted circle), as well as a few script- +# specific vowel-holder characters which are not technically +# consonants, but serve instead as bases for placement of vowel marks. 
+ +# [Not derivable] + +002D ; Consonant_Placeholder # Pd HYPHEN-MINUS +00A0 ; Consonant_Placeholder # Zs NO-BREAK SPACE +00D7 ; Consonant_Placeholder # Sm MULTIPLICATION SIGN +0980 ; Consonant_Placeholder # Lo BENGALI ANJI +0A72..0A73 ; Consonant_Placeholder # Lo [2] GURMUKHI IRI..GURMUKHI URA +104B ; Consonant_Placeholder # Po MYANMAR SIGN SECTION +104E ; Consonant_Placeholder # Po MYANMAR SYMBOL AFOREMENTIONED +1900 ; Consonant_Placeholder # Lo LIMBU VOWEL-CARRIER LETTER +1CFA ; Consonant_Placeholder # Lo VEDIC SIGN DOUBLE ANUSVARA ANTARGOMUKHA +2010..2014 ; Consonant_Placeholder # Pd [5] HYPHEN..EM DASH +25CC ; Consonant_Placeholder # So DOTTED CIRCLE +AA74..AA76 ; Consonant_Placeholder # Lo [3] MYANMAR LOGOGRAM KHAMTI OAY..MYANMAR LOGOGRAM KHAMTI HM +11A3F ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL HEAD MARK +11A45 ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL DOUBLE-LINED HEAD MARK +11EF2 ; Consonant_Placeholder # Lo MAKASAR ANGKA + +# ================================================ + +# Indic_Syllabic_Category=Consonant + +# Consonant (ordinary abugida consonants, with inherent vowels) + +# [Not derivable] + +0915..0939 ; Consonant # Lo [37] DEVANAGARI LETTER KA..DEVANAGARI LETTER HA +0958..095F ; Consonant # Lo [8] DEVANAGARI LETTER QA..DEVANAGARI LETTER YYA +0978..097F ; Consonant # Lo [8] DEVANAGARI LETTER MARWARI DDA..DEVANAGARI LETTER BBA +0995..09A8 ; Consonant # Lo [20] BENGALI LETTER KA..BENGALI LETTER NA +09AA..09B0 ; Consonant # Lo [7] BENGALI LETTER PA..BENGALI LETTER RA +09B2 ; Consonant # Lo BENGALI LETTER LA +09B6..09B9 ; Consonant # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA +09DC..09DD ; Consonant # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA +09DF ; Consonant # Lo BENGALI LETTER YYA +09F0..09F1 ; Consonant # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH LOWER DIAGONAL +0A15..0A28 ; Consonant # Lo [20] GURMUKHI LETTER KA..GURMUKHI LETTER NA +0A2A..0A30 ; Consonant # Lo [7] GURMUKHI LETTER 
PA..GURMUKHI LETTER RA +0A32..0A33 ; Consonant # Lo [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA +0A35..0A36 ; Consonant # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA +0A38..0A39 ; Consonant # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA +0A59..0A5C ; Consonant # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA +0A5E ; Consonant # Lo GURMUKHI LETTER FA +0A95..0AA8 ; Consonant # Lo [20] GUJARATI LETTER KA..GUJARATI LETTER NA +0AAA..0AB0 ; Consonant # Lo [7] GUJARATI LETTER PA..GUJARATI LETTER RA +0AB2..0AB3 ; Consonant # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA +0AB5..0AB9 ; Consonant # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA +0AF9 ; Consonant # Lo GUJARATI LETTER ZHA +0B15..0B28 ; Consonant # Lo [20] ORIYA LETTER KA..ORIYA LETTER NA +0B2A..0B30 ; Consonant # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA +0B32..0B33 ; Consonant # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA +0B35..0B39 ; Consonant # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA +0B5C..0B5D ; Consonant # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA +0B5F ; Consonant # Lo ORIYA LETTER YYA +0B71 ; Consonant # Lo ORIYA LETTER WA +0B95 ; Consonant # Lo TAMIL LETTER KA +0B99..0B9A ; Consonant # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA +0B9C ; Consonant # Lo TAMIL LETTER JA +0B9E..0B9F ; Consonant # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA +0BA3..0BA4 ; Consonant # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA +0BA8..0BAA ; Consonant # Lo [3] TAMIL LETTER NA..TAMIL LETTER PA +0BAE..0BB9 ; Consonant # Lo [12] TAMIL LETTER MA..TAMIL LETTER HA +0C15..0C28 ; Consonant # Lo [20] TELUGU LETTER KA..TELUGU LETTER NA +0C2A..0C39 ; Consonant # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C58..0C5A ; Consonant # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C95..0CA8 ; Consonant # Lo [20] KANNADA LETTER KA..KANNADA LETTER NA +0CAA..0CB3 ; Consonant # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA +0CB5..0CB9 ; Consonant # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA +0CDE ; Consonant # Lo KANNADA LETTER FA +0D15..0D3A ; 
Consonant # Lo [38] MALAYALAM LETTER KA..MALAYALAM LETTER TTTA +0D9A..0DB1 ; Consonant # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA +0DB3..0DBB ; Consonant # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA +0DBD ; Consonant # Lo SINHALA LETTER DANTAJA LAYANNA +0DC0..0DC6 ; Consonant # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA +0E01..0E2E ; Consonant # Lo [46] THAI CHARACTER KO KAI..THAI CHARACTER HO NOKHUK +0E81..0E82 ; Consonant # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG +0E84 ; Consonant # Lo LAO LETTER KHO TAM +0E86..0E8A ; Consonant # Lo [5] LAO LETTER PALI GHA..LAO LETTER SO TAM +0E8C..0EA3 ; Consonant # Lo [24] LAO LETTER PALI JHA..LAO LETTER LO LING +0EA5 ; Consonant # Lo LAO LETTER LO LOOT +0EA7..0EAE ; Consonant # Lo [8] LAO LETTER WO..LAO LETTER HO TAM +0EDC..0EDF ; Consonant # Lo [4] LAO HO NO..LAO LETTER KHMU NYO +0F40..0F47 ; Consonant # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA +0F49..0F6C ; Consonant # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA +1000..1020 ; Consonant # Lo [33] MYANMAR LETTER KA..MYANMAR LETTER LLA +103F ; Consonant # Lo MYANMAR LETTER GREAT SA +1050..1051 ; Consonant # Lo [2] MYANMAR LETTER SHA..MYANMAR LETTER SSA +105A..105D ; Consonant # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE +1061 ; Consonant # Lo MYANMAR LETTER SGAW KAREN SHA +1065..1066 ; Consonant # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER WESTERN PWO KAREN PWA +106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA +1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA +108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA +1703..170C ; Consonant # Lo [10] TAGALOG LETTER KA..TAGALOG LETTER YA +170E..1711 ; Consonant # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1723..1731 ; Consonant # Lo [15] HANUNOO LETTER KA..HANUNOO LETTER HA +1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA 
+1763..176C ; Consonant # Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA +176E..1770 ; Consonant # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA +1780..17A2 ; Consonant # Lo [35] KHMER LETTER KA..KHMER LETTER QA +1901..191E ; Consonant # Lo [30] LIMBU LETTER KA..LIMBU LETTER TRA +1950..1962 ; Consonant # Lo [19] TAI LE LETTER KA..TAI LE LETTER NA +1980..19AB ; Consonant # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI LUE LETTER LOW SUA +1A00..1A16 ; Consonant # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA +1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA +1A53..1A54 ; Consonant # Lo [2] TAI THAM LETTER LAE..TAI THAM LETTER GREAT SA +1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA +1B45..1B4B ; Consonant # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA +1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA +1BBB..1BBD ; Consonant # Lo [3] SUNDANESE LETTER REU..SUNDANESE LETTER BHA +1BC0..1BE3 ; Consonant # Lo [36] BATAK LETTER A..BATAK LETTER MBA +1C00..1C23 ; Consonant # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A +1C4D..1C4F ; Consonant # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA +A807..A80A ; Consonant # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO +A80C..A822 ; Consonant # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO +A840..A85D ; Consonant # Lo [30] PHAGS-PA LETTER KA..PHAGS-PA LETTER A +A862..A865 ; Consonant # Lo [4] PHAGS-PA LETTER QA..PHAGS-PA LETTER GGA +A869..A870 ; Consonant # Lo [8] PHAGS-PA LETTER TTA..PHAGS-PA LETTER ASPIRATED FA +A872 ; Consonant # Lo PHAGS-PA SUPERFIXED LETTER RA +A892..A8B3 ; Consonant # Lo [34] SAURASHTRA LETTER KA..SAURASHTRA LETTER LLA +A90A..A921 ; Consonant # Lo [24] KAYAH LI LETTER KA..KAYAH LI LETTER CA +A930..A946 ; Consonant # Lo [23] REJANG LETTER KA..REJANG LETTER A +A989..A98B ; Consonant # Lo [3] JAVANESE LETTER PA CEREK..JAVANESE 
LETTER NGA LELET RASWADI +A98F..A9B2 ; Consonant # Lo [36] JAVANESE LETTER KA..JAVANESE LETTER HA +A9E0..A9E4 ; Consonant # Lo [5] MYANMAR LETTER SHAN GHA..MYANMAR LETTER SHAN BHA +A9E7..A9EF ; Consonant # Lo [9] MYANMAR LETTER TAI LAING NYA..MYANMAR LETTER TAI LAING NNA +A9FA..A9FE ; Consonant # Lo [5] MYANMAR LETTER TAI LAING LLA..MYANMAR LETTER TAI LAING BHA +AA06..AA28 ; Consonant # Lo [35] CHAM LETTER KA..CHAM LETTER HA +AA60..AA6F ; Consonant # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA +AA71..AA73 ; Consonant # Lo [3] MYANMAR LETTER KHAMTI XA..MYANMAR LETTER KHAMTI RA +AA7A ; Consonant # Lo MYANMAR LETTER AITON RA +AA7E..AA7F ; Consonant # Lo [2] MYANMAR LETTER SHWE PALAUNG CHA..MYANMAR LETTER SHWE PALAUNG SHA +AA80..AAAF ; Consonant # Lo [48] TAI VIET LETTER LOW KO..TAI VIET LETTER HIGH O +AAE2..AAEA ; Consonant # Lo [9] MEETEI MAYEK LETTER CHA..MEETEI MAYEK LETTER SSA +ABC0..ABCD ; Consonant # Lo [14] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER HUK +ABD0 ; Consonant # Lo MEETEI MAYEK LETTER PHAM +ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTER BHAM +10A00 ; Consonant # Lo KHAROSHTHI LETTER A +10A10..10A13 ; Consonant # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA +10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA +10A19..10A35 ; Consonant # Lo [29] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER VHA +11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER OLD TAMIL NNNA +1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA +11107..11126 ; Consonant # Lo [32] CHAKMA LETTER KAA..CHAKMA LETTER HAA +11144 ; Consonant # Lo CHAKMA LETTER LHAA +11155..11172 ; Consonant # Lo [30] MAHAJANI LETTER KA..MAHAJANI LETTER RRA +11191..111B2 ; Consonant # Lo [34] SHARADA LETTER KA..SHARADA LETTER HA +11208..11211 ; Consonant # Lo [10] KHOJKI LETTER KA..KHOJKI LETTER JJA +11213..1122B ; Consonant # Lo [25] KHOJKI LETTER NYA..KHOJKI LETTER LLA +11284..11286 ; Consonant # Lo 
[3] MULTANI LETTER KA..MULTANI LETTER GA +11288 ; Consonant # Lo MULTANI LETTER GHA +1128A..1128D ; Consonant # Lo [4] MULTANI LETTER CA..MULTANI LETTER JJA +1128F..1129D ; Consonant # Lo [15] MULTANI LETTER NYA..MULTANI LETTER BA +1129F..112A8 ; Consonant # Lo [10] MULTANI LETTER BHA..MULTANI LETTER RHA +112BA..112DE ; Consonant # Lo [37] KHUDAWADI LETTER KA..KHUDAWADI LETTER HA +11315..11328 ; Consonant # Lo [20] GRANTHA LETTER KA..GRANTHA LETTER NA +1132A..11330 ; Consonant # Lo [7] GRANTHA LETTER PA..GRANTHA LETTER RA +11332..11333 ; Consonant # Lo [2] GRANTHA LETTER LA..GRANTHA LETTER LLA +11335..11339 ; Consonant # Lo [5] GRANTHA LETTER VA..GRANTHA LETTER HA +1140E..11434 ; Consonant # Lo [39] NEWA LETTER KA..NEWA LETTER HA +1148F..114AF ; Consonant # Lo [33] TIRHUTA LETTER KA..TIRHUTA LETTER HA +1158E..115AE ; Consonant # Lo [33] SIDDHAM LETTER KA..SIDDHAM LETTER HA +1160E..1162F ; Consonant # Lo [34] MODI LETTER KA..MODI LETTER LLA +1168A..116AA ; Consonant # Lo [33] TAKRI LETTER KA..TAKRI LETTER RRA +116B8 ; Consonant # Lo TAKRI LETTER ARCHAIC KHA +11700..1171A ; Consonant # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA +1180A..1182B ; Consonant # Lo [34] DOGRA LETTER KA..DOGRA LETTER RRA +119AE..119D0 ; Consonant # Lo [35] NANDINAGARI LETTER KA..NANDINAGARI LETTER RRA +11A0B..11A32 ; Consonant # Lo [40] ZANABAZAR SQUARE LETTER KA..ZANABAZAR SQUARE LETTER KSSA +11A5C..11A83 ; Consonant # Lo [40] SOYOMBO LETTER KA..SOYOMBO LETTER KSSA +11C0E..11C2E ; Consonant # Lo [33] BHAIKSUKI LETTER KA..BHAIKSUKI LETTER HA +11C72..11C8F ; Consonant # Lo [30] MARCHEN LETTER KA..MARCHEN LETTER A +11D0C..11D30 ; Consonant # Lo [37] MASARAM GONDI LETTER KA..MASARAM GONDI LETTER TRA +11D6C..11D89 ; Consonant # Lo [30] GUNJALA GONDI LETTER YA..GUNJALA GONDI LETTER SA +11EE0..11EF1 ; Consonant # Lo [18] MAKASAR LETTER KA..MAKASAR LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Dead + +# Dead Consonant (special consonant 
with killed vowel) + +# [Not derivable] + +09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0D54..0D56 ; Consonant_Dead # Lo [3] MALAYALAM LETTER CHILLU M..MALAYALAM LETTER CHILLU LLL +0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K +1CF2..1CF3 ; Consonant_Dead # Lo [2] VEDIC SIGN ARDHAVISARGA..VEDIC SIGN ROTATED ARDHAVISARGA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_With_Stacker + +# Consonants that may make stacked ligatures with the next consonant +# without the use of a virama + +# [Not derivable] + +0CF1..0CF2 ; Consonant_With_Stacker # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA +1CF5..1CF6 ; Consonant_With_Stacker # Lo [2] VEDIC SIGN JIHVAMULIYA..VEDIC SIGN UPADHMANIYA +11003..11004 ; Consonant_With_Stacker # Lo [2] BRAHMI SIGN JIHVAMULIYA..BRAHMI SIGN UPADHMANIYA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Prefixed + +# Cluster-initial consonants + +# [Not derivable] + +111C2..111C3 ; Consonant_Prefixed # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA +11A3A ; Consonant_Prefixed # Lo ZANABAZAR SQUARE CLUSTER-INITIAL LETTER RA +11A84..11A89 ; Consonant_Prefixed # Lo [6] SOYOMBO SIGN JIHVAMULIYA..SOYOMBO CLUSTER-INITIAL LETTER SA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Preceding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when preceding the main +# consonant. + +# [Not derivable] + +0D4E ; Consonant_Preceding_Repha # Lo MALAYALAM LETTER DOT REPH +11D46 ; Consonant_Preceding_Repha # Lo MASARAM GONDI REPHA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Initial_Postfixed + +# Consonants that succeed the main consonant in character sequences, but are +# pronounced before it. 
+ +# [Not derivable] + +1A5A ; Consonant_Initial_Postfixed # Mn TAI THAM CONSONANT SIGN LOW PA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Succeeding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when succeeding the main +# consonant. + +# [Not derivable] + +17CC ; Consonant_Succeeding_Repha # Mn KHMER SIGN ROBAT +1B03 ; Consonant_Succeeding_Repha # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Succeeding_Repha # Mn SUNDANESE SIGN PANGLAYAR +A982 ; Consonant_Succeeding_Repha # Mn JAVANESE SIGN LAYAR + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Subjoined + +# Subjoined Consonant (C2 form subtending a base consonant in Tibetan, etc.) + +# [Not derivable] + +0F8D..0F97 ; Consonant_Subjoined # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Consonant_Subjoined # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +1929..192B ; Consonant_Subjoined # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1A57 ; Consonant_Subjoined # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A5B..1A5E ; Consonant_Subjoined # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1BA1 ; Consonant_Subjoined # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA2..1BA3 ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BAC..1BAD ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C24..1C25 ; Consonant_Subjoined # Mc [2] LEPCHA SUBJOINED LETTER YA..LEPCHA SUBJOINED LETTER RA +A867..A868 ; Consonant_Subjoined # Lo [2] PHAGS-PA SUBJOINED LETTER WA..PHAGS-PA SUBJOINED LETTER YA +A871 ; Consonant_Subjoined # Lo PHAGS-PA SUBJOINED LETTER RA +11C92..11CA7 ; Consonant_Subjoined # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CA9 ; Consonant_Subjoined # Mc MARCHEN SUBJOINED LETTER YA 
+11CAA..11CAF ; Consonant_Subjoined # Mn [6] MARCHEN SUBJOINED LETTER RA..MARCHEN SUBJOINED LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Medial + +# Medial Consonant (medial liquid, occurring in clusters) + +# [Not derivable] + +0A75 ; Consonant_Medial # Mn GURMUKHI SIGN YAKASH +0EBC ; Consonant_Medial # Mn LAO SEMIVOWEL SIGN LO +0EBD ; Consonant_Medial # Lo LAO SEMIVOWEL SIGN NYO +103B..103C ; Consonant_Medial # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA +103D..103E ; Consonant_Medial # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +105E..1060 ; Consonant_Medial # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Consonant_Medial # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +1A55 ; Consonant_Medial # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A56 ; Consonant_Medial # Mn TAI THAM CONSONANT SIGN MEDIAL LA +A8B4 ; Consonant_Medial # Mc SAURASHTRA CONSONANT SIGN HAARU +A9BD ; Consonant_Medial # Mn JAVANESE CONSONANT SIGN KERET +A9BE..A9BF ; Consonant_Medial # Mc [2] JAVANESE CONSONANT SIGN PENGKAL..JAVANESE CONSONANT SIGN CAKRA +AA33..AA34 ; Consonant_Medial # Mc [2] CHAM CONSONANT SIGN YA..CHAM CONSONANT SIGN RA +AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +1171D..1171F ; Consonant_Medial # Mn [3] AHOM CONSONANT SIGN MEDIAL LA..AHOM CONSONANT SIGN MEDIAL LIGATING RA +11A3B..11A3E ; Consonant_Medial # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11D47 ; Consonant_Medial # Mn MASARAM GONDI RA-KARA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Final + +# Final Consonant (special final forms which do not take vowels) + +# [Not derivable] + +1930..1931 ; Consonant_Final # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Consonant_Final # Mc [6] LIMBU SMALL LETTER TA..LIMBU 
SMALL LETTER LA +1939 ; Consonant_Final # Mn LIMBU SIGN MUKPHRENG +19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B +1A58..1A59 ; Consonant_Final # Mn [2] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN FINAL NGA +1BBE..1BBF ; Consonant_Final # Lo [2] SUNDANESE LETTER FINAL K..SUNDANESE LETTER FINAL M +1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H +1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +A94F..A951 ; Consonant_Final # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A952 ; Consonant_Final # Mc REJANG CONSONANT SIGN H +AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG +AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG +AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS +AA4C ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL M +AA4D ; Consonant_Final # Mc CHAM CONSONANT SIGN FINAL H +ABDB..ABE2 ; Consonant_Final # Lo [8] MEETEI MAYEK LETTER KOK LONSUM..MEETEI MAYEK LETTER I LONSUM +11A8A..11A95 ; Consonant_Final # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Head_Letter + +# Head Letter (Tibetan) + +# [Not derivable] + +0F88..0F8C ; Consonant_Head_Letter # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN + +# ================================================ + +# Indic_Syllabic_Category=Modifying_Letter + +# Reanalyzed letters not participating in the abugida structure, but +# serving to modify the sound of an adjacent vowel or consonant. +# Note that this is not the same as General_Category=Modifier_Letter. 
+ +# [Not derivable] + +0B83 ; Modifying_Letter # Lo TAMIL SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Tone_Letter + +# Tone Letter (spacing lexical tone mark with status as a letter) + +# [Not derivable] + +1970..1974 ; Tone_Letter # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6 +AAC0 ; Tone_Letter # Lo TAI VIET TONE MAI NUENG +AAC2 ; Tone_Letter # Lo TAI VIET TONE MAI SONG + +# ================================================ + +# Indic_Syllabic_Category=Tone_Mark + +# Tone Mark (nonspacing or spacing lexical tone mark) + +# [Not derivable] + +0E48..0E4B ; Tone_Mark # Mn [4] THAI CHARACTER MAI EK..THAI CHARACTER MAI CHATTAWA +0EC8..0ECB ; Tone_Mark # Mn [4] LAO TONE MAI EK..LAO TONE MAI CATAWA +1037 ; Tone_Mark # Mn MYANMAR SIGN DOT BELOW +1063..1064 ; Tone_Mark # Mc [2] MYANMAR TONE MARK SGAW KAREN HATHI..MYANMAR TONE MARK SGAW KAREN KE PHO +1069..106D ; Tone_Mark # Mc [5] MYANMAR SIGN WESTERN PWO KAREN TONE-1..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1087..108C ; Tone_Mark # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108D ; Tone_Mark # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +108F ; Tone_Mark # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109B ; Tone_Mark # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 +19C8..19C9 ; Tone_Mark # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A75..1A79 ; Tone_Mark # Mn [5] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN TONE-5 +A92B..A92D ; Tone_Mark # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +AA7B ; Tone_Mark # Mc MYANMAR SIGN PAO KAREN TONE +AA7C ; Tone_Mark # Mn MYANMAR SIGN TAI LAING TONE-2 +AA7D ; Tone_Mark # Mc MYANMAR SIGN TAI LAING TONE-5 +AABF ; Tone_Mark # Mn TAI VIET TONE MAI EK +AAC1 ; Tone_Mark # Mn TAI VIET TONE MAI THO +ABEC ; Tone_Mark # Mc MEETEI MAYEK LUM IYEK + +# ================================================ + +# Indic_Syllabic_Category=Gemination_Mark + +# Gemination Mark (doubling of the 
preceding or following consonant) + +# [Not derivable] + +0A71 ; Gemination_Mark # Mn GURMUKHI ADDAK +11237 ; Gemination_Mark # Mn KHOJKI SIGN SHADDA +11A98 ; Gemination_Mark # Mn SOYOMBO GEMINATION MARK + +# ================================================ + +# Indic_Syllabic_Category=Cantillation_Mark + +# Cantillation Mark (recitation marks, such as svara markers for the Samaveda) + +# [Not derivable] + +0951..0952 ; Cantillation_Mark # Mn [2] DEVANAGARI STRESS SIGN UDATTA..DEVANAGARI STRESS SIGN ANUDATTA +0A51 ; Cantillation_Mark # Mn GURMUKHI SIGN UDAAT +0AFA..0AFC ; Cantillation_Mark # Mn [3] GUJARATI SIGN SUKUN..GUJARATI SIGN MADDAH +1CD0..1CD2 ; Cantillation_Mark # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CD4..1CE0 ; Cantillation_Mark # Mn [13] VEDIC SIGN YAJURVEDIC MIDLINE SVARITA..VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CE1 ; Cantillation_Mark # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF4 ; Cantillation_Mark # Mn VEDIC TONE CANDRA ABOVE +1CF7 ; Cantillation_Mark # Mc VEDIC SIGN ATIKRAMA +1CF8..1CF9 ; Cantillation_Mark # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE +20F0 ; Cantillation_Mark # Mn COMBINING ASTERISK ABOVE +A8E0..A8F1 ; Cantillation_Mark # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +1123E ; Cantillation_Mark # Mn KHOJKI SIGN SUKUN +11366..1136C ; Cantillation_Mark # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Cantillation_Mark # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA + +# ================================================ + +# Indic_Syllabic_Category=Register_Shifter + +# Register Shifter (shifts register for consonants, akin to a tone mark) + +# [Not derivable] + +17C9..17CA ; Register_Shifter # Mn [2] KHMER SIGN MUUSIKATOAN..KHMER SIGN TRIISAP + +# ================================================ + +# Indic_Syllabic_Category=Syllable_Modifier + +# Syllable Modifier (miscellaneous combining characters that 
modify +# something in the orthographic syllable they succeed) + +# [Not derivable] + +00B2..00B3 ; Syllable_Modifier # No [2] SUPERSCRIPT TWO..SUPERSCRIPT THREE +09FE ; Syllable_Modifier # Mn BENGALI SANDHI MARK +0F35 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0FC6 ; Syllable_Modifier # Mn TIBETAN SYMBOL PADMA GDAN +17CB ; Syllable_Modifier # Mn KHMER SIGN BANTOC +17CE..17D0 ; Syllable_Modifier # Mn [3] KHMER SIGN KAKABAT..KHMER SIGN SAMYOK SANNYA +17D3 ; Syllable_Modifier # Mn KHMER SIGN BATHAMASAT +17DD ; Syllable_Modifier # Mn KHMER SIGN ATTHACAN +193B ; Syllable_Modifier # Mn LIMBU SIGN SA-I +1A7B..1A7C ; Syllable_Modifier # Mn [2] TAI THAM SIGN MAI SAM..TAI THAM SIGN KHUEN-LUE KARAN +1A7F ; Syllable_Modifier # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1C36 ; Syllable_Modifier # Mn LEPCHA SIGN RAN +1DFB ; Syllable_Modifier # Mn COMBINING DELETION MARK +2074 ; Syllable_Modifier # No SUPERSCRIPT FOUR +2082..2084 ; Syllable_Modifier # No [3] SUBSCRIPT TWO..SUBSCRIPT FOUR +111C9 ; Syllable_Modifier # Mn SHARADA SANDHI MARK +1145E ; Syllable_Modifier # Mn NEWA SANDHI MARK +11A33 ; Syllable_Modifier # Mn ZANABAZAR SQUARE FINAL CONSONANT MARK + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Killer + +# Consonant Killer (signifies that the previous consonant or consonants are +# not pronounced) + +# [Not derivable] + +0E4C ; Consonant_Killer # Mn THAI CHARACTER THANTHAKHAT +17CD ; Consonant_Killer # Mn KHMER SIGN TOANDAKHIAT + +# ================================================ + +# Indic_Syllabic_Category=Non_Joiner + +# Non_Joiner (Zero Width Non-Joiner) + +# [Not derivable] + +200C ; Non_Joiner # Cf ZERO WIDTH NON-JOINER + +# ================================================ + +# Indic_Syllabic_Category=Joiner + +# Joiner (Zero Width Joiner) + +# [Not derivable] + +200D ; Joiner # Cf ZERO WIDTH JOINER + +# 
================================================ + +# Indic_Syllabic_Category=Number_Joiner + +# Number_Joiner (forms ligatures between numbers for multiplication) + +# [Not derivable] + +1107F ; Number_Joiner # Mn BRAHMI NUMBER JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number + +# Number (can be used as vowel-holders like consonant placeholders) +# Note: A number may even hold subjoined consonants which may in turn +# have been formed using a virama or a stacker, e.g. the sequence +# where THAI THAM LETTER LOW TA is subjoined to +# TAI THAM THAM DIGIT THREE using an invisible stacker. + +# [Not derivable] + +0030..0039 ; Number # Nd [10] DIGIT ZERO..DIGIT NINE +0966..096F ; Number # Nd [10] DEVANAGARI DIGIT ZERO..DEVANAGARI DIGIT NINE +09E6..09EF ; Number # Nd [10] BENGALI DIGIT ZERO..BENGALI DIGIT NINE +0A66..0A6F ; Number # Nd [10] GURMUKHI DIGIT ZERO..GURMUKHI DIGIT NINE +0AE6..0AEF ; Number # Nd [10] GUJARATI DIGIT ZERO..GUJARATI DIGIT NINE +0B66..0B6F ; Number # Nd [10] ORIYA DIGIT ZERO..ORIYA DIGIT NINE +0BE6..0BEF ; Number # Nd [10] TAMIL DIGIT ZERO..TAMIL DIGIT NINE +0C66..0C6F ; Number # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE +0CE6..0CEF ; Number # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE +0D66..0D6F ; Number # Nd [10] MALAYALAM DIGIT ZERO..MALAYALAM DIGIT NINE +0DE6..0DEF ; Number # Nd [10] SINHALA LITH DIGIT ZERO..SINHALA LITH DIGIT NINE +0E50..0E59 ; Number # Nd [10] THAI DIGIT ZERO..THAI DIGIT NINE +0ED0..0ED9 ; Number # Nd [10] LAO DIGIT ZERO..LAO DIGIT NINE +0F20..0F29 ; Number # Nd [10] TIBETAN DIGIT ZERO..TIBETAN DIGIT NINE +0F2A..0F33 ; Number # No [10] TIBETAN DIGIT HALF ONE..TIBETAN DIGIT HALF ZERO +1040..1049 ; Number # Nd [10] MYANMAR DIGIT ZERO..MYANMAR DIGIT NINE +1090..1099 ; Number # Nd [10] MYANMAR SHAN DIGIT ZERO..MYANMAR SHAN DIGIT NINE +17E0..17E9 ; Number # Nd [10] KHMER DIGIT ZERO..KHMER DIGIT NINE +1946..194F ; Number # Nd [10] LIMBU DIGIT ZERO..LIMBU DIGIT NINE 
+19D0..19D9 ; Number # Nd [10] NEW TAI LUE DIGIT ZERO..NEW TAI LUE DIGIT NINE +19DA ; Number # No NEW TAI LUE THAM DIGIT ONE +1A80..1A89 ; Number # Nd [10] TAI THAM HORA DIGIT ZERO..TAI THAM HORA DIGIT NINE +1A90..1A99 ; Number # Nd [10] TAI THAM THAM DIGIT ZERO..TAI THAM THAM DIGIT NINE +1B50..1B59 ; Number # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE +1BB0..1BB9 ; Number # Nd [10] SUNDANESE DIGIT ZERO..SUNDANESE DIGIT NINE +1C40..1C49 ; Number # Nd [10] LEPCHA DIGIT ZERO..LEPCHA DIGIT NINE +A8D0..A8D9 ; Number # Nd [10] SAURASHTRA DIGIT ZERO..SAURASHTRA DIGIT NINE +A900..A909 ; Number # Nd [10] KAYAH LI DIGIT ZERO..KAYAH LI DIGIT NINE +A9D0..A9D9 ; Number # Nd [10] JAVANESE DIGIT ZERO..JAVANESE DIGIT NINE +A9F0..A9F9 ; Number # Nd [10] MYANMAR TAI LAING DIGIT ZERO..MYANMAR TAI LAING DIGIT NINE +AA50..AA59 ; Number # Nd [10] CHAM DIGIT ZERO..CHAM DIGIT NINE +ABF0..ABF9 ; Number # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE +10A40..10A48 ; Number # No [9] KHAROSHTHI DIGIT ONE..KHAROSHTHI FRACTION ONE HALF +11066..1106F ; Number # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11136..1113F ; Number # Nd [10] CHAKMA DIGIT ZERO..CHAKMA DIGIT NINE +111D0..111D9 ; Number # Nd [10] SHARADA DIGIT ZERO..SHARADA DIGIT NINE +111E1..111F4 ; Number # No [20] SINHALA ARCHAIC DIGIT ONE..SINHALA ARCHAIC NUMBER ONE THOUSAND +112F0..112F9 ; Number # Nd [10] KHUDAWADI DIGIT ZERO..KHUDAWADI DIGIT NINE +11450..11459 ; Number # Nd [10] NEWA DIGIT ZERO..NEWA DIGIT NINE +114D0..114D9 ; Number # Nd [10] TIRHUTA DIGIT ZERO..TIRHUTA DIGIT NINE +11650..11659 ; Number # Nd [10] MODI DIGIT ZERO..MODI DIGIT NINE +116C0..116C9 ; Number # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE +11730..11739 ; Number # Nd [10] AHOM DIGIT ZERO..AHOM DIGIT NINE +1173A..1173B ; Number # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY +11C50..11C59 ; Number # Nd [10] BHAIKSUKI DIGIT ZERO..BHAIKSUKI DIGIT NINE +11C5A..11C6C ; Number # No [19] BHAIKSUKI NUMBER ONE..BHAIKSUKI HUNDREDS UNIT MARK 
+11D50..11D59 ; Number # Nd [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE +11DA0..11DA9 ; Number # Nd [10] GUNJALA GONDI DIGIT ZERO..GUNJALA GONDI DIGIT NINE + +# ================================================ + +# Indic_Syllabic_Category=Brahmi_Joining_Number + +# Brahmi Joining Number (similar to Number in that in can be used as +# vowel-holders like Consonant_Placeholder, but may also be joined by +# a Number_Joiner of the same script, e.g. in Brahmi) + +# [Not derivable] + +11052..11065 ; Brahmi_Joining_Number # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND + +# EOF diff --git a/data/12.1.0-indic-positional-category.txt b/data/12.1.0-indic-positional-category.txt new file mode 100644 index 0000000..24a82b3 --- /dev/null +++ b/data/12.1.0-indic-positional-category.txt @@ -0,0 +1,755 @@ +# IndicPositionalCategory-12.1.0.txt +# Date: 2019-03-08, 23:59:00 GMT [KW, RP] +# © 2019 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Positional_Category enumerated property +# +# Scope: This property is aimed at the problem of +# the specification of syllabic structure for Indic scripts. +# Because dependent vowels (matras), visible viramas, and other +# characters are placed in notional slots around the consonant (or +# consonant cluster) core of an Indic syllable, there may be +# cooccurrence constraints or other interactions. Also, it may be +# desirable, in cases where more than one such character may occur in +# sequence, as for example, in a top slot and a bottom slot, to +# specify preferred orders for spelling. As such, this property +# is designed primarily to supplement the Indic_Syllabic_Category +# property. 
+# +# Note that this property is *not* intended as +# a prescriptive property regarding display or font design, +# for a number of reasons. Good font design requires information +# that is outside the context of a character encoding standard, +# and is best handled in other venues. For Indic dependent +# vowels and similar characters, in particular: +# +# 1. Matra placement may vary somewhat based on typeface design. +# 2. Matra placement, even within a single script, may vary +# somewhat according to historic period or local conventions. +# 3. Matra placement may be changed by explicit orthographic reform +# decisions. +# 4. Matras may ligate in various ways with a consonant (or even +# other elements of a syllable) instead of occurring in a +# discrete location. +# 5. Matra display may be contextually determined. This is +# notable, for example, in the Tamil script, where the shape +# and placement of -u and -uu vowels depends strongly on +# which consonant they adjoin. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Positional_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. 
+# +# The scripts assessed as containing dependent vowels or similar characters +# in the structural sense used for the Indic_Positional_Category are the +# following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dogra, Grantha, Gujarati, Gunjala Gondi, +# Gurmukhi, Hanunoo, Javanese, Kaithi, Kannada, Kharoshthi, Khmer, +# Khojki, Khudawadi, Lao, Lepcha, Limbu, Makasar, Malayalam, Marchen, +# Masaram Gondi, Meetei Mayek, Modi, Myanmar, Nandinagari, Newa, +# New Tai Lue, Oriya, Rejang, Saurashtra, Sharada, Siddham, Sinhala, +# Soyombo, Sundanese, Syloti Nagri, Tagalog, Tagbanwa, Tai Tham, Tai +# Viet, Takri, Tamil, Telugu, Thai, Tibetan, Tirhuta, and Zanabazar +# Square. +# +# All characters for all other scripts not in that list +# take the default value for this property. +# +# See IndicSyllabicCategory.txt for a slightly more extended +# list of Indic scripts, including those which do not have +# positional characters. Currently, those additional +# Indic scripts without positional characters are +# Kayah Li, Mahajani, Multani, Phags-pa, and Tai Le. +# +# Notes: +# +# 1. The following characters are all assigned the positional category Right, +# but may have different positions in some cases: +# * U+0BC1 TAMIL VOWEL SIGN U and U+0BC2 TAMIL VOWEL SIGN UU have +# contextually variable placement in Tamil. +# * U+0D41 MALAYALAM VOWEL SIGN U and U+0D42 MALAYALAM VOWEL SIGN UU form +# complex ligatures with consonants in older Malayalam orthography. +# * U+11341 GRANTHA VOWEL SIGN U and U+11342 GRANTHA VOWEL SIGN UU have +# contextually variable placement in Grantha. +# * U+11440 NEWA VOWEL SIGN O and U+11441 NEWA VOWEL SIGN AU have contextually +# variable placement in Newa. +# +# 2. 
The following characters are all assigned the positional category Top, +# but may have different positions in some cases: +# * U+1143E NEWA VOWEL SIGN E and U+1143F NEWA VOWEL SIGN AI have contextually +# variable placement in Newa. +# +# 3. The following characters are all assigned the positional category Bottom, +# but may have different positions in some cases: +# * U+102F MYANMAR VOWEL SIGN U and U+1030 MYANMAR VOWEL SIGN UU have +# contextually variable placement in Myanmar. +# * U+1A69 TAI THAM VOWEL SIGN U and U+1A6A TAI THAM VOWEL SIGN UU have +# contextually variable placement in Tai Tham. +# +# 4. The following character is assigned the positional category Left, but +# may have different positions in different styles: +# * U+119D2 NANDINAGARI VOWEL SIGN I has stylistically variable placement +# in Nandinagari. + + +# ================================================ + +# Property: Indic_Positional_Category +# +# All code points not explicitly listed for Indic_Positional_Category +# have the value NA (not applicable). 
+# +# @missing: 0000..10FFFF; NA + +# ------------------------------------------------ + +# Indic_Positional_Category=Right + +0903 ; Right # Mc DEVANAGARI SIGN VISARGA +093B ; Right # Mc DEVANAGARI VOWEL SIGN OOE +093E ; Right # Mc DEVANAGARI VOWEL SIGN AA +0940 ; Right # Mc DEVANAGARI VOWEL SIGN II +0949..094C ; Right # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094F ; Right # Mc DEVANAGARI VOWEL SIGN AW +0982..0983 ; Right # Mc [2] BENGALI SIGN ANUSVARA..BENGALI SIGN VISARGA +09BE ; Right # Mc BENGALI VOWEL SIGN AA +09C0 ; Right # Mc BENGALI VOWEL SIGN II +09D7 ; Right # Mc BENGALI AU LENGTH MARK +0A03 ; Right # Mc GURMUKHI SIGN VISARGA +0A3E ; Right # Mc GURMUKHI VOWEL SIGN AA +0A40 ; Right # Mc GURMUKHI VOWEL SIGN II +0A83 ; Right # Mc GUJARATI SIGN VISARGA +0ABE ; Right # Mc GUJARATI VOWEL SIGN AA +0AC0 ; Right # Mc GUJARATI VOWEL SIGN II +0ACB..0ACC ; Right # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0B02..0B03 ; Right # Mc [2] ORIYA SIGN ANUSVARA..ORIYA SIGN VISARGA +0B3E ; Right # Mc ORIYA VOWEL SIGN AA +0B40 ; Right # Mc ORIYA VOWEL SIGN II +0BBE..0BBF ; Right # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC1..0BC2 ; Right # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BD7 ; Right # Mc TAMIL AU LENGTH MARK +0C01..0C03 ; Right # Mc [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN VISARGA +0C41..0C44 ; Right # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C82..0C83 ; Right # Mc [2] KANNADA SIGN ANUSVARA..KANNADA SIGN VISARGA +0CBE ; Right # Mc KANNADA VOWEL SIGN AA +0CC1..0CC4 ; Right # Mc [4] KANNADA VOWEL SIGN U..KANNADA VOWEL SIGN VOCALIC RR +0CD5..0CD6 ; Right # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0D02..0D03 ; Right # Mc [2] MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA +0D3E..0D40 ; Right # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D42 ; Right # Mn [2] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN UU +0D57 ; Right # Mc MALAYALAM AU LENGTH MARK +0D82..0D83 ; Right # 
Mc [2] SINHALA SIGN ANUSVARAYA..SINHALA SIGN VISARGAYA +0DCF..0DD1 ; Right # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD8 ; Right # Mc SINHALA VOWEL SIGN GAETTA-PILLA +0DDF ; Right # Mc SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Right # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Right # Lo THAI CHARACTER SARA A +0E32..0E33 ; Right # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E45 ; Right # Lo THAI CHARACTER LAKKHANGYAO +0EB0 ; Right # Lo LAO VOWEL SIGN A +0EB2..0EB3 ; Right # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0F3E ; Right # Mc TIBETAN SIGN YAR TSHES +0F7F ; Right # Mc TIBETAN SIGN RNAM BCAD +102B..102C ; Right # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +1038 ; Right # Mc MYANMAR SIGN VISARGA +103B ; Right # Mc MYANMAR CONSONANT SIGN MEDIAL YA +1056..1057 ; Right # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1062..1064 ; Right # Mc [3] MYANMAR VOWEL SIGN SGAW KAREN EU..MYANMAR TONE MARK SGAW KAREN KE PHO +1067..106D ; Right # Mc [7] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1083 ; Right # Mc MYANMAR VOWEL SIGN SHAN AA +1087..108C ; Right # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108F ; Right # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109C ; Right # Mc [3] MYANMAR SIGN KHAMTI TONE-1..MYANMAR VOWEL SIGN AITON A +17B6 ; Right # Mc KHMER VOWEL SIGN AA +17C7..17C8 ; Right # Mc [2] KHMER SIGN REAHMUK..KHMER SIGN YUUKALEAPINTU +1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI +1929..192B ; Right # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1930..1931 ; Right # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Right # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +19B0..19B4 ; Right # Lo [5] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN UU +19B8..19B9 ; Right # Lo [2] NEW TAI LUE VOWEL 
SIGN OA..NEW TAI LUE VOWEL SIGN UE +19BB..19C0 ; Right # Lo [6] NEW TAI LUE VOWEL SIGN AAY..NEW TAI LUE VOWEL SIGN IY +19C8..19C9 ; Right # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A1A ; Right # Mc BUGINESE VOWEL SIGN O +1A57 ; Right # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A61 ; Right # Mc TAI THAM VOWEL SIGN A +1A63..1A64 ; Right # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A6D ; Right # Mc TAI THAM VOWEL SIGN OY +1B04 ; Right # Mc BALINESE SIGN BISAH +1B35 ; Right # Mc BALINESE VOWEL SIGN TEDUNG +1B44 ; Right # Mc BALINESE ADEG ADEG +1B82 ; Right # Mc SUNDANESE SIGN PANGWISAD +1BA1 ; Right # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA7 ; Right # Mc SUNDANESE VOWEL SIGN PANOLONG +1BAA ; Right # Mc SUNDANESE SIGN PAMAAEH +1BE7 ; Right # Mc BATAK VOWEL SIGN E +1BEA..1BEC ; Right # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BEE ; Right # Mc BATAK VOWEL SIGN U +1BF2..1BF3 ; Right # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +1C24..1C26 ; Right # Mc [3] LEPCHA SUBJOINED LETTER YA..LEPCHA VOWEL SIGN AA +1C2A..1C2B ; Right # Mc [2] LEPCHA VOWEL SIGN U..LEPCHA VOWEL SIGN UU +1CE1 ; Right # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF7 ; Right # Mc VEDIC SIGN ATIKRAMA +A823..A824 ; Right # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A827 ; Right # Mc SYLOTI NAGRI VOWEL SIGN OO +A880..A881 ; Right # Mc [2] SAURASHTRA SIGN ANUSVARA..SAURASHTRA SIGN VISARGA +A8B4..A8C3 ; Right # Mc [16] SAURASHTRA CONSONANT SIGN HAARU..SAURASHTRA VOWEL SIGN AU +A952..A953 ; Right # Mc [2] REJANG CONSONANT SIGN H..REJANG VIRAMA +A983 ; Right # Mc JAVANESE SIGN WIGNYAN +A9B4..A9B5 ; Right # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9BE ; Right # Mc JAVANESE CONSONANT SIGN PENGKAL +AA33 ; Right # Mc CHAM CONSONANT SIGN YA +AA4D ; Right # Mc CHAM CONSONANT SIGN FINAL H +AA7B ; Right # Mc MYANMAR SIGN PAO KAREN TONE +AA7D ; Right # Mc MYANMAR SIGN TAI LAING TONE-5 +AAB1 ; Right # Lo TAI VIET VOWEL AA +AABA ; Right 
# Lo TAI VIET VOWEL UA +AABD ; Right # Lo TAI VIET VOWEL AN +AAEF ; Right # Mc MEETEI MAYEK VOWEL SIGN AAU +AAF5 ; Right # Mc MEETEI MAYEK VOWEL SIGN VISARGA +ABE3..ABE4 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE6..ABE7 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE9..ABEA ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +ABEC ; Right # Mc MEETEI MAYEK LUM IYEK +11000 ; Right # Mc BRAHMI SIGN CANDRABINDU +11002 ; Right # Mc BRAHMI SIGN VISARGA +11082 ; Right # Mc KAITHI SIGN VISARGA +110B0 ; Right # Mc KAITHI VOWEL SIGN AA +110B2 ; Right # Mc KAITHI VOWEL SIGN II +110B7..110B8 ; Right # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11145..11146 ; Right # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +11182 ; Right # Mc SHARADA SIGN VISARGA +111B3 ; Right # Mc SHARADA VOWEL SIGN AA +111B5 ; Right # Mc SHARADA VOWEL SIGN II +111C0 ; Right # Mc SHARADA SIGN VIRAMA +1122C..1122E ; Right # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +11235 ; Right # Mc KHOJKI SIGN VIRAMA +112E0 ; Right # Mc KHUDAWADI VOWEL SIGN AA +112E2 ; Right # Mc KHUDAWADI VOWEL SIGN II +11302..11303 ; Right # Mc [2] GRANTHA SIGN ANUSVARA..GRANTHA SIGN VISARGA +1133E..1133F ; Right # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11341..11344 ; Right # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +1134D ; Right # Mc GRANTHA SIGN VIRAMA +11357 ; Right # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Right # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435 ; Right # Mc NEWA VOWEL SIGN AA +11437 ; Right # Mc NEWA VOWEL SIGN II +11440..11441 ; Right # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +11445 ; Right # Mc NEWA SIGN VISARGA +114B0 ; Right # Mc TIRHUTA VOWEL SIGN AA +114B2 ; Right # Mc TIRHUTA VOWEL SIGN II +114BD ; Right # Mc TIRHUTA VOWEL SIGN SHORT O +114C1 ; Right # Mc TIRHUTA SIGN VISARGA +115AF ; Right # Mc SIDDHAM VOWEL SIGN AA 
+115B1 ; Right # Mc SIDDHAM VOWEL SIGN II +115BE ; Right # Mc SIDDHAM SIGN VISARGA +11630..11632 ; Right # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +1163B..1163C ; Right # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +1163E ; Right # Mc MODI SIGN VISARGA +116AC ; Right # Mc TAKRI SIGN VISARGA +116AF ; Right # Mc TAKRI VOWEL SIGN II +116B6 ; Right # Mc TAKRI SIGN VIRAMA +11720..11721 ; Right # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +1182C ; Right # Mc DOGRA VOWEL SIGN AA +1182E ; Right # Mc DOGRA VOWEL SIGN II +11838 ; Right # Mc DOGRA SIGN VISARGA +119D1 ; Right # Mc NANDINAGARI VOWEL SIGN AA +119D3 ; Right # Mc NANDINAGARI VOWEL SIGN II +119DC..119DF ; Right # Mc [4] NANDINAGARI VOWEL SIGN O..NANDINAGARI SIGN VISARGA +11A39 ; Right # Mc ZANABAZAR SQUARE SIGN VISARGA +11A57..11A58 ; Right # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A97 ; Right # Mc SOYOMBO SIGN VISARGA +11C2F ; Right # Mc BHAIKSUKI VOWEL SIGN AA +11C3E ; Right # Mc BHAIKSUKI SIGN VISARGA +11CA9 ; Right # Mc MARCHEN SUBJOINED LETTER YA +11CB4 ; Right # Mc MARCHEN VOWEL SIGN O +11D8A..11D8E ; Right # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D93..11D94 ; Right # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11D96 ; Right # Mc GUNJALA GONDI SIGN VISARGA +11EF6 ; Right # Mc MAKASAR VOWEL SIGN O + +# Indic_Positional_Category=Left + +093F ; Left # Mc DEVANAGARI VOWEL SIGN I +094E ; Left # Mc DEVANAGARI VOWEL SIGN PRISHTHAMATRA E +09BF ; Left # Mc BENGALI VOWEL SIGN I +09C7..09C8 ; Left # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +0A3F ; Left # Mc GURMUKHI VOWEL SIGN I +0ABF ; Left # Mc GUJARATI VOWEL SIGN I +0B47 ; Left # Mc ORIYA VOWEL SIGN E +0BC6..0BC8 ; Left # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0D46..0D48 ; Left # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0DD9 ; Left # Mc SINHALA VOWEL SIGN KOMBUVA +0DDB ; Left # Mc SINHALA VOWEL SIGN KOMBU DEKA +0F3F ; Left # Mc TIBETAN SIGN MAR TSHES +1031 ; 
Left # Mc MYANMAR VOWEL SIGN E +1084 ; Left # Mc MYANMAR VOWEL SIGN SHAN E +17C1..17C3 ; Left # Mc [3] KHMER VOWEL SIGN E..KHMER VOWEL SIGN AI +1A19 ; Left # Mc BUGINESE VOWEL SIGN E +1A55 ; Left # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A6E..1A72 ; Left # Mc [5] TAI THAM VOWEL SIGN E..TAI THAM VOWEL SIGN THAM AI +1B3E..1B3F ; Left # Mc [2] BALINESE VOWEL SIGN TALING..BALINESE VOWEL SIGN TALING REPA +1BA6 ; Left # Mc SUNDANESE VOWEL SIGN PANAELAENG +1C27..1C28 ; Left # Mc [2] LEPCHA VOWEL SIGN I..LEPCHA VOWEL SIGN O +1C34..1C35 ; Left # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A9BA..A9BB ; Left # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +AA2F..AA30 ; Left # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA34 ; Left # Mc CHAM CONSONANT SIGN RA +AAEB ; Left # Mc MEETEI MAYEK VOWEL SIGN II +AAEE ; Left # Mc MEETEI MAYEK VOWEL SIGN AU +110B1 ; Left # Mc KAITHI VOWEL SIGN I +1112C ; Left # Mc CHAKMA VOWEL SIGN E +111B4 ; Left # Mc SHARADA VOWEL SIGN I +112E1 ; Left # Mc KHUDAWADI VOWEL SIGN I +11347..11348 ; Left # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +11436 ; Left # Mc NEWA VOWEL SIGN I +114B1 ; Left # Mc TIRHUTA VOWEL SIGN I +114B9 ; Left # Mc TIRHUTA VOWEL SIGN E +115B0 ; Left # Mc SIDDHAM VOWEL SIGN I +115B8 ; Left # Mc SIDDHAM VOWEL SIGN E +116AE ; Left # Mc TAKRI VOWEL SIGN I +11726 ; Left # Mc AHOM VOWEL SIGN E +1182D ; Left # Mc DOGRA VOWEL SIGN I +119D2 ; Left # Mc NANDINAGARI VOWEL SIGN I +119E4 ; Left # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E +11CB1 ; Left # Mc MARCHEN VOWEL SIGN I +11EF5 ; Left # Mc MAKASAR VOWEL SIGN E + +# Indic_Positional_Category=Visual_Order_Left + +# These are dependent vowels that occur to the left of the consonant +# letter in a syllable, but which occur in scripts using the visual order +# model, instead of the logical order model. 
Because of the different +# model, these left-side vowels occur first in the backing store (before +# the consonant letter) and are not reordered during text rendering. +# +# [Derivation: Logical_Order_Exception=Yes] + +0E40..0E44 ; Visual_Order_Left # Lo [5] THAI CHARACTER SARA E..THAI CHARACTER SARA AI MAIMALAI +0EC0..0EC4 ; Visual_Order_Left # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +19B5..19B7 ; Visual_Order_Left # Lo [3] NEW TAI LUE VOWEL SIGN E..NEW TAI LUE VOWEL SIGN O +19BA ; Visual_Order_Left # Lo NEW TAI LUE VOWEL SIGN AY +AAB5..AAB6 ; Visual_Order_Left # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB9 ; Visual_Order_Left # Lo TAI VIET VOWEL UEA +AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL AY + +# Indic_Positional_Category=Left_And_Right + +09CB..09CC ; Left_And_Right # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +0B4B ; Left_And_Right # Mc ORIYA VOWEL SIGN O +0BCA..0BCC ; Left_And_Right # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0D4A..0D4C ; Left_And_Right # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0DDC ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA +0DDE ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA +17C0 ; Left_And_Right # Mc KHMER VOWEL SIGN IE +17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU +1B40..1B41 ; Left_And_Right # Mc [2] BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1134B..1134C ; Left_And_Right # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +114BC ; Left_And_Right # Mc TIRHUTA VOWEL SIGN O +114BE ; Left_And_Right # Mc TIRHUTA VOWEL SIGN AU +115BA ; Left_And_Right # Mc SIDDHAM VOWEL SIGN O + +# Indic_Positional_Category=Top + +0900..0902 ; Top # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +093A ; Top # Mn DEVANAGARI VOWEL SIGN OE +0945..0948 ; Top # Mn [4] DEVANAGARI VOWEL SIGN CANDRA E..DEVANAGARI VOWEL SIGN AI +0951 ; Top # Mn DEVANAGARI STRESS SIGN 
UDATTA +0953..0955 ; Top # Mn [3] DEVANAGARI GRAVE ACCENT..DEVANAGARI VOWEL SIGN CANDRA LONG E +0981 ; Top # Mn BENGALI SIGN CANDRABINDU +09FE ; Top # Mn BENGALI SANDHI MARK +0A01..0A02 ; Top # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A47..0A48 ; Top # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Top # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0A70..0A71 ; Top # Mn [2] GURMUKHI TIPPI..GURMUKHI ADDAK +0A81..0A82 ; Top # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0AC5 ; Top # Mn GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Top # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AFA..0AFF ; Top # Mn [6] GUJARATI SIGN SUKUN..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B01 ; Top # Mn ORIYA SIGN CANDRABINDU +0B3F ; Top # Mn ORIYA VOWEL SIGN I +0B56 ; Top # Mn ORIYA AI LENGTH MARK +0B82 ; Top # Mn TAMIL SIGN ANUSVARA +0BC0 ; Top # Mn TAMIL VOWEL SIGN II +0BCD ; Top # Mn TAMIL SIGN VIRAMA +0C00 ; Top # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C04 ; Top # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C3E..0C40 ; Top # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C46..0C47 ; Top # Mn [2] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN EE +0C4A..0C4D ; Top # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA +0C55 ; Top # Mn TELUGU LENGTH MARK +0C81 ; Top # Mn KANNADA SIGN CANDRABINDU +0CBF ; Top # Mn KANNADA VOWEL SIGN I +0CC6 ; Top # Mn KANNADA VOWEL SIGN E +0CCC..0CCD ; Top # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA +0D00..0D01 ; Top # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D3B..0D3C ; Top # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0D4D ; Top # Mn MALAYALAM SIGN VIRAMA +0DCA ; Top # Mn SINHALA SIGN AL-LAKUNA +0DD2..0DD3 ; Top # Mn [2] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN DIGA IS-PILLA +0E31 ; Top # Mn THAI CHARACTER MAI HAN-AKAT +0E34..0E37 ; Top # Mn [4] THAI CHARACTER SARA I..THAI CHARACTER SARA UEE +0E47..0E4E ; Top # 
Mn [8] THAI CHARACTER MAITAIKHU..THAI CHARACTER YAMAKKAN +0EB1 ; Top # Mn LAO VOWEL SIGN MAI KAN +0EB4..0EB7 ; Top # Mn [4] LAO VOWEL SIGN I..LAO VOWEL SIGN YY +0EBB ; Top # Mn LAO VOWEL SIGN MAI KON +0EC8..0ECD ; Top # Mn [6] LAO TONE MAI EK..LAO NIGGAHITA +0F39 ; Top # Mn TIBETAN MARK TSA -PHRU +0F72 ; Top # Mn TIBETAN VOWEL SIGN I +0F7A..0F7E ; Top # Mn [5] TIBETAN VOWEL SIGN E..TIBETAN SIGN RJES SU NGA RO +0F80 ; Top # Mn TIBETAN VOWEL SIGN REVERSED I +0F82..0F83 ; Top # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +0F86..0F87 ; Top # Mn [2] TIBETAN SIGN LCI RTAGS..TIBETAN SIGN YANG RTAGS +102D..102E ; Top # Mn [2] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN II +1032..1036 ; Top # Mn [5] MYANMAR VOWEL SIGN AI..MYANMAR SIGN ANUSVARA +103A ; Top # Mn MYANMAR SIGN ASAT +1071..1074 ; Top # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1085..1086 ; Top # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109D ; Top # Mn MYANMAR VOWEL SIGN AITON AI +1712 ; Top # Mn TAGALOG VOWEL SIGN I +1732 ; Top # Mn HANUNOO VOWEL SIGN I +1752 ; Top # Mn BUHID VOWEL SIGN I +1772 ; Top # Mn TAGBANWA VOWEL SIGN I +17B7..17BA ; Top # Mn [4] KHMER VOWEL SIGN I..KHMER VOWEL SIGN YY +17C6 ; Top # Mn KHMER SIGN NIKAHIT +17C9..17D1 ; Top # Mn [9] KHMER SIGN MUUSIKATOAN..KHMER SIGN VIRIAM +17D3 ; Top # Mn KHMER SIGN BATHAMASAT +17DD ; Top # Mn KHMER SIGN ATTHACAN +1920..1921 ; Top # Mn [2] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN I +1927..1928 ; Top # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Top # Mn LIMBU SIGN KEMPHRENG +1A17 ; Top # Mn BUGINESE VOWEL SIGN I +1A1B ; Top # Mn BUGINESE VOWEL SIGN AE +1A58..1A5A ; Top # Mn [3] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN LOW PA +1A62 ; Top # Mn TAI THAM VOWEL SIGN MAI SAT +1A65..1A68 ; Top # Mn [4] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN UUE +1A6B ; Top # Mn TAI THAM VOWEL SIGN O +1A73..1A7C ; Top # Mn [10] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN KHUEN-LUE KARAN 
+1B00..1B03 ; Top # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG +1B34 ; Top # Mn BALINESE SIGN REREKAN +1B36..1B37 ; Top # Mn [2] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN ULU SARI +1B42 ; Top # Mn BALINESE VOWEL SIGN PEPET +1B6B ; Top # Mn BALINESE MUSICAL SYMBOL COMBINING TEGEH +1B6D..1B73 ; Top # Mn [7] BALINESE MUSICAL SYMBOL COMBINING KEMPUL..BALINESE MUSICAL SYMBOL COMBINING GONG +1B80..1B81 ; Top # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR +1BA4 ; Top # Mn SUNDANESE VOWEL SIGN PANGHULU +1BA8..1BA9 ; Top # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE6 ; Top # Mn BATAK SIGN TOMPI +1BE8..1BE9 ; Top # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BED ; Top # Mn BATAK VOWEL SIGN KARO O +1BEF..1BF1 ; Top # Mn [3] BATAK VOWEL SIGN U FOR SIMALUNGUN SA..BATAK CONSONANT SIGN H +1C2D..1C33 ; Top # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +1C36 ; Top # Mn LEPCHA SIGN RAN +1CD0..1CD2 ; Top # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CDA..1CDB ; Top # Mn [2] VEDIC TONE DOUBLE SVARITA..VEDIC TONE TRIPLE SVARITA +1CE0 ; Top # Mn VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CF4 ; Top # Mn VEDIC TONE CANDRA ABOVE +1DFB ; Top # Mn COMBINING DELETION MARK +20F0 ; Top # Mn COMBINING ASTERISK ABOVE +A802 ; Top # Mn SYLOTI NAGRI SIGN DVISVARA +A806 ; Top # Mn SYLOTI NAGRI SIGN HASANTA +A80B ; Top # Mn SYLOTI NAGRI SIGN ANUSVARA +A826 ; Top # Mn SYLOTI NAGRI VOWEL SIGN E +A8C5 ; Top # Mn SAURASHTRA SIGN CANDRABINDU +A8E0..A8F1 ; Top # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +A8FF ; Top # Mn DEVANAGARI VOWEL SIGN AY +A94A ; Top # Mn REJANG VOWEL SIGN AI +A94F..A951 ; Top # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A980..A982 ; Top # Mn [3] JAVANESE SIGN PANYANGGA..JAVANESE SIGN LAYAR +A9B3 ; Top # Mn JAVANESE SIGN CECAK TELU +A9B6..A9B7 ; Top # Mn [2] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN WULU MELIK +A9BC ; Top # Mn JAVANESE VOWEL 
SIGN PEPET +A9E5 ; Top # Mn MYANMAR SIGN SHAN SAW +AA29..AA2C ; Top # Mn [4] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN EI +AA2E ; Top # Mn CHAM VOWEL SIGN OE +AA31 ; Top # Mn CHAM VOWEL SIGN AU +AA43 ; Top # Mn CHAM CONSONANT SIGN FINAL NG +AA4C ; Top # Mn CHAM CONSONANT SIGN FINAL M +AA7C ; Top # Mn MYANMAR SIGN TAI LAING TONE-2 +AAB0 ; Top # Mn TAI VIET MAI KANG +AAB2..AAB3 ; Top # Mn [2] TAI VIET VOWEL I..TAI VIET VOWEL UE +AAB7..AAB8 ; Top # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AABE..AABF ; Top # Mn [2] TAI VIET VOWEL AM..TAI VIET TONE MAI EK +AAC1 ; Top # Mn TAI VIET TONE MAI THO +AAED ; Top # Mn MEETEI MAYEK VOWEL SIGN AAI +ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP +10A05 ; Top # Mn KHAROSHTHI VOWEL SIGN E +10A0F ; Top # Mn KHAROSHTHI SIGN VISARGA +10A38 ; Top # Mn KHAROSHTHI SIGN BAR ABOVE +11001 ; Top # Mn BRAHMI SIGN ANUSVARA +11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II +11042..11046 ; Top # Mn [5] BRAHMI VOWEL SIGN E..BRAHMI VIRAMA +11080..11081 ; Top # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI VOWEL SIGN AI +11100..11102 ; Top # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA +11127..11129 ; Top # Mn [3] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN II +1112D ; Top # Mn CHAKMA VOWEL SIGN AI +11130 ; Top # Mn CHAKMA VOWEL SIGN OI +11134 ; Top # Mn CHAKMA MAAYYAA +11180..11181 ; Top # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +111BC..111BE ; Top # Mn [3] SHARADA VOWEL SIGN E..SHARADA VOWEL SIGN O +111CB ; Top # Mn SHARADA VOWEL MODIFIER MARK +11230..11231 ; Top # Mn [2] KHOJKI VOWEL SIGN E..KHOJKI VOWEL SIGN AI +11234 ; Top # Mn KHOJKI SIGN ANUSVARA +11236..11237 ; Top # Mn [2] KHOJKI SIGN NUKTA..KHOJKI SIGN SHADDA +1123E ; Top # Mn KHOJKI SIGN SUKUN +112DF ; Top # Mn KHUDAWADI SIGN ANUSVARA +112E5..112E8 ; Top # Mn [4] KHUDAWADI VOWEL SIGN E..KHUDAWADI VOWEL SIGN AU +11300..11301 ; Top # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN 
CANDRABINDU +11340 ; Top # Mn GRANTHA VOWEL SIGN II +11366..1136C ; Top # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Top # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA +1143E..1143F ; Top # Mn [2] NEWA VOWEL SIGN E..NEWA VOWEL SIGN AI +11443..11444 ; Top # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +1145E ; Top # Mn NEWA SANDHI MARK +114BA ; Top # Mn TIRHUTA VOWEL SIGN SHORT E +114BF..114C0 ; Top # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Top # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +11639..1163A ; Top # Mn [2] MODI VOWEL SIGN E..MODI VOWEL SIGN AI +1163D ; Top # Mn MODI SIGN ANUSVARA +11640 ; Top # Mn MODI SIGN ARDHACANDRA +116AB ; Top # Mn TAKRI SIGN ANUSVARA +116AD ; Top # Mn TAKRI VOWEL SIGN AA +116B2..116B5 ; Top # Mn [4] TAKRI VOWEL SIGN E..TAKRI VOWEL SIGN AU +1171F ; Top # Mn AHOM CONSONANT SIGN MEDIAL LIGATING RA +11722..11723 ; Top # Mn [2] AHOM VOWEL SIGN I..AHOM VOWEL SIGN II +11727 ; Top # Mn AHOM VOWEL SIGN AW +11729..1172B ; Top # Mn [3] AHOM VOWEL SIGN AI..AHOM SIGN KILLER +11833..11837 ; Top # Mn [5] DOGRA VOWEL SIGN E..DOGRA SIGN ANUSVARA +119DA..119DB ; Top # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI +11A01 ; Top # Mn ZANABAZAR SQUARE VOWEL SIGN I +11A04..11A09 ; Top # Mn [6] ZANABAZAR SQUARE VOWEL SIGN E..ZANABAZAR SQUARE VOWEL SIGN REVERSED I +11A35..11A38 ; Top # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A51 ; Top # Mn SOYOMBO VOWEL SIGN I +11A54..11A56 ; Top # Mn [3] SOYOMBO VOWEL SIGN E..SOYOMBO VOWEL SIGN OE +11A96 ; Top # Mn SOYOMBO SIGN ANUSVARA +11A98 ; Top # Mn SOYOMBO GEMINATION MARK +11C30..11C31 ; Top # Mn [2] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN II +11C38..11C3D ; Top # Mn [6] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI SIGN ANUSVARA +11CB3 ; Top # Mn MARCHEN VOWEL SIGN E +11CB5..11CB6 ; Top # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D31..11D35 ; Top # Mn [5] 
MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN UU +11D3A ; Top # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Top # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F..11D41 ; Top # Mn [3] MASARAM GONDI VOWEL SIGN AU..MASARAM GONDI SIGN VISARGA +11D43 ; Top # Mn MASARAM GONDI SIGN CANDRA +11D90..11D91 ; Top # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI +11D95 ; Top # Mn GUNJALA GONDI SIGN ANUSVARA +11EF3 ; Top # Mn MAKASAR VOWEL SIGN I + +# Indic_Positional_Category=Bottom + +093C ; Bottom # Mn DEVANAGARI SIGN NUKTA +0941..0944 ; Bottom # Mn [4] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN VOCALIC RR +094D ; Bottom # Mn DEVANAGARI SIGN VIRAMA +0952 ; Bottom # Mn DEVANAGARI STRESS SIGN ANUDATTA +0956..0957 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN UE..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BC ; Bottom # Mn BENGALI SIGN NUKTA +09C1..09C4 ; Bottom # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09CD ; Bottom # Mn BENGALI SIGN VIRAMA +09E2..09E3 ; Bottom # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3C ; Bottom # Mn GURMUKHI SIGN NUKTA +0A41..0A42 ; Bottom # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A4D ; Bottom # Mn GURMUKHI SIGN VIRAMA +0A51 ; Bottom # Mn GURMUKHI SIGN UDAAT +0A75 ; Bottom # Mn GURMUKHI SIGN YAKASH +0ABC ; Bottom # Mn GUJARATI SIGN NUKTA +0AC1..0AC4 ; Bottom # Mn [4] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN VOCALIC RR +0ACD ; Bottom # Mn GUJARATI SIGN VIRAMA +0AE2..0AE3 ; Bottom # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3C ; Bottom # Mn ORIYA SIGN NUKTA +0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B4D ; Bottom # Mn ORIYA SIGN VIRAMA +0B62..0B63 ; Bottom # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0C56 ; Bottom # Mn TELUGU AI LENGTH MARK +0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL 
SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBC ; Bottom # Mn KANNADA SIGN NUKTA +0CE2..0CE3 ; Bottom # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D43..0D44 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC R..MALAYALAM VOWEL SIGN VOCALIC RR +0D62..0D63 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DD4 ; Bottom # Mn SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Bottom # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0E38..0E3A ; Bottom # Mn [3] THAI CHARACTER SARA U..THAI CHARACTER PHINTHU +0EB8..0EBA ; Bottom # Mn [3] LAO VOWEL SIGN U..LAO SIGN PALI VIRAMA +0EBC ; Bottom # Mn LAO SEMIVOWEL SIGN LO +0F18..0F19 ; Bottom # Mn [2] TIBETAN ASTROLOGICAL SIGN -KHYUD PA..TIBETAN ASTROLOGICAL SIGN SDONG TSHUGS +0F35 ; Bottom # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Bottom # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0F71 ; Bottom # Mn TIBETAN VOWEL SIGN AA +0F74..0F75 ; Bottom # Mn [2] TIBETAN VOWEL SIGN U..TIBETAN VOWEL SIGN UU +0F84 ; Bottom # Mn TIBETAN MARK HALANTA +0F8D..0F97 ; Bottom # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Bottom # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +0FC6 ; Bottom # Mn TIBETAN SYMBOL PADMA GDAN +102F..1030 ; Bottom # Mn [2] MYANMAR VOWEL SIGN U..MYANMAR VOWEL SIGN UU +1037 ; Bottom # Mn MYANMAR SIGN DOT BELOW +103D..103E ; Bottom # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +1058..1059 ; Bottom # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +105E..1060 ; Bottom # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Bottom # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +108D ; Bottom # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +1713..1714 ; Bottom # Mn [2] TAGALOG VOWEL SIGN U..TAGALOG SIGN VIRAMA +1733..1734 ; Bottom # Mn [2] HANUNOO VOWEL SIGN U..HANUNOO SIGN PAMUDPOD +1753 ; Bottom # Mn BUHID VOWEL SIGN U +1773 ; Bottom # 
Mn TAGBANWA VOWEL SIGN U +17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA +1922 ; Bottom # Mn LIMBU VOWEL SIGN U +1932 ; Bottom # Mn LIMBU SMALL LETTER ANUSVARA +1939 ; Bottom # Mn LIMBU SIGN MUKPHRENG +193B ; Bottom # Mn LIMBU SIGN SA-I +1A18 ; Bottom # Mn BUGINESE VOWEL SIGN U +1A56 ; Bottom # Mn TAI THAM CONSONANT SIGN MEDIAL LA +1A5B..1A5E ; Bottom # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1A69..1A6A ; Bottom # Mn [2] TAI THAM VOWEL SIGN U..TAI THAM VOWEL SIGN UU +1A6C ; Bottom # Mn TAI THAM VOWEL SIGN OA BELOW +1A7F ; Bottom # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1B38..1B3A ; Bottom # Mn [3] BALINESE VOWEL SIGN SUKU..BALINESE VOWEL SIGN RA REPA +1B6C ; Bottom # Mn BALINESE MUSICAL SYMBOL COMBINING ENDEP +1BA2..1BA3 ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BA5 ; Bottom # Mn SUNDANESE VOWEL SIGN PANYUKU +1BAC..1BAD ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C2C ; Bottom # Mn LEPCHA VOWEL SIGN E +1C37 ; Bottom # Mn LEPCHA SIGN NUKTA +1CD5..1CD9 ; Bottom # Mn [5] VEDIC TONE YAJURVEDIC AGGRAVATED INDEPENDENT SVARITA..VEDIC TONE YAJURVEDIC KATHAKA INDEPENDENT SVARITA SCHROEDER +1CDC..1CDF ; Bottom # Mn [4] VEDIC TONE KATHAKA ANUDATTA..VEDIC TONE THREE DOTS BELOW +1CED ; Bottom # Mn VEDIC SIGN TIRYAK +A825 ; Bottom # Mn SYLOTI NAGRI VOWEL SIGN U +A8C4 ; Bottom # Mn SAURASHTRA SIGN VIRAMA +A92B..A92D ; Bottom # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +A947..A949 ; Bottom # Mn [3] REJANG VOWEL SIGN I..REJANG VOWEL SIGN E +A94B..A94E ; Bottom # Mn [4] REJANG VOWEL SIGN O..REJANG VOWEL SIGN EA +A9B8..A9B9 ; Bottom # Mn [2] JAVANESE VOWEL SIGN SUKU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BD ; Bottom # Mn JAVANESE CONSONANT SIGN KERET +AA2D ; Bottom # Mn CHAM VOWEL SIGN U +AA32 ; Bottom # Mn CHAM VOWEL SIGN UE +AA35..AA36 ; Bottom # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +AAB4 ; 
Bottom # Mn TAI VIET VOWEL U +AAEC ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UU +ABE8 ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK +10A02..10A03 ; Bottom # Mn [2] KHAROSHTHI VOWEL SIGN U..KHAROSHTHI VOWEL SIGN VOCALIC R +10A0C..10A0E ; Bottom # Mn [3] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN ANUSVARA +10A39..10A3A ; Bottom # Mn [2] KHAROSHTHI SIGN CAUDA..KHAROSHTHI SIGN DOT BELOW +1103C..11041 ; Bottom # Mn [6] BRAHMI VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL +110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU +110B9..110BA ; Bottom # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +1112A..1112B ; Bottom # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU +11131..11132 ; Bottom # Mn [2] CHAKMA O MARK..CHAKMA AU MARK +11173 ; Bottom # Mn MAHAJANI SIGN NUKTA +111B6..111BB ; Bottom # Mn [6] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN VOCALIC LL +111C9..111CA ; Bottom # Mn [2] SHARADA SANDHI MARK..SHARADA SIGN NUKTA +111CC ; Bottom # Mn SHARADA EXTRA SHORT VOWEL MARK +1122F ; Bottom # Mn KHOJKI VOWEL SIGN U +112E3..112E4 ; Bottom # Mn [2] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN UU +112E9..112EA ; Bottom # Mn [2] KHUDAWADI SIGN NUKTA..KHUDAWADI SIGN VIRAMA +1133B..1133C ; Bottom # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +11438..1143D ; Bottom # Mn [6] NEWA VOWEL SIGN U..NEWA VOWEL SIGN VOCALIC LL +11442 ; Bottom # Mn NEWA SIGN VIRAMA +11446 ; Bottom # Mn NEWA SIGN NUKTA +114B3..114B8 ; Bottom # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114C2..114C3 ; Bottom # Mn [2] TIRHUTA SIGN VIRAMA..TIRHUTA SIGN NUKTA +115B2..115B5 ; Bottom # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115BF..115C0 ; Bottom # Mn [2] SIDDHAM SIGN VIRAMA..SIDDHAM SIGN NUKTA +115DC..115DD ; Bottom # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11633..11638 ; Bottom # Mn [6] MODI VOWEL SIGN U..MODI VOWEL SIGN VOCALIC LL +1163F ; Bottom # Mn MODI SIGN VIRAMA +116B0..116B1 ; 
Bottom # Mn [2] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN UU +116B7 ; Bottom # Mn TAKRI SIGN NUKTA +1171D ; Bottom # Mn AHOM CONSONANT SIGN MEDIAL LA +11724..11725 ; Bottom # Mn [2] AHOM VOWEL SIGN U..AHOM VOWEL SIGN UU +11728 ; Bottom # Mn AHOM VOWEL SIGN O +1182F..11832 ; Bottom # Mn [4] DOGRA VOWEL SIGN U..DOGRA VOWEL SIGN VOCALIC RR +11839..1183A ; Bottom # Mn [2] DOGRA SIGN VIRAMA..DOGRA SIGN NUKTA +119D4..119D7 ; Bottom # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR +119E0 ; Bottom # Mn NANDINAGARI SIGN VIRAMA +11A02..11A03 ; Bottom # Mn [2] ZANABAZAR SQUARE VOWEL SIGN UE..ZANABAZAR SQUARE VOWEL SIGN U +11A0A ; Bottom # Mn ZANABAZAR SQUARE VOWEL LENGTH MARK +11A33..11A34 ; Bottom # Mn [2] ZANABAZAR SQUARE FINAL CONSONANT MARK..ZANABAZAR SQUARE SIGN VIRAMA +11A3B..11A3E ; Bottom # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11A52..11A53 ; Bottom # Mn [2] SOYOMBO VOWEL SIGN UE..SOYOMBO VOWEL SIGN U +11A59..11A5B ; Bottom # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11A8A..11A95 ; Bottom # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A +11C32..11C36 ; Bottom # Mn [5] BHAIKSUKI VOWEL SIGN U..BHAIKSUKI VOWEL SIGN VOCALIC L +11C3F ; Bottom # Mn BHAIKSUKI SIGN VIRAMA +11C92..11CA7 ; Bottom # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CAA..11CB0 ; Bottom # Mn [7] MARCHEN SUBJOINED LETTER RA..MARCHEN VOWEL SIGN AA +11CB2 ; Bottom # Mn MARCHEN VOWEL SIGN U +11D36 ; Bottom # Mn MASARAM GONDI VOWEL SIGN VOCALIC R +11D42 ; Bottom # Mn MASARAM GONDI SIGN NUKTA +11D44 ; Bottom # Mn MASARAM GONDI SIGN HALANTA +11D47 ; Bottom # Mn MASARAM GONDI RA-KARA +11EF4 ; Bottom # Mn MAKASAR VOWEL SIGN U + +# Indic_Positional_Category=Top_And_Bottom + +0C48 ; Top_And_Bottom # Mn TELUGU VOWEL SIGN AI +0F73 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN II +0F76..0F79 ; Top_And_Bottom # Mn [4] TIBETAN VOWEL SIGN VOCALIC R..TIBETAN VOWEL SIGN VOCALIC LL +0F81 ; 
Top_And_Bottom # Mn TIBETAN VOWEL SIGN REVERSED II +1B3C ; Top_And_Bottom # Mn BALINESE VOWEL SIGN LA LENGA +1112E..1112F ; Top_And_Bottom # Mn [2] CHAKMA VOWEL SIGN O..CHAKMA VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Right + +0AC9 ; Top_And_Right # Mc GUJARATI VOWEL SIGN CANDRA O +0B57 ; Top_And_Right # Mc ORIYA AU LENGTH MARK +0CC0 ; Top_And_Right # Mc KANNADA VOWEL SIGN II +0CC7..0CC8 ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +1925..1926 ; Top_And_Right # Mc [2] LIMBU VOWEL SIGN OO..LIMBU VOWEL SIGN AU +1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG +111BF ; Top_And_Right # Mc SHARADA VOWEL SIGN AU +11232..11233 ; Top_And_Right # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Left + +0B48 ; Top_And_Left # Mc ORIYA VOWEL SIGN AI +0DDA ; Top_And_Left # Mc SINHALA VOWEL SIGN DIGA KOMBUVA +17BE ; Top_And_Left # Mc KHMER VOWEL SIGN OE +1C29 ; Top_And_Left # Mc LEPCHA VOWEL SIGN OO +114BB ; Top_And_Left # Mc TIRHUTA VOWEL SIGN AI +115B9 ; Top_And_Left # Mc SIDDHAM VOWEL SIGN AI + +# Indic_Positional_Category=Top_And_Left_And_Right + +0B4C ; Top_And_Left_And_Right # Mc ORIYA VOWEL SIGN AU +0DDD ; Top_And_Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA +17BF ; Top_And_Left_And_Right # Mc KHMER VOWEL SIGN YA +115BB ; Top_And_Left_And_Right # Mc SIDDHAM VOWEL SIGN AU + +# Indic_Positional_Category=Bottom_And_Right + +1B3B ; Bottom_And_Right # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +A9C0 ; Bottom_And_Right # Mc JAVANESE PANGKON + +# Indic_Positional_Category=Bottom_And_Left + +A9BF ; Bottom_And_Left # Mc JAVANESE CONSONANT SIGN CAKRA + +# Indic_Positional_Category=Top_And_Bottom_And_Right + +1B3D ; Top_And_Bottom_And_Right # Mc BALINESE VOWEL SIGN LA LENGA TEDUNG + +# Indic_Positional_Category=Overstruck + +1CD4 ; Overstruck # Mn VEDIC SIGN YAJURVEDIC MIDLINE SVARITA +1CE2..1CE8 ; 
Overstruck # Mn [7] VEDIC SIGN VISARGA SVARITA..VEDIC SIGN VISARGA ANUDATTA WITH TAIL +10A01 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN I +10A06 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN O + +# EOF diff --git a/data/12.1.0-indic-syllabic-category.txt b/data/12.1.0-indic-syllabic-category.txt new file mode 100644 index 0000000..91ae6a0 --- /dev/null +++ b/data/12.1.0-indic-syllabic-category.txt @@ -0,0 +1,1286 @@ +# IndicSyllabicCategory-12.1.0.txt +# Date: 2019-03-08, 23:59:00 GMT [KW, RP] +# © 2019 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Syllabic_Category enumerated property +# +# Scope: This property is aimed at two general problem +# areas involving the analysis and processing of Indic scripts: +# +# 1. Specification of syllabic structure. +# 2. Specification of segmentation rules. +# +# Both of these problem areas may benefit from having defined subtypes +# of Indic script characters which are relevant to how Indic +# syllables (or aksaras) are constructed. Note that rules for +# syllabic structure in Indic scripts may differ significantly +# from how phonological syllables are defined. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Syllabic_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. 
+# +# The scripts assessed as Indic in the structural sense used for the +# Indic_Syllabic_Category are the following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dogra, Grantha, Gujarati, Gunjala Gondi, +# Gurmukhi, Hanunoo, Javanese, Kaithi, Kannada, Kayah Li, Kharoshthi, +# Khmer, Khojki, Khudawadi, Lao, Lepcha, Limbu, Mahajani, Makasar, +# Malayalam, Marchen, Masaram Gondi, Meetei Mayek, Modi, Multani, +# Myanmar, Nandinagari, Newa, New Tai Lue, Oriya, Phags-pa, Rejang, +# Saurashtra, Sharada, Siddham, Sinhala, Soyombo, Sundanese, Syloti +# Nagri, Tagalog, Tagbanwa, Tai Le, Tai Tham, Tai Viet, Takri, Tamil, +# Telugu, Thai, Tibetan, Tirhuta, and Zanabazar Square. +# +# All characters for all other scripts not in that list +# take the default value for this property, unless they +# are individually listed in this data file. +# + +# ================================================ + +# Property: Indic_Syllabic_Category +# +# All code points not explicitly listed for Indic_Syllabic_Category +# have the value Other. 
+# +# @missing: 0000..10FFFF; Other + +# ================================================ + +# Indic_Syllabic_Category=Bindu + +# Bindu/Anusvara (nasalization or -n) + +# [Not derivable] + +0900..0902 ; Bindu # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +0981 ; Bindu # Mn BENGALI SIGN CANDRABINDU +0982 ; Bindu # Mc BENGALI SIGN ANUSVARA +09FC ; Bindu # Lo BENGALI LETTER VEDIC ANUSVARA +0A01..0A02 ; Bindu # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A70 ; Bindu # Mn GURMUKHI TIPPI +0A81..0A82 ; Bindu # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0B01 ; Bindu # Mn ORIYA SIGN CANDRABINDU +0B02 ; Bindu # Mc ORIYA SIGN ANUSVARA +0B82 ; Bindu # Mn TAMIL SIGN ANUSVARA +0C00 ; Bindu # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C01..0C02 ; Bindu # Mc [2] TELUGU SIGN CANDRABINDU..TELUGU SIGN ANUSVARA +0C04 ; Bindu # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C80 ; Bindu # Lo KANNADA SIGN SPACING CANDRABINDU +0C81 ; Bindu # Mn KANNADA SIGN CANDRABINDU +0C82 ; Bindu # Mc KANNADA SIGN ANUSVARA +0D00..0D01 ; Bindu # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D02 ; Bindu # Mc MALAYALAM SIGN ANUSVARA +0D82 ; Bindu # Mc SINHALA SIGN ANUSVARAYA +0E4D ; Bindu # Mn THAI CHARACTER NIKHAHIT +0ECD ; Bindu # Mn LAO NIGGAHITA +0F7E ; Bindu # Mn TIBETAN SIGN RJES SU NGA RO +0F82..0F83 ; Bindu # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +1036 ; Bindu # Mn MYANMAR SIGN ANUSVARA +17C6 ; Bindu # Mn KHMER SIGN NIKAHIT +1932 ; Bindu # Mn LIMBU SMALL LETTER ANUSVARA +1A74 ; Bindu # Mn TAI THAM SIGN MAI KANG +1B00..1B02 ; Bindu # Mn [3] BALINESE SIGN ULU RICEM..BALINESE SIGN CECEK +1B80 ; Bindu # Mn SUNDANESE SIGN PANYECEK +1C34..1C35 ; Bindu # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A80B ; Bindu # Mn SYLOTI NAGRI SIGN ANUSVARA +A873 ; Bindu # Lo PHAGS-PA LETTER CANDRABINDU +A880 ; Bindu # Mc SAURASHTRA SIGN ANUSVARA +A8C5 ; Bindu # Mn SAURASHTRA SIGN CANDRABINDU 
+A8F2..A8F3 ; Bindu # Lo [2] DEVANAGARI SIGN SPACING CANDRABINDU..DEVANAGARI SIGN CANDRABINDU VIRAMA +A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK +10A0E ; Bindu # Mn KHAROSHTHI SIGN ANUSVARA +11000 ; Bindu # Mc BRAHMI SIGN CANDRABINDU +11001 ; Bindu # Mn BRAHMI SIGN ANUSVARA +11080..11081 ; Bindu # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +11100..11101 ; Bindu # Mn [2] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN ANUSVARA +11180..11181 ; Bindu # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +11234 ; Bindu # Mn KHOJKI SIGN ANUSVARA +112DF ; Bindu # Mn KHUDAWADI SIGN ANUSVARA +11300..11301 ; Bindu # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11302 ; Bindu # Mc GRANTHA SIGN ANUSVARA +1135E..1135F ; Bindu # Lo [2] GRANTHA LETTER VEDIC ANUSVARA..GRANTHA LETTER VEDIC DOUBLE ANUSVARA +11443..11444 ; Bindu # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +1145F ; Bindu # Lo NEWA LETTER VEDIC ANUSVARA +114BF..114C0 ; Bindu # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Bindu # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +1163D ; Bindu # Mn MODI SIGN ANUSVARA +116AB ; Bindu # Mn TAKRI SIGN ANUSVARA +11837 ; Bindu # Mn DOGRA SIGN ANUSVARA +119DE ; Bindu # Mc NANDINAGARI SIGN ANUSVARA +11A35..11A38 ; Bindu # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A96 ; Bindu # Mn SOYOMBO SIGN ANUSVARA +11C3C..11C3D ; Bindu # Mn [2] BHAIKSUKI SIGN CANDRABINDU..BHAIKSUKI SIGN ANUSVARA +11CB5..11CB6 ; Bindu # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D40 ; Bindu # Mn MASARAM GONDI SIGN ANUSVARA +11D95 ; Bindu # Mn GUNJALA GONDI SIGN ANUSVARA + +# ================================================ + +# Indic_Syllabic_Category=Visarga + +# Visarga (-h) +# Excludes letters for jihvamuliya and upadhmaniya, which are +# related, but structured somewhat differently. 
+ +# [Not derivable] + +0903 ; Visarga # Mc DEVANAGARI SIGN VISARGA +0983 ; Visarga # Mc BENGALI SIGN VISARGA +0A03 ; Visarga # Mc GURMUKHI SIGN VISARGA +0A83 ; Visarga # Mc GUJARATI SIGN VISARGA +0B03 ; Visarga # Mc ORIYA SIGN VISARGA +0C03 ; Visarga # Mc TELUGU SIGN VISARGA +0C83 ; Visarga # Mc KANNADA SIGN VISARGA +0D03 ; Visarga # Mc MALAYALAM SIGN VISARGA +0D83 ; Visarga # Mc SINHALA SIGN VISARGAYA +0F7F ; Visarga # Mc TIBETAN SIGN RNAM BCAD +1038 ; Visarga # Mc MYANMAR SIGN VISARGA +17C7 ; Visarga # Mc KHMER SIGN REAHMUK +1B04 ; Visarga # Mc BALINESE SIGN BISAH +1B82 ; Visarga # Mc SUNDANESE SIGN PANGWISAD +A881 ; Visarga # Mc SAURASHTRA SIGN VISARGA +A983 ; Visarga # Mc JAVANESE SIGN WIGNYAN +AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA +10A0F ; Visarga # Mn KHAROSHTHI SIGN VISARGA +11002 ; Visarga # Mc BRAHMI SIGN VISARGA +11082 ; Visarga # Mc KAITHI SIGN VISARGA +11102 ; Visarga # Mn CHAKMA SIGN VISARGA +11182 ; Visarga # Mc SHARADA SIGN VISARGA +11303 ; Visarga # Mc GRANTHA SIGN VISARGA +11445 ; Visarga # Mc NEWA SIGN VISARGA +114C1 ; Visarga # Mc TIRHUTA SIGN VISARGA +115BE ; Visarga # Mc SIDDHAM SIGN VISARGA +1163E ; Visarga # Mc MODI SIGN VISARGA +116AC ; Visarga # Mc TAKRI SIGN VISARGA +11838 ; Visarga # Mc DOGRA SIGN VISARGA +119DF ; Visarga # Mc NANDINAGARI SIGN VISARGA +11A39 ; Visarga # Mc ZANABAZAR SQUARE SIGN VISARGA +11A97 ; Visarga # Mc SOYOMBO SIGN VISARGA +11C3E ; Visarga # Mc BHAIKSUKI SIGN VISARGA +11D41 ; Visarga # Mn MASARAM GONDI SIGN VISARGA +11D96 ; Visarga # Mc GUNJALA GONDI SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Avagraha + +# Avagraha (elision of initial a- in sandhi) + +# [Not derivable] + +093D ; Avagraha # Lo DEVANAGARI SIGN AVAGRAHA +09BD ; Avagraha # Lo BENGALI SIGN AVAGRAHA +0ABD ; Avagraha # Lo GUJARATI SIGN AVAGRAHA +0B3D ; Avagraha # Lo ORIYA SIGN AVAGRAHA +0C3D ; Avagraha # Lo TELUGU SIGN AVAGRAHA +0CBD ; Avagraha # Lo KANNADA SIGN AVAGRAHA +0D3D ; Avagraha # 
Lo MALAYALAM SIGN AVAGRAHA +0F85 ; Avagraha # Po TIBETAN MARK PALUTA +17DC ; Avagraha # Lo KHMER SIGN AVAKRAHASANYA +1BBA ; Avagraha # Lo SUNDANESE AVAGRAHA +111C1 ; Avagraha # Lo SHARADA SIGN AVAGRAHA +1133D ; Avagraha # Lo GRANTHA SIGN AVAGRAHA +11447 ; Avagraha # Lo NEWA SIGN AVAGRAHA +114C4 ; Avagraha # Lo TIRHUTA SIGN AVAGRAHA +119E1 ; Avagraha # Lo NANDINAGARI SIGN AVAGRAHA +11A9D ; Avagraha # Lo SOYOMBO MARK PLUTA +11C40 ; Avagraha # Lo BHAIKSUKI SIGN AVAGRAHA + +# ================================================ + +# Indic_Syllabic_Category=Nukta + +# Nukta (diacritic for borrowed consonants or other consonant +# modifications). Note that while the resulting sound is typically a +# consonant, the base letter a nukta follows may be an independent +# vowel. For example, is used to transcribe ARABIC LETTER +# AIN. + +# [Not derivable] + +093C ; Nukta # Mn DEVANAGARI SIGN NUKTA +09BC ; Nukta # Mn BENGALI SIGN NUKTA +0A3C ; Nukta # Mn GURMUKHI SIGN NUKTA +0ABC ; Nukta # Mn GUJARATI SIGN NUKTA +0AFD..0AFF ; Nukta # Mn [3] GUJARATI SIGN THREE-DOT NUKTA ABOVE..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0CBC ; Nukta # Mn KANNADA SIGN NUKTA +0F39 ; Nukta # Mn TIBETAN MARK TSA -PHRU +1B34 ; Nukta # Mn BALINESE SIGN REREKAN +1BE6 ; Nukta # Mn BATAK SIGN TOMPI +1C37 ; Nukta # Mn LEPCHA SIGN NUKTA +A9B3 ; Nukta # Mn JAVANESE SIGN CECAK TELU +10A38..10A3A ; Nukta # Mn [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW +110BA ; Nukta # Mn KAITHI SIGN NUKTA +11173 ; Nukta # Mn MAHAJANI SIGN NUKTA +111CA ; Nukta # Mn SHARADA SIGN NUKTA +11236 ; Nukta # Mn KHOJKI SIGN NUKTA +112E9 ; Nukta # Mn KHUDAWADI SIGN NUKTA +1133B..1133C ; Nukta # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +11446 ; Nukta # Mn NEWA SIGN NUKTA +114C3 ; Nukta # Mn TIRHUTA SIGN NUKTA +115C0 ; Nukta # Mn SIDDHAM SIGN NUKTA +116B7 ; Nukta # Mn TAKRI SIGN NUKTA +1183A ; Nukta # Mn DOGRA SIGN NUKTA +11D42 ; Nukta # Mn MASARAM GONDI SIGN NUKTA + +# 
================================================ + +# Indic_Syllabic_Category=Virama + +# Virama (killing of inherent vowel in consonant sequence +# or consonant stacker) +# Only includes characters that can act both as visible killer viramas +# and consonant stackers. Separate property values exist for characters +# that can only act as pure killers or only as consonant stackers. + +# [Derivation: (ccc=9) - (InSC=Pure_Killer) - (InSC=Invisible_Stacker) +# - (InSC=Number_Joiner) - 2D7F] + +094D ; Virama # Mn DEVANAGARI SIGN VIRAMA +09CD ; Virama # Mn BENGALI SIGN VIRAMA +0A4D ; Virama # Mn GURMUKHI SIGN VIRAMA +0ACD ; Virama # Mn GUJARATI SIGN VIRAMA +0B4D ; Virama # Mn ORIYA SIGN VIRAMA +0BCD ; Virama # Mn TAMIL SIGN VIRAMA +0C4D ; Virama # Mn TELUGU SIGN VIRAMA +0CCD ; Virama # Mn KANNADA SIGN VIRAMA +0D4D ; Virama # Mn MALAYALAM SIGN VIRAMA +0DCA ; Virama # Mn SINHALA SIGN AL-LAKUNA +1B44 ; Virama # Mc BALINESE ADEG ADEG +A806 ; Virama # Mn SYLOTI NAGRI SIGN HASANTA +A8C4 ; Virama # Mn SAURASHTRA SIGN VIRAMA +A9C0 ; Virama # Mc JAVANESE PANGKON +11046 ; Virama # Mn BRAHMI VIRAMA +110B9 ; Virama # Mn KAITHI SIGN VIRAMA +111C0 ; Virama # Mc SHARADA SIGN VIRAMA +11235 ; Virama # Mc KHOJKI SIGN VIRAMA +1134D ; Virama # Mc GRANTHA SIGN VIRAMA +11442 ; Virama # Mn NEWA SIGN VIRAMA +114C2 ; Virama # Mn TIRHUTA SIGN VIRAMA +115BF ; Virama # Mn SIDDHAM SIGN VIRAMA +1163F ; Virama # Mn MODI SIGN VIRAMA +116B6 ; Virama # Mc TAKRI SIGN VIRAMA +11839 ; Virama # Mn DOGRA SIGN VIRAMA +119E0 ; Virama # Mn NANDINAGARI SIGN VIRAMA +11C3F ; Virama # Mn BHAIKSUKI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Pure_Killer + +# Pure killer (killing of inherent vowel in consonant sequence, +# with no consonant stacking behavior) + +# [Not derivable] + +0D3B..0D3C ; Pure_Killer # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0E3A ; Pure_Killer # Mn THAI CHARACTER PHINTHU +0E4E ; Pure_Killer # Mn THAI CHARACTER 
YAMAKKAN +0EBA ; Pure_Killer # Mn LAO SIGN PALI VIRAMA +0F84 ; Pure_Killer # Mn TIBETAN MARK HALANTA +103A ; Pure_Killer # Mn MYANMAR SIGN ASAT +1714 ; Pure_Killer # Mn TAGALOG SIGN VIRAMA +1734 ; Pure_Killer # Mn HANUNOO SIGN PAMUDPOD +17D1 ; Pure_Killer # Mn KHMER SIGN VIRIAM +1A7A ; Pure_Killer # Mn TAI THAM SIGN RA HAAM +1BAA ; Pure_Killer # Mc SUNDANESE SIGN PAMAAEH +1BF2..1BF3 ; Pure_Killer # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +A953 ; Pure_Killer # Mc REJANG VIRAMA +ABED ; Pure_Killer # Mn MEETEI MAYEK APUN IYEK +11134 ; Pure_Killer # Mn CHAKMA MAAYYAA +112EA ; Pure_Killer # Mn KHUDAWADI SIGN VIRAMA +1172B ; Pure_Killer # Mn AHOM SIGN KILLER +11A34 ; Pure_Killer # Mn ZANABAZAR SQUARE SIGN VIRAMA +11D44 ; Pure_Killer # Mn MASARAM GONDI SIGN HALANTA + +# ================================================ + +# Indic_Syllabic_Category=Invisible_Stacker + +# Invisible stacker (invisible consonant stacker virama). +# +# Note that in some scripts, such as Kharoshthi and Masaram Gondi, an invisible +# stacker may have a second function, changing the shape and/or location of the +# consonant preceding it, even when there is no consonant following the +# invisible stacker. 
+ +# [Not derivable] + +1039 ; Invisible_Stacker # Mn MYANMAR SIGN VIRAMA +17D2 ; Invisible_Stacker # Mn KHMER SIGN COENG +1A60 ; Invisible_Stacker # Mn TAI THAM SIGN SAKOT +1BAB ; Invisible_Stacker # Mn SUNDANESE SIGN VIRAMA +AAF6 ; Invisible_Stacker # Mn MEETEI MAYEK VIRAMA +10A3F ; Invisible_Stacker # Mn KHAROSHTHI VIRAMA +11133 ; Invisible_Stacker # Mn CHAKMA VIRAMA +11A47 ; Invisible_Stacker # Mn ZANABAZAR SQUARE SUBJOINER +11A99 ; Invisible_Stacker # Mn SOYOMBO SUBJOINER +11D45 ; Invisible_Stacker # Mn MASARAM GONDI VIRAMA +11D97 ; Invisible_Stacker # Mn GUNJALA GONDI VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Independent + +# Independent Vowels (contrasted with matras) + +# [Not derivable] + +0904..0914 ; Vowel_Independent # Lo [17] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER AU +0960..0961 ; Vowel_Independent # Lo [2] DEVANAGARI LETTER VOCALIC RR..DEVANAGARI LETTER VOCALIC LL +0972..0977 ; Vowel_Independent # Lo [6] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER UUE +0985..098C ; Vowel_Independent # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L +098F..0990 ; Vowel_Independent # Lo [2] BENGALI LETTER E..BENGALI LETTER AI +0993..0994 ; Vowel_Independent # Lo [2] BENGALI LETTER O..BENGALI LETTER AU +09E0..09E1 ; Vowel_Independent # Lo [2] BENGALI LETTER VOCALIC RR..BENGALI LETTER VOCALIC LL +0A05..0A0A ; Vowel_Independent # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU +0A0F..0A10 ; Vowel_Independent # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI +0A13..0A14 ; Vowel_Independent # Lo [2] GURMUKHI LETTER OO..GURMUKHI LETTER AU +0A85..0A8D ; Vowel_Independent # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E +0A8F..0A91 ; Vowel_Independent # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O +0A93..0A94 ; Vowel_Independent # Lo [2] GUJARATI LETTER O..GUJARATI LETTER AU +0AE0..0AE1 ; Vowel_Independent # Lo [2] GUJARATI LETTER VOCALIC RR..GUJARATI LETTER VOCALIC LL +0B05..0B0C ; Vowel_Independent # Lo [8] 
ORIYA LETTER A..ORIYA LETTER VOCALIC L +0B0F..0B10 ; Vowel_Independent # Lo [2] ORIYA LETTER E..ORIYA LETTER AI +0B13..0B14 ; Vowel_Independent # Lo [2] ORIYA LETTER O..ORIYA LETTER AU +0B60..0B61 ; Vowel_Independent # Lo [2] ORIYA LETTER VOCALIC RR..ORIYA LETTER VOCALIC LL +0B85..0B8A ; Vowel_Independent # Lo [6] TAMIL LETTER A..TAMIL LETTER UU +0B8E..0B90 ; Vowel_Independent # Lo [3] TAMIL LETTER E..TAMIL LETTER AI +0B92..0B94 ; Vowel_Independent # Lo [3] TAMIL LETTER O..TAMIL LETTER AU +0C05..0C0C ; Vowel_Independent # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L +0C0E..0C10 ; Vowel_Independent # Lo [3] TELUGU LETTER E..TELUGU LETTER AI +0C12..0C14 ; Vowel_Independent # Lo [3] TELUGU LETTER O..TELUGU LETTER AU +0C60..0C61 ; Vowel_Independent # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL +0C85..0C8C ; Vowel_Independent # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L +0C8E..0C90 ; Vowel_Independent # Lo [3] KANNADA LETTER E..KANNADA LETTER AI +0C92..0C94 ; Vowel_Independent # Lo [3] KANNADA LETTER O..KANNADA LETTER AU +0CE0..0CE1 ; Vowel_Independent # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL +0D05..0D0C ; Vowel_Independent # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L +0D0E..0D10 ; Vowel_Independent # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI +0D12..0D14 ; Vowel_Independent # Lo [3] MALAYALAM LETTER O..MALAYALAM LETTER AU +0D5F..0D61 ; Vowel_Independent # Lo [3] MALAYALAM LETTER ARCHAIC II..MALAYALAM LETTER VOCALIC LL +0D85..0D96 ; Vowel_Independent # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA +1021..102A ; Vowel_Independent # Lo [10] MYANMAR LETTER A..MYANMAR LETTER AU +1052..1055 ; Vowel_Independent # Lo [4] MYANMAR LETTER VOCALIC R..MYANMAR LETTER VOCALIC LL +1700..1702 ; Vowel_Independent # Lo [3] TAGALOG LETTER A..TAGALOG LETTER U +1720..1722 ; Vowel_Independent # Lo [3] HANUNOO LETTER A..HANUNOO LETTER U +1740..1742 ; Vowel_Independent # Lo [3] BUHID LETTER A..BUHID LETTER U +1760..1762 ; 
Vowel_Independent # Lo [3] TAGBANWA LETTER A..TAGBANWA LETTER U +17A3..17B3 ; Vowel_Independent # Lo [17] KHMER INDEPENDENT VOWEL QAQ..KHMER INDEPENDENT VOWEL QAU +1A4D..1A52 ; Vowel_Independent # Lo [6] TAI THAM LETTER I..TAI THAM LETTER OO +1B05..1B12 ; Vowel_Independent # Lo [14] BALINESE LETTER AKARA..BALINESE LETTER OKARA TEDUNG +1B83..1B89 ; Vowel_Independent # Lo [7] SUNDANESE LETTER A..SUNDANESE LETTER EU +1BE4..1BE5 ; Vowel_Independent # Lo [2] BATAK LETTER I..BATAK LETTER U +A800..A801 ; Vowel_Independent # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I +A803..A805 ; Vowel_Independent # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O +A882..A891 ; Vowel_Independent # Lo [16] SAURASHTRA LETTER A..SAURASHTRA LETTER AU +A8FE ; Vowel_Independent # Lo DEVANAGARI LETTER AY +A984..A988 ; Vowel_Independent # Lo [5] JAVANESE LETTER A..JAVANESE LETTER U +A98C..A98E ; Vowel_Independent # Lo [3] JAVANESE LETTER E..JAVANESE LETTER O +AA00..AA05 ; Vowel_Independent # Lo [6] CHAM LETTER A..CHAM LETTER O +AAE0..AAE1 ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER E..MEETEI MAYEK LETTER O +ABCE..ABCF ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER UN..MEETEI MAYEK LETTER I +ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA +11005..11012 ; Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU +11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER A..KAITHI LETTER AU +11103..11106 ; Vowel_Independent # Lo [4] CHAKMA LETTER AA..CHAKMA LETTER E +11183..11190 ; Vowel_Independent # Lo [14] SHARADA LETTER A..SHARADA LETTER AU +11200..11207 ; Vowel_Independent # Lo [8] KHOJKI LETTER A..KHOJKI LETTER AU +11280..11283 ; Vowel_Independent # Lo [4] MULTANI LETTER A..MULTANI LETTER E +112B0..112B9 ; Vowel_Independent # Lo [10] KHUDAWADI LETTER A..KHUDAWADI LETTER AU +11305..1130C ; Vowel_Independent # Lo [8] GRANTHA LETTER A..GRANTHA LETTER VOCALIC L +1130F..11310 ; Vowel_Independent # Lo [2] GRANTHA LETTER EE..GRANTHA LETTER AI +11313..11314 ; 
Vowel_Independent # Lo [2] GRANTHA LETTER OO..GRANTHA LETTER AU +11360..11361 ; Vowel_Independent # Lo [2] GRANTHA LETTER VOCALIC RR..GRANTHA LETTER VOCALIC LL +11400..1140D ; Vowel_Independent # Lo [14] NEWA LETTER A..NEWA LETTER AU +11481..1148E ; Vowel_Independent # Lo [14] TIRHUTA LETTER A..TIRHUTA LETTER AU +11580..1158D ; Vowel_Independent # Lo [14] SIDDHAM LETTER A..SIDDHAM LETTER AU +115D8..115DB ; Vowel_Independent # Lo [4] SIDDHAM LETTER THREE-CIRCLE ALTERNATE I..SIDDHAM LETTER ALTERNATE U +11600..1160D ; Vowel_Independent # Lo [14] MODI LETTER A..MODI LETTER AU +11680..11689 ; Vowel_Independent # Lo [10] TAKRI LETTER A..TAKRI LETTER AU +11800..11809 ; Vowel_Independent # Lo [10] DOGRA LETTER A..DOGRA LETTER AU +119A0..119A7 ; Vowel_Independent # Lo [8] NANDINAGARI LETTER A..NANDINAGARI LETTER VOCALIC RR +119AA..119AD ; Vowel_Independent # Lo [4] NANDINAGARI LETTER E..NANDINAGARI LETTER AU +11A00 ; Vowel_Independent # Lo ZANABAZAR SQUARE LETTER A +11A50 ; Vowel_Independent # Lo SOYOMBO LETTER A +11C00..11C08 ; Vowel_Independent # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L +11C0A..11C0D ; Vowel_Independent # Lo [4] BHAIKSUKI LETTER E..BHAIKSUKI LETTER AU +11D00..11D06 ; Vowel_Independent # Lo [7] MASARAM GONDI LETTER A..MASARAM GONDI LETTER E +11D08..11D09 ; Vowel_Independent # Lo [2] MASARAM GONDI LETTER AI..MASARAM GONDI LETTER O +11D0B ; Vowel_Independent # Lo MASARAM GONDI LETTER AU +11D60..11D65 ; Vowel_Independent # Lo [6] GUNJALA GONDI LETTER A..GUNJALA GONDI LETTER UU +11D67..11D68 ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER EE..GUNJALA GONDI LETTER AI +11D6A..11D6B ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER OO..GUNJALA GONDI LETTER AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Dependent + +# Dependent Vowels (contrasted with independent vowels and/or with +# complex placement). Known as matras in Indic scripts. 
Also +# includes vowel modifiers that follow dependent (and sometimes +# independent) vowels. + +# [Not derivable] + +093A ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN OE +093B ; Vowel_Dependent # Mc DEVANAGARI VOWEL SIGN OOE +093E..0940 ; Vowel_Dependent # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II +0941..0948 ; Vowel_Dependent # Mn [8] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN AI +0949..094C ; Vowel_Dependent # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094E..094F ; Vowel_Dependent # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA E..DEVANAGARI VOWEL SIGN AW +0955..0957 ; Vowel_Dependent # Mn [3] DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Vowel_Dependent # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BE..09C0 ; Vowel_Dependent # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II +09C1..09C4 ; Vowel_Dependent # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09C7..09C8 ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +09CB..09CC ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +09D7 ; Vowel_Dependent # Mc BENGALI AU LENGTH MARK +09E2..09E3 ; Vowel_Dependent # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3E..0A40 ; Vowel_Dependent # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II +0A41..0A42 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A47..0A48 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0ABE..0AC0 ; Vowel_Dependent # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL SIGN II +0AC1..0AC5 ; Vowel_Dependent # Mn [5] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AC9 ; Vowel_Dependent # Mc GUJARATI VOWEL SIGN CANDRA O +0ACB..0ACC ; Vowel_Dependent # 
Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0AE2..0AE3 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3E ; Vowel_Dependent # Mc ORIYA VOWEL SIGN AA +0B3F ; Vowel_Dependent # Mn ORIYA VOWEL SIGN I +0B40 ; Vowel_Dependent # Mc ORIYA VOWEL SIGN II +0B41..0B44 ; Vowel_Dependent # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B47..0B48 ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI +0B4B..0B4C ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU +0B56 ; Vowel_Dependent # Mn ORIYA AI LENGTH MARK +0B57 ; Vowel_Dependent # Mc ORIYA AU LENGTH MARK +0B62..0B63 ; Vowel_Dependent # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BBE..0BBF ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC0 ; Vowel_Dependent # Mn TAMIL VOWEL SIGN II +0BC1..0BC2 ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BC6..0BC8 ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0BCA..0BCC ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0BD7 ; Vowel_Dependent # Mc TAMIL AU LENGTH MARK +0C3E..0C40 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C41..0C44 ; Vowel_Dependent # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C46..0C48 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI +0C4A..0C4C ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C55..0C56 ; Vowel_Dependent # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK +0C62..0C63 ; Vowel_Dependent # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBE ; Vowel_Dependent # Mc KANNADA VOWEL SIGN AA +0CBF ; Vowel_Dependent # Mn KANNADA VOWEL SIGN I +0CC0..0CC4 ; Vowel_Dependent # Mc [5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN VOCALIC RR +0CC6 ; Vowel_Dependent # Mn KANNADA VOWEL SIGN E +0CC7..0CC8 ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI 
+0CCA..0CCB ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +0CCC ; Vowel_Dependent # Mn KANNADA VOWEL SIGN AU +0CD5..0CD6 ; Vowel_Dependent # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CE2..0CE3 ; Vowel_Dependent # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D3E..0D40 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D44 ; Vowel_Dependent # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D46..0D48 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0D4A..0D4C ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0D57 ; Vowel_Dependent # Mc MALAYALAM AU LENGTH MARK +0D62..0D63 ; Vowel_Dependent # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DCF..0DD1 ; Vowel_Dependent # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD2..0DD4 ; Vowel_Dependent # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Vowel_Dependent # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0DD8..0DDF ; Vowel_Dependent # Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Vowel_Dependent # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Vowel_Dependent # Lo THAI CHARACTER SARA A +0E31 ; Vowel_Dependent # Mn THAI CHARACTER MAI HAN-AKAT +0E32..0E33 ; Vowel_Dependent # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E34..0E39 ; Vowel_Dependent # Mn [6] THAI CHARACTER SARA I..THAI CHARACTER SARA UU +0E40..0E45 ; Vowel_Dependent # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO +0E47 ; Vowel_Dependent # Mn THAI CHARACTER MAITAIKHU +0EB0 ; Vowel_Dependent # Lo LAO VOWEL SIGN A +0EB1 ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KAN +0EB2..0EB3 ; Vowel_Dependent # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0EB4..0EB9 ; Vowel_Dependent # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU +0EBB 
; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KON +0EC0..0EC4 ; Vowel_Dependent # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +0F71..0F7D ; Vowel_Dependent # Mn [13] TIBETAN VOWEL SIGN AA..TIBETAN VOWEL SIGN OO +0F80..0F81 ; Vowel_Dependent # Mn [2] TIBETAN VOWEL SIGN REVERSED I..TIBETAN VOWEL SIGN REVERSED II +102B..102C ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +102D..1030 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN UU +1031 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN E +1032..1035 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +1056..1057 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1058..1059 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1062 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1071..1074 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1083..1084 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E +1085..1086 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109C ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN AITON A +109D ; Vowel_Dependent # Mn MYANMAR VOWEL SIGN AITON AI +1712..1713 ; Vowel_Dependent # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U +1732..1733 ; Vowel_Dependent # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1752..1753 ; Vowel_Dependent # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U +1772..1773 ; Vowel_Dependent # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U +17B6 ; Vowel_Dependent # Mc KHMER VOWEL SIGN AA +17B7..17BD ; Vowel_Dependent # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL SIGN UA +17BE..17C5 ; Vowel_Dependent # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU +17C8 ; Vowel_Dependent # Mc KHMER SIGN YUUKALEAPINTU 
+1920..1922 ; Vowel_Dependent # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U +1923..1926 ; Vowel_Dependent # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU +1927..1928 ; Vowel_Dependent # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Vowel_Dependent # Mn LIMBU SIGN KEMPHRENG +19B0..19C0 ; Vowel_Dependent # Lo [17] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN IY +1A17..1A18 ; Vowel_Dependent # Mn [2] BUGINESE VOWEL SIGN I..BUGINESE VOWEL SIGN U +1A19..1A1A ; Vowel_Dependent # Mc [2] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN O +1A1B ; Vowel_Dependent # Mn BUGINESE VOWEL SIGN AE +1A61 ; Vowel_Dependent # Mc TAI THAM VOWEL SIGN A +1A62 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN MAI SAT +1A63..1A64 ; Vowel_Dependent # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A65..1A6C ; Vowel_Dependent # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW +1A6D..1A72 ; Vowel_Dependent # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI +1A73 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN OA ABOVE +1B35 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN TEDUNG +1B36..1B3A ; Vowel_Dependent # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA +1B3B ; Vowel_Dependent # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +1B3C ; Vowel_Dependent # Mn BALINESE VOWEL SIGN LA LENGA +1B3D..1B41 ; Vowel_Dependent # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1B42 ; Vowel_Dependent # Mn BALINESE VOWEL SIGN PEPET +1B43 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN PEPET TEDUNG +1BA4..1BA5 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PANGHULU..SUNDANESE VOWEL SIGN PANYUKU +1BA6..1BA7 ; Vowel_Dependent # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL SIGN PANOLONG +1BA8..1BA9 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE7 ; Vowel_Dependent # Mc BATAK VOWEL SIGN E +1BE8..1BE9 ; Vowel_Dependent # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE 
+1BEA..1BEC ; Vowel_Dependent # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BED ; Vowel_Dependent # Mn BATAK VOWEL SIGN KARO O +1BEE ; Vowel_Dependent # Mc BATAK VOWEL SIGN U +1BEF ; Vowel_Dependent # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +1C26..1C2B ; Vowel_Dependent # Mc [6] LEPCHA VOWEL SIGN AA..LEPCHA VOWEL SIGN UU +1C2C ; Vowel_Dependent # Mn LEPCHA VOWEL SIGN E +A802 ; Vowel_Dependent # Mn SYLOTI NAGRI SIGN DVISVARA +A823..A824 ; Vowel_Dependent # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A825..A826 ; Vowel_Dependent # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E +A827 ; Vowel_Dependent # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Vowel_Dependent # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A8FF ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN AY +A947..A94E ; Vowel_Dependent # Mn [8] REJANG VOWEL SIGN I..REJANG VOWEL SIGN EA +A9B4..A9B5 ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9B6..A9B9 ; Vowel_Dependent # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BA..A9BB ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +A9BC ; Vowel_Dependent # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Vowel_Dependent # Mn MYANMAR SIGN SHAN SAW +AA29..AA2E ; Vowel_Dependent # Mn [6] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN OE +AA2F..AA30 ; Vowel_Dependent # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA31..AA32 ; Vowel_Dependent # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE +AAB0 ; Vowel_Dependent # Mn TAI VIET MAI KANG +AAB1 ; Vowel_Dependent # Lo TAI VIET VOWEL AA +AAB2..AAB4 ; Vowel_Dependent # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U +AAB5..AAB6 ; Vowel_Dependent # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB7..AAB8 ; Vowel_Dependent # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AAB9..AABD ; Vowel_Dependent # Lo [5] TAI VIET VOWEL UEA..TAI VIET VOWEL AN +AABE ; Vowel_Dependent # Mn TAI VIET VOWEL AM +AAEB ; Vowel_Dependent # Mc 
MEETEI MAYEK VOWEL SIGN II +AAEC..AAED ; Vowel_Dependent # Mn [2] MEETEI MAYEK VOWEL SIGN UU..MEETEI MAYEK VOWEL SIGN AAI +AAEE..AAEF ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN AU..MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE5 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN ANAP +ABE6..ABE7 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE8 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +10A01..10A03 ; Vowel_Dependent # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R +10A05..10A06 ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O +10A0C..10A0D ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN DOUBLE RING BELOW +11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +110B0..110B2 ; Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II +110B3..110B6 ; Vowel_Dependent # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI +110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11127..1112B ; Vowel_Dependent # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU +1112C ; Vowel_Dependent # Mc CHAKMA VOWEL SIGN E +1112D..11132 ; Vowel_Dependent # Mn [6] CHAKMA VOWEL SIGN AI..CHAKMA AU MARK +11145..11146 ; Vowel_Dependent # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +111B3..111B5 ; Vowel_Dependent # Mc [3] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN II +111B6..111BE ; Vowel_Dependent # Mn [9] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN O +111BF ; Vowel_Dependent # Mc SHARADA VOWEL SIGN AU +111CB..111CC ; Vowel_Dependent # Mn [2] SHARADA VOWEL MODIFIER MARK..SHARADA EXTRA SHORT VOWEL MARK +1122C..1122E ; Vowel_Dependent # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +1122F..11231 ; Vowel_Dependent # Mn 
[3] KHOJKI VOWEL SIGN U..KHOJKI VOWEL SIGN AI +11232..11233 ; Vowel_Dependent # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU +112E0..112E2 ; Vowel_Dependent # Mc [3] KHUDAWADI VOWEL SIGN AA..KHUDAWADI VOWEL SIGN II +112E3..112E8 ; Vowel_Dependent # Mn [6] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN AU +1133E..1133F ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11340 ; Vowel_Dependent # Mn GRANTHA VOWEL SIGN II +11341..11344 ; Vowel_Dependent # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +11347..11348 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +1134B..1134C ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +11357 ; Vowel_Dependent # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435..11437 ; Vowel_Dependent # Mc [3] NEWA VOWEL SIGN AA..NEWA VOWEL SIGN II +11438..1143F ; Vowel_Dependent # Mn [8] NEWA VOWEL SIGN U..NEWA VOWEL SIGN AI +11440..11441 ; Vowel_Dependent # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +114B0..114B2 ; Vowel_Dependent # Mc [3] TIRHUTA VOWEL SIGN AA..TIRHUTA VOWEL SIGN II +114B3..114B8 ; Vowel_Dependent # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114B9 ; Vowel_Dependent # Mc TIRHUTA VOWEL SIGN E +114BA ; Vowel_Dependent # Mn TIRHUTA VOWEL SIGN SHORT E +114BB..114BE ; Vowel_Dependent # Mc [4] TIRHUTA VOWEL SIGN AI..TIRHUTA VOWEL SIGN AU +115AF..115B1 ; Vowel_Dependent # Mc [3] SIDDHAM VOWEL SIGN AA..SIDDHAM VOWEL SIGN II +115B2..115B5 ; Vowel_Dependent # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115B8..115BB ; Vowel_Dependent # Mc [4] SIDDHAM VOWEL SIGN E..SIDDHAM VOWEL SIGN AU +115DC..115DD ; Vowel_Dependent # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11630..11632 ; Vowel_Dependent # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +11633..1163A ; Vowel_Dependent # Mn [8] MODI VOWEL SIGN U..MODI VOWEL SIGN 
AI +1163B..1163C ; Vowel_Dependent # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +11640 ; Vowel_Dependent # Mn MODI SIGN ARDHACANDRA +116AD ; Vowel_Dependent # Mn TAKRI VOWEL SIGN AA +116AE..116AF ; Vowel_Dependent # Mc [2] TAKRI VOWEL SIGN I..TAKRI VOWEL SIGN II +116B0..116B5 ; Vowel_Dependent # Mn [6] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN AU +11720..11721 ; Vowel_Dependent # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +11722..11725 ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN I..AHOM VOWEL SIGN UU +11726 ; Vowel_Dependent # Mc AHOM VOWEL SIGN E +11727..1172A ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN AW..AHOM VOWEL SIGN AM +1182C..1182E ; Vowel_Dependent # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II +1182F..11836 ; Vowel_Dependent # Mn [8] DOGRA VOWEL SIGN U..DOGRA VOWEL SIGN AU +119D1..119D3 ; Vowel_Dependent # Mc [3] NANDINAGARI VOWEL SIGN AA..NANDINAGARI VOWEL SIGN II +119D4..119D7 ; Vowel_Dependent # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR +119DA..119DB ; Vowel_Dependent # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI +119DC..119DD ; Vowel_Dependent # Mc [2] NANDINAGARI VOWEL SIGN O..NANDINAGARI VOWEL SIGN AU +119E4 ; Vowel_Dependent # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E +11A01..11A0A ; Vowel_Dependent # Mn [10] ZANABAZAR SQUARE VOWEL SIGN I..ZANABAZAR SQUARE VOWEL LENGTH MARK +11A51..11A56 ; Vowel_Dependent # Mn [6] SOYOMBO VOWEL SIGN I..SOYOMBO VOWEL SIGN OE +11A57..11A58 ; Vowel_Dependent # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A59..11A5B ; Vowel_Dependent # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11C2F ; Vowel_Dependent # Mc BHAIKSUKI VOWEL SIGN AA +11C30..11C36 ; Vowel_Dependent # Mn [7] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN VOCALIC L +11C38..11C3B ; Vowel_Dependent # Mn [4] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI VOWEL SIGN AU +11CB0 ; Vowel_Dependent # Mn MARCHEN VOWEL SIGN AA +11CB1 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN I +11CB2..11CB3 ; Vowel_Dependent # Mn 
[2] MARCHEN VOWEL SIGN U..MARCHEN VOWEL SIGN E +11CB4 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN O +11D31..11D36 ; Vowel_Dependent # Mn [6] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN VOCALIC R +11D3A ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Vowel_Dependent # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN AU +11D43 ; Vowel_Dependent # Mn MASARAM GONDI SIGN CANDRA +11D8A..11D8E ; Vowel_Dependent # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D90..11D91 ; Vowel_Dependent # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI +11D93..11D94 ; Vowel_Dependent # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11EF3..11EF4 ; Vowel_Dependent # Mn [2] MAKASAR VOWEL SIGN I..MAKASAR VOWEL SIGN U +11EF5..11EF6 ; Vowel_Dependent # Mc [2] MAKASAR VOWEL SIGN E..MAKASAR VOWEL SIGN O + +# ================================================ + +# Indic_Syllabic_Category=Vowel + +# (Other) Vowels (reanalyzed as ordinary alphabetic letters or marks) + +# [Not derivable] + +1963..196D ; Vowel # Lo [11] TAI LE LETTER A..TAI LE LETTER AI +A85E..A861 ; Vowel # Lo [4] PHAGS-PA LETTER I..PHAGS-PA LETTER O +A866 ; Vowel # Lo PHAGS-PA LETTER EE +A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO +A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O +11150..11154 ; Vowel # Lo [5] MAHAJANI LETTER A..MAHAJANI LETTER O + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Placeholder + +# Consonant Placeholder +# This includes generic placeholders used for +# Indic script layout (NBSP and dotted circle), as well as a few script- +# specific vowel-holder characters which are not technically +# consonants, but serve instead as bases for placement of vowel marks. 
+ +# [Not derivable] + +002D ; Consonant_Placeholder # Pd HYPHEN-MINUS +00A0 ; Consonant_Placeholder # Zs NO-BREAK SPACE +00D7 ; Consonant_Placeholder # Sm MULTIPLICATION SIGN +0980 ; Consonant_Placeholder # Lo BENGALI ANJI +0A72..0A73 ; Consonant_Placeholder # Lo [2] GURMUKHI IRI..GURMUKHI URA +104B ; Consonant_Placeholder # Po MYANMAR SIGN SECTION +104E ; Consonant_Placeholder # Po MYANMAR SYMBOL AFOREMENTIONED +1900 ; Consonant_Placeholder # Lo LIMBU VOWEL-CARRIER LETTER +1CFA ; Consonant_Placeholder # Lo VEDIC SIGN DOUBLE ANUSVARA ANTARGOMUKHA +2010..2014 ; Consonant_Placeholder # Pd [5] HYPHEN..EM DASH +25CC ; Consonant_Placeholder # So DOTTED CIRCLE +AA74..AA76 ; Consonant_Placeholder # Lo [3] MYANMAR LOGOGRAM KHAMTI OAY..MYANMAR LOGOGRAM KHAMTI HM +11A3F ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL HEAD MARK +11A45 ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL DOUBLE-LINED HEAD MARK +11EF2 ; Consonant_Placeholder # Lo MAKASAR ANGKA + +# ================================================ + +# Indic_Syllabic_Category=Consonant + +# Consonant (ordinary abugida consonants, with inherent vowels) + +# [Not derivable] + +0915..0939 ; Consonant # Lo [37] DEVANAGARI LETTER KA..DEVANAGARI LETTER HA +0958..095F ; Consonant # Lo [8] DEVANAGARI LETTER QA..DEVANAGARI LETTER YYA +0978..097F ; Consonant # Lo [8] DEVANAGARI LETTER MARWARI DDA..DEVANAGARI LETTER BBA +0995..09A8 ; Consonant # Lo [20] BENGALI LETTER KA..BENGALI LETTER NA +09AA..09B0 ; Consonant # Lo [7] BENGALI LETTER PA..BENGALI LETTER RA +09B2 ; Consonant # Lo BENGALI LETTER LA +09B6..09B9 ; Consonant # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA +09DC..09DD ; Consonant # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA +09DF ; Consonant # Lo BENGALI LETTER YYA +09F0..09F1 ; Consonant # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH LOWER DIAGONAL +0A15..0A28 ; Consonant # Lo [20] GURMUKHI LETTER KA..GURMUKHI LETTER NA +0A2A..0A30 ; Consonant # Lo [7] GURMUKHI LETTER 
PA..GURMUKHI LETTER RA +0A32..0A33 ; Consonant # Lo [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA +0A35..0A36 ; Consonant # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA +0A38..0A39 ; Consonant # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA +0A59..0A5C ; Consonant # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA +0A5E ; Consonant # Lo GURMUKHI LETTER FA +0A95..0AA8 ; Consonant # Lo [20] GUJARATI LETTER KA..GUJARATI LETTER NA +0AAA..0AB0 ; Consonant # Lo [7] GUJARATI LETTER PA..GUJARATI LETTER RA +0AB2..0AB3 ; Consonant # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA +0AB5..0AB9 ; Consonant # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA +0AF9 ; Consonant # Lo GUJARATI LETTER ZHA +0B15..0B28 ; Consonant # Lo [20] ORIYA LETTER KA..ORIYA LETTER NA +0B2A..0B30 ; Consonant # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA +0B32..0B33 ; Consonant # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA +0B35..0B39 ; Consonant # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA +0B5C..0B5D ; Consonant # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA +0B5F ; Consonant # Lo ORIYA LETTER YYA +0B71 ; Consonant # Lo ORIYA LETTER WA +0B95 ; Consonant # Lo TAMIL LETTER KA +0B99..0B9A ; Consonant # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA +0B9C ; Consonant # Lo TAMIL LETTER JA +0B9E..0B9F ; Consonant # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA +0BA3..0BA4 ; Consonant # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA +0BA8..0BAA ; Consonant # Lo [3] TAMIL LETTER NA..TAMIL LETTER PA +0BAE..0BB9 ; Consonant # Lo [12] TAMIL LETTER MA..TAMIL LETTER HA +0C15..0C28 ; Consonant # Lo [20] TELUGU LETTER KA..TELUGU LETTER NA +0C2A..0C39 ; Consonant # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C58..0C5A ; Consonant # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C95..0CA8 ; Consonant # Lo [20] KANNADA LETTER KA..KANNADA LETTER NA +0CAA..0CB3 ; Consonant # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA +0CB5..0CB9 ; Consonant # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA +0CDE ; Consonant # Lo KANNADA LETTER FA +0D15..0D3A ; 
Consonant # Lo [38] MALAYALAM LETTER KA..MALAYALAM LETTER TTTA +0D9A..0DB1 ; Consonant # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA +0DB3..0DBB ; Consonant # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA +0DBD ; Consonant # Lo SINHALA LETTER DANTAJA LAYANNA +0DC0..0DC6 ; Consonant # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA +0E01..0E2E ; Consonant # Lo [46] THAI CHARACTER KO KAI..THAI CHARACTER HO NOKHUK +0E81..0E82 ; Consonant # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG +0E84 ; Consonant # Lo LAO LETTER KHO TAM +0E86..0E8A ; Consonant # Lo [5] LAO LETTER PALI GHA..LAO LETTER SO TAM +0E8C..0EA3 ; Consonant # Lo [24] LAO LETTER PALI JHA..LAO LETTER LO LING +0EA5 ; Consonant # Lo LAO LETTER LO LOOT +0EA7..0EAE ; Consonant # Lo [8] LAO LETTER WO..LAO LETTER HO TAM +0EDC..0EDF ; Consonant # Lo [4] LAO HO NO..LAO LETTER KHMU NYO +0F40..0F47 ; Consonant # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA +0F49..0F6C ; Consonant # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA +1000..1020 ; Consonant # Lo [33] MYANMAR LETTER KA..MYANMAR LETTER LLA +103F ; Consonant # Lo MYANMAR LETTER GREAT SA +1050..1051 ; Consonant # Lo [2] MYANMAR LETTER SHA..MYANMAR LETTER SSA +105A..105D ; Consonant # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE +1061 ; Consonant # Lo MYANMAR LETTER SGAW KAREN SHA +1065..1066 ; Consonant # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER WESTERN PWO KAREN PWA +106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA +1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA +108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA +1703..170C ; Consonant # Lo [10] TAGALOG LETTER KA..TAGALOG LETTER YA +170E..1711 ; Consonant # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1723..1731 ; Consonant # Lo [15] HANUNOO LETTER KA..HANUNOO LETTER HA +1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA 
+1763..176C ; Consonant # Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA +176E..1770 ; Consonant # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA +1780..17A2 ; Consonant # Lo [35] KHMER LETTER KA..KHMER LETTER QA +1901..191E ; Consonant # Lo [30] LIMBU LETTER KA..LIMBU LETTER TRA +1950..1962 ; Consonant # Lo [19] TAI LE LETTER KA..TAI LE LETTER NA +1980..19AB ; Consonant # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI LUE LETTER LOW SUA +1A00..1A16 ; Consonant # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA +1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA +1A53..1A54 ; Consonant # Lo [2] TAI THAM LETTER LAE..TAI THAM LETTER GREAT SA +1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA +1B45..1B4B ; Consonant # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA +1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA +1BBB..1BBD ; Consonant # Lo [3] SUNDANESE LETTER REU..SUNDANESE LETTER BHA +1BC0..1BE3 ; Consonant # Lo [36] BATAK LETTER A..BATAK LETTER MBA +1C00..1C23 ; Consonant # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A +1C4D..1C4F ; Consonant # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA +A807..A80A ; Consonant # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO +A80C..A822 ; Consonant # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO +A840..A85D ; Consonant # Lo [30] PHAGS-PA LETTER KA..PHAGS-PA LETTER A +A862..A865 ; Consonant # Lo [4] PHAGS-PA LETTER QA..PHAGS-PA LETTER GGA +A869..A870 ; Consonant # Lo [8] PHAGS-PA LETTER TTA..PHAGS-PA LETTER ASPIRATED FA +A872 ; Consonant # Lo PHAGS-PA SUPERFIXED LETTER RA +A892..A8B3 ; Consonant # Lo [34] SAURASHTRA LETTER KA..SAURASHTRA LETTER LLA +A90A..A921 ; Consonant # Lo [24] KAYAH LI LETTER KA..KAYAH LI LETTER CA +A930..A946 ; Consonant # Lo [23] REJANG LETTER KA..REJANG LETTER A +A989..A98B ; Consonant # Lo [3] JAVANESE LETTER PA CEREK..JAVANESE 
LETTER NGA LELET RASWADI +A98F..A9B2 ; Consonant # Lo [36] JAVANESE LETTER KA..JAVANESE LETTER HA +A9E0..A9E4 ; Consonant # Lo [5] MYANMAR LETTER SHAN GHA..MYANMAR LETTER SHAN BHA +A9E7..A9EF ; Consonant # Lo [9] MYANMAR LETTER TAI LAING NYA..MYANMAR LETTER TAI LAING NNA +A9FA..A9FE ; Consonant # Lo [5] MYANMAR LETTER TAI LAING LLA..MYANMAR LETTER TAI LAING BHA +AA06..AA28 ; Consonant # Lo [35] CHAM LETTER KA..CHAM LETTER HA +AA60..AA6F ; Consonant # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA +AA71..AA73 ; Consonant # Lo [3] MYANMAR LETTER KHAMTI XA..MYANMAR LETTER KHAMTI RA +AA7A ; Consonant # Lo MYANMAR LETTER AITON RA +AA7E..AA7F ; Consonant # Lo [2] MYANMAR LETTER SHWE PALAUNG CHA..MYANMAR LETTER SHWE PALAUNG SHA +AA80..AAAF ; Consonant # Lo [48] TAI VIET LETTER LOW KO..TAI VIET LETTER HIGH O +AAE2..AAEA ; Consonant # Lo [9] MEETEI MAYEK LETTER CHA..MEETEI MAYEK LETTER SSA +ABC0..ABCD ; Consonant # Lo [14] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER HUK +ABD0 ; Consonant # Lo MEETEI MAYEK LETTER PHAM +ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTER BHAM +10A00 ; Consonant # Lo KHAROSHTHI LETTER A +10A10..10A13 ; Consonant # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA +10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA +10A19..10A35 ; Consonant # Lo [29] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER VHA +11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER OLD TAMIL NNNA +1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA +11107..11126 ; Consonant # Lo [32] CHAKMA LETTER KAA..CHAKMA LETTER HAA +11144 ; Consonant # Lo CHAKMA LETTER LHAA +11155..11172 ; Consonant # Lo [30] MAHAJANI LETTER KA..MAHAJANI LETTER RRA +11191..111B2 ; Consonant # Lo [34] SHARADA LETTER KA..SHARADA LETTER HA +11208..11211 ; Consonant # Lo [10] KHOJKI LETTER KA..KHOJKI LETTER JJA +11213..1122B ; Consonant # Lo [25] KHOJKI LETTER NYA..KHOJKI LETTER LLA +11284..11286 ; Consonant # Lo 
[3] MULTANI LETTER KA..MULTANI LETTER GA +11288 ; Consonant # Lo MULTANI LETTER GHA +1128A..1128D ; Consonant # Lo [4] MULTANI LETTER CA..MULTANI LETTER JJA +1128F..1129D ; Consonant # Lo [15] MULTANI LETTER NYA..MULTANI LETTER BA +1129F..112A8 ; Consonant # Lo [10] MULTANI LETTER BHA..MULTANI LETTER RHA +112BA..112DE ; Consonant # Lo [37] KHUDAWADI LETTER KA..KHUDAWADI LETTER HA +11315..11328 ; Consonant # Lo [20] GRANTHA LETTER KA..GRANTHA LETTER NA +1132A..11330 ; Consonant # Lo [7] GRANTHA LETTER PA..GRANTHA LETTER RA +11332..11333 ; Consonant # Lo [2] GRANTHA LETTER LA..GRANTHA LETTER LLA +11335..11339 ; Consonant # Lo [5] GRANTHA LETTER VA..GRANTHA LETTER HA +1140E..11434 ; Consonant # Lo [39] NEWA LETTER KA..NEWA LETTER HA +1148F..114AF ; Consonant # Lo [33] TIRHUTA LETTER KA..TIRHUTA LETTER HA +1158E..115AE ; Consonant # Lo [33] SIDDHAM LETTER KA..SIDDHAM LETTER HA +1160E..1162F ; Consonant # Lo [34] MODI LETTER KA..MODI LETTER LLA +1168A..116AA ; Consonant # Lo [33] TAKRI LETTER KA..TAKRI LETTER RRA +116B8 ; Consonant # Lo TAKRI LETTER ARCHAIC KHA +11700..1171A ; Consonant # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA +1180A..1182B ; Consonant # Lo [34] DOGRA LETTER KA..DOGRA LETTER RRA +119AE..119D0 ; Consonant # Lo [35] NANDINAGARI LETTER KA..NANDINAGARI LETTER RRA +11A0B..11A32 ; Consonant # Lo [40] ZANABAZAR SQUARE LETTER KA..ZANABAZAR SQUARE LETTER KSSA +11A5C..11A83 ; Consonant # Lo [40] SOYOMBO LETTER KA..SOYOMBO LETTER KSSA +11C0E..11C2E ; Consonant # Lo [33] BHAIKSUKI LETTER KA..BHAIKSUKI LETTER HA +11C72..11C8F ; Consonant # Lo [30] MARCHEN LETTER KA..MARCHEN LETTER A +11D0C..11D30 ; Consonant # Lo [37] MASARAM GONDI LETTER KA..MASARAM GONDI LETTER TRA +11D6C..11D89 ; Consonant # Lo [30] GUNJALA GONDI LETTER YA..GUNJALA GONDI LETTER SA +11EE0..11EF1 ; Consonant # Lo [18] MAKASAR LETTER KA..MAKASAR LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Dead + +# Dead Consonant (special consonant 
with killed vowel) + +# [Not derivable] + +09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0D54..0D56 ; Consonant_Dead # Lo [3] MALAYALAM LETTER CHILLU M..MALAYALAM LETTER CHILLU LLL +0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K +1CF2..1CF3 ; Consonant_Dead # Lo [2] VEDIC SIGN ARDHAVISARGA..VEDIC SIGN ROTATED ARDHAVISARGA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_With_Stacker + +# Consonants that may make stacked ligatures with the next consonant +# without the use of a virama + +# [Not derivable] + +0CF1..0CF2 ; Consonant_With_Stacker # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA +1CF5..1CF6 ; Consonant_With_Stacker # Lo [2] VEDIC SIGN JIHVAMULIYA..VEDIC SIGN UPADHMANIYA +11003..11004 ; Consonant_With_Stacker # Lo [2] BRAHMI SIGN JIHVAMULIYA..BRAHMI SIGN UPADHMANIYA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Prefixed + +# Cluster-initial consonants + +# [Not derivable] + +111C2..111C3 ; Consonant_Prefixed # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA +11A3A ; Consonant_Prefixed # Lo ZANABAZAR SQUARE CLUSTER-INITIAL LETTER RA +11A84..11A89 ; Consonant_Prefixed # Lo [6] SOYOMBO SIGN JIHVAMULIYA..SOYOMBO CLUSTER-INITIAL LETTER SA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Preceding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when preceding the main +# consonant. + +# [Not derivable] + +0D4E ; Consonant_Preceding_Repha # Lo MALAYALAM LETTER DOT REPH +11D46 ; Consonant_Preceding_Repha # Lo MASARAM GONDI REPHA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Initial_Postfixed + +# Consonants that succeed the main consonant in character sequences, but are +# pronounced before it. 
+ +# [Not derivable] + +1A5A ; Consonant_Initial_Postfixed # Mn TAI THAM CONSONANT SIGN LOW PA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Succeeding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when succeeding the main +# consonant. + +# [Not derivable] + +17CC ; Consonant_Succeeding_Repha # Mn KHMER SIGN ROBAT +1B03 ; Consonant_Succeeding_Repha # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Succeeding_Repha # Mn SUNDANESE SIGN PANGLAYAR +A982 ; Consonant_Succeeding_Repha # Mn JAVANESE SIGN LAYAR + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Subjoined + +# Subjoined Consonant (C2 form subtending a base consonant in Tibetan, etc.) + +# [Not derivable] + +0F8D..0F97 ; Consonant_Subjoined # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Consonant_Subjoined # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +1929..192B ; Consonant_Subjoined # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1A57 ; Consonant_Subjoined # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A5B..1A5E ; Consonant_Subjoined # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1BA1 ; Consonant_Subjoined # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA2..1BA3 ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BAC..1BAD ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C24..1C25 ; Consonant_Subjoined # Mc [2] LEPCHA SUBJOINED LETTER YA..LEPCHA SUBJOINED LETTER RA +A867..A868 ; Consonant_Subjoined # Lo [2] PHAGS-PA SUBJOINED LETTER WA..PHAGS-PA SUBJOINED LETTER YA +A871 ; Consonant_Subjoined # Lo PHAGS-PA SUBJOINED LETTER RA +11C92..11CA7 ; Consonant_Subjoined # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CA9 ; Consonant_Subjoined # Mc MARCHEN SUBJOINED LETTER YA 
+11CAA..11CAF ; Consonant_Subjoined # Mn [6] MARCHEN SUBJOINED LETTER RA..MARCHEN SUBJOINED LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Medial + +# Medial Consonant (medial liquid, occurring in clusters) + +# [Not derivable] + +0A75 ; Consonant_Medial # Mn GURMUKHI SIGN YAKASH +0EBC ; Consonant_Medial # Mn LAO SEMIVOWEL SIGN LO +0EBD ; Consonant_Medial # Lo LAO SEMIVOWEL SIGN NYO +103B..103C ; Consonant_Medial # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA +103D..103E ; Consonant_Medial # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +105E..1060 ; Consonant_Medial # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Consonant_Medial # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +1A55 ; Consonant_Medial # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A56 ; Consonant_Medial # Mn TAI THAM CONSONANT SIGN MEDIAL LA +A8B4 ; Consonant_Medial # Mc SAURASHTRA CONSONANT SIGN HAARU +A9BD ; Consonant_Medial # Mn JAVANESE CONSONANT SIGN KERET +A9BE..A9BF ; Consonant_Medial # Mc [2] JAVANESE CONSONANT SIGN PENGKAL..JAVANESE CONSONANT SIGN CAKRA +AA33..AA34 ; Consonant_Medial # Mc [2] CHAM CONSONANT SIGN YA..CHAM CONSONANT SIGN RA +AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +1171D..1171F ; Consonant_Medial # Mn [3] AHOM CONSONANT SIGN MEDIAL LA..AHOM CONSONANT SIGN MEDIAL LIGATING RA +11A3B..11A3E ; Consonant_Medial # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11D47 ; Consonant_Medial # Mn MASARAM GONDI RA-KARA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Final + +# Final Consonant (special final forms which do not take vowels) + +# [Not derivable] + +1930..1931 ; Consonant_Final # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Consonant_Final # Mc [6] LIMBU SMALL LETTER TA..LIMBU 
SMALL LETTER LA +1939 ; Consonant_Final # Mn LIMBU SIGN MUKPHRENG +19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B +1A58..1A59 ; Consonant_Final # Mn [2] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN FINAL NGA +1BBE..1BBF ; Consonant_Final # Lo [2] SUNDANESE LETTER FINAL K..SUNDANESE LETTER FINAL M +1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H +1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +A94F..A951 ; Consonant_Final # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A952 ; Consonant_Final # Mc REJANG CONSONANT SIGN H +AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG +AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG +AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS +AA4C ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL M +AA4D ; Consonant_Final # Mc CHAM CONSONANT SIGN FINAL H +ABDB..ABE2 ; Consonant_Final # Lo [8] MEETEI MAYEK LETTER KOK LONSUM..MEETEI MAYEK LETTER I LONSUM +11A8A..11A95 ; Consonant_Final # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Head_Letter + +# Head Letter (Tibetan) + +# [Not derivable] + +0F88..0F8C ; Consonant_Head_Letter # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN + +# ================================================ + +# Indic_Syllabic_Category=Modifying_Letter + +# Reanalyzed letters not participating in the abugida structure, but +# serving to modify the sound of an adjacent vowel or consonant. +# Note that this is not the same as General_Category=Modifier_Letter. 
+ +# [Not derivable] + +0B83 ; Modifying_Letter # Lo TAMIL SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Tone_Letter + +# Tone Letter (spacing lexical tone mark with status as a letter) + +# [Not derivable] + +1970..1974 ; Tone_Letter # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6 +AAC0 ; Tone_Letter # Lo TAI VIET TONE MAI NUENG +AAC2 ; Tone_Letter # Lo TAI VIET TONE MAI SONG + +# ================================================ + +# Indic_Syllabic_Category=Tone_Mark + +# Tone Mark (nonspacing or spacing lexical tone mark) + +# [Not derivable] + +0E48..0E4B ; Tone_Mark # Mn [4] THAI CHARACTER MAI EK..THAI CHARACTER MAI CHATTAWA +0EC8..0ECB ; Tone_Mark # Mn [4] LAO TONE MAI EK..LAO TONE MAI CATAWA +1037 ; Tone_Mark # Mn MYANMAR SIGN DOT BELOW +1063..1064 ; Tone_Mark # Mc [2] MYANMAR TONE MARK SGAW KAREN HATHI..MYANMAR TONE MARK SGAW KAREN KE PHO +1069..106D ; Tone_Mark # Mc [5] MYANMAR SIGN WESTERN PWO KAREN TONE-1..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1087..108C ; Tone_Mark # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108D ; Tone_Mark # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +108F ; Tone_Mark # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109B ; Tone_Mark # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 +19C8..19C9 ; Tone_Mark # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A75..1A79 ; Tone_Mark # Mn [5] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN TONE-5 +A92B..A92D ; Tone_Mark # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +AA7B ; Tone_Mark # Mc MYANMAR SIGN PAO KAREN TONE +AA7C ; Tone_Mark # Mn MYANMAR SIGN TAI LAING TONE-2 +AA7D ; Tone_Mark # Mc MYANMAR SIGN TAI LAING TONE-5 +AABF ; Tone_Mark # Mn TAI VIET TONE MAI EK +AAC1 ; Tone_Mark # Mn TAI VIET TONE MAI THO +ABEC ; Tone_Mark # Mc MEETEI MAYEK LUM IYEK + +# ================================================ + +# Indic_Syllabic_Category=Gemination_Mark + +# Gemination Mark (doubling of the 
preceding or following consonant) + +# [Not derivable] + +0A71 ; Gemination_Mark # Mn GURMUKHI ADDAK +11237 ; Gemination_Mark # Mn KHOJKI SIGN SHADDA +11A98 ; Gemination_Mark # Mn SOYOMBO GEMINATION MARK + +# ================================================ + +# Indic_Syllabic_Category=Cantillation_Mark + +# Cantillation Mark (recitation marks, such as svara markers for the Samaveda) + +# [Not derivable] + +0951..0952 ; Cantillation_Mark # Mn [2] DEVANAGARI STRESS SIGN UDATTA..DEVANAGARI STRESS SIGN ANUDATTA +0A51 ; Cantillation_Mark # Mn GURMUKHI SIGN UDAAT +0AFA..0AFC ; Cantillation_Mark # Mn [3] GUJARATI SIGN SUKUN..GUJARATI SIGN MADDAH +1CD0..1CD2 ; Cantillation_Mark # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CD4..1CE0 ; Cantillation_Mark # Mn [13] VEDIC SIGN YAJURVEDIC MIDLINE SVARITA..VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CE1 ; Cantillation_Mark # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF4 ; Cantillation_Mark # Mn VEDIC TONE CANDRA ABOVE +1CF7 ; Cantillation_Mark # Mc VEDIC SIGN ATIKRAMA +1CF8..1CF9 ; Cantillation_Mark # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE +20F0 ; Cantillation_Mark # Mn COMBINING ASTERISK ABOVE +A8E0..A8F1 ; Cantillation_Mark # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +1123E ; Cantillation_Mark # Mn KHOJKI SIGN SUKUN +11366..1136C ; Cantillation_Mark # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Cantillation_Mark # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA + +# ================================================ + +# Indic_Syllabic_Category=Register_Shifter + +# Register Shifter (shifts register for consonants, akin to a tone mark) + +# [Not derivable] + +17C9..17CA ; Register_Shifter # Mn [2] KHMER SIGN MUUSIKATOAN..KHMER SIGN TRIISAP + +# ================================================ + +# Indic_Syllabic_Category=Syllable_Modifier + +# Syllable Modifier (miscellaneous combining characters that 
modify +# something in the orthographic syllable they succeed) + +# [Not derivable] + +00B2..00B3 ; Syllable_Modifier # No [2] SUPERSCRIPT TWO..SUPERSCRIPT THREE +09FE ; Syllable_Modifier # Mn BENGALI SANDHI MARK +0F35 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0FC6 ; Syllable_Modifier # Mn TIBETAN SYMBOL PADMA GDAN +17CB ; Syllable_Modifier # Mn KHMER SIGN BANTOC +17CE..17D0 ; Syllable_Modifier # Mn [3] KHMER SIGN KAKABAT..KHMER SIGN SAMYOK SANNYA +17D3 ; Syllable_Modifier # Mn KHMER SIGN BATHAMASAT +17DD ; Syllable_Modifier # Mn KHMER SIGN ATTHACAN +193B ; Syllable_Modifier # Mn LIMBU SIGN SA-I +1A7B..1A7C ; Syllable_Modifier # Mn [2] TAI THAM SIGN MAI SAM..TAI THAM SIGN KHUEN-LUE KARAN +1A7F ; Syllable_Modifier # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1C36 ; Syllable_Modifier # Mn LEPCHA SIGN RAN +1DFB ; Syllable_Modifier # Mn COMBINING DELETION MARK +2074 ; Syllable_Modifier # No SUPERSCRIPT FOUR +2082..2084 ; Syllable_Modifier # No [3] SUBSCRIPT TWO..SUBSCRIPT FOUR +111C9 ; Syllable_Modifier # Mn SHARADA SANDHI MARK +1145E ; Syllable_Modifier # Mn NEWA SANDHI MARK +11A33 ; Syllable_Modifier # Mn ZANABAZAR SQUARE FINAL CONSONANT MARK + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Killer + +# Consonant Killer (signifies that the previous consonant or consonants are +# not pronounced) + +# [Not derivable] + +0E4C ; Consonant_Killer # Mn THAI CHARACTER THANTHAKHAT +17CD ; Consonant_Killer # Mn KHMER SIGN TOANDAKHIAT + +# ================================================ + +# Indic_Syllabic_Category=Non_Joiner + +# Non_Joiner (Zero Width Non-Joiner) + +# [Not derivable] + +200C ; Non_Joiner # Cf ZERO WIDTH NON-JOINER + +# ================================================ + +# Indic_Syllabic_Category=Joiner + +# Joiner (Zero Width Joiner) + +# [Not derivable] + +200D ; Joiner # Cf ZERO WIDTH JOINER + +# 
================================================ + +# Indic_Syllabic_Category=Number_Joiner + +# Number_Joiner (forms ligatures between numbers for multiplication) + +# [Not derivable] + +1107F ; Number_Joiner # Mn BRAHMI NUMBER JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number + +# Number (can be used as vowel-holders like consonant placeholders) +# Note: A number may even hold subjoined consonants which may in turn +# have been formed using a virama or a stacker, e.g. the sequence +# <U+1A93, U+1A60, U+1A34> where TAI THAM LETTER LOW TA is subjoined to +# TAI THAM THAM DIGIT THREE using an invisible stacker. + +# [Not derivable] + +0030..0039 ; Number # Nd [10] DIGIT ZERO..DIGIT NINE +0966..096F ; Number # Nd [10] DEVANAGARI DIGIT ZERO..DEVANAGARI DIGIT NINE +09E6..09EF ; Number # Nd [10] BENGALI DIGIT ZERO..BENGALI DIGIT NINE +0A66..0A6F ; Number # Nd [10] GURMUKHI DIGIT ZERO..GURMUKHI DIGIT NINE +0AE6..0AEF ; Number # Nd [10] GUJARATI DIGIT ZERO..GUJARATI DIGIT NINE +0B66..0B6F ; Number # Nd [10] ORIYA DIGIT ZERO..ORIYA DIGIT NINE +0BE6..0BEF ; Number # Nd [10] TAMIL DIGIT ZERO..TAMIL DIGIT NINE +0C66..0C6F ; Number # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE +0CE6..0CEF ; Number # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE +0D66..0D6F ; Number # Nd [10] MALAYALAM DIGIT ZERO..MALAYALAM DIGIT NINE +0DE6..0DEF ; Number # Nd [10] SINHALA LITH DIGIT ZERO..SINHALA LITH DIGIT NINE +0E50..0E59 ; Number # Nd [10] THAI DIGIT ZERO..THAI DIGIT NINE +0ED0..0ED9 ; Number # Nd [10] LAO DIGIT ZERO..LAO DIGIT NINE +0F20..0F29 ; Number # Nd [10] TIBETAN DIGIT ZERO..TIBETAN DIGIT NINE +0F2A..0F33 ; Number # No [10] TIBETAN DIGIT HALF ONE..TIBETAN DIGIT HALF ZERO +1040..1049 ; Number # Nd [10] MYANMAR DIGIT ZERO..MYANMAR DIGIT NINE +1090..1099 ; Number # Nd [10] MYANMAR SHAN DIGIT ZERO..MYANMAR SHAN DIGIT NINE +17E0..17E9 ; Number # Nd [10] KHMER DIGIT ZERO..KHMER DIGIT NINE +1946..194F ; Number # Nd [10] LIMBU DIGIT ZERO..LIMBU DIGIT NINE 
+19D0..19D9 ; Number # Nd [10] NEW TAI LUE DIGIT ZERO..NEW TAI LUE DIGIT NINE +19DA ; Number # No NEW TAI LUE THAM DIGIT ONE +1A80..1A89 ; Number # Nd [10] TAI THAM HORA DIGIT ZERO..TAI THAM HORA DIGIT NINE +1A90..1A99 ; Number # Nd [10] TAI THAM THAM DIGIT ZERO..TAI THAM THAM DIGIT NINE +1B50..1B59 ; Number # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE +1BB0..1BB9 ; Number # Nd [10] SUNDANESE DIGIT ZERO..SUNDANESE DIGIT NINE +1C40..1C49 ; Number # Nd [10] LEPCHA DIGIT ZERO..LEPCHA DIGIT NINE +A8D0..A8D9 ; Number # Nd [10] SAURASHTRA DIGIT ZERO..SAURASHTRA DIGIT NINE +A900..A909 ; Number # Nd [10] KAYAH LI DIGIT ZERO..KAYAH LI DIGIT NINE +A9D0..A9D9 ; Number # Nd [10] JAVANESE DIGIT ZERO..JAVANESE DIGIT NINE +A9F0..A9F9 ; Number # Nd [10] MYANMAR TAI LAING DIGIT ZERO..MYANMAR TAI LAING DIGIT NINE +AA50..AA59 ; Number # Nd [10] CHAM DIGIT ZERO..CHAM DIGIT NINE +ABF0..ABF9 ; Number # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE +10A40..10A48 ; Number # No [9] KHAROSHTHI DIGIT ONE..KHAROSHTHI FRACTION ONE HALF +11066..1106F ; Number # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11136..1113F ; Number # Nd [10] CHAKMA DIGIT ZERO..CHAKMA DIGIT NINE +111D0..111D9 ; Number # Nd [10] SHARADA DIGIT ZERO..SHARADA DIGIT NINE +111E1..111F4 ; Number # No [20] SINHALA ARCHAIC DIGIT ONE..SINHALA ARCHAIC NUMBER ONE THOUSAND +112F0..112F9 ; Number # Nd [10] KHUDAWADI DIGIT ZERO..KHUDAWADI DIGIT NINE +11450..11459 ; Number # Nd [10] NEWA DIGIT ZERO..NEWA DIGIT NINE +114D0..114D9 ; Number # Nd [10] TIRHUTA DIGIT ZERO..TIRHUTA DIGIT NINE +11650..11659 ; Number # Nd [10] MODI DIGIT ZERO..MODI DIGIT NINE +116C0..116C9 ; Number # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE +11730..11739 ; Number # Nd [10] AHOM DIGIT ZERO..AHOM DIGIT NINE +1173A..1173B ; Number # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY +11C50..11C59 ; Number # Nd [10] BHAIKSUKI DIGIT ZERO..BHAIKSUKI DIGIT NINE +11C5A..11C6C ; Number # No [19] BHAIKSUKI NUMBER ONE..BHAIKSUKI HUNDREDS UNIT MARK 
+11D50..11D59 ; Number # Nd [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE +11DA0..11DA9 ; Number # Nd [10] GUNJALA GONDI DIGIT ZERO..GUNJALA GONDI DIGIT NINE + +# ================================================ + +# Indic_Syllabic_Category=Brahmi_Joining_Number + +# Brahmi Joining Number (similar to Number in that it can be used as +# vowel-holders like Consonant_Placeholder, but may also be joined by +# a Number_Joiner of the same script, e.g. in Brahmi) + +# [Not derivable] + +11052..11065 ; Brahmi_Joining_Number # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND + +# EOF diff --git a/data/13.0.0-indic-positional-category.txt b/data/13.0.0-indic-positional-category.txt new file mode 100644 index 0000000..ee74dbe --- /dev/null +++ b/data/13.0.0-indic-positional-category.txt @@ -0,0 +1,790 @@ +# IndicPositionalCategory-13.0.0.txt +# Date: 2019-07-23, 00:01:00 GMT [KW, RP] +# © 2019 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Positional_Category enumerated property +# +# Scope: This property is aimed at the problem of +# the specification of syllabic structure for Indic scripts. +# Because dependent vowels (matras), visible viramas, and other +# characters are placed in notional slots around the consonant (or +# consonant cluster) core of an Indic syllable, there may be +# cooccurrence constraints or other interactions. Also, it may be +# desirable, in cases where more than one such character may occur in +# sequence, as for example, in a top slot and a bottom slot, to +# specify preferred orders for spelling. As such, this property +# is designed primarily to supplement the Indic_Syllabic_Category +# property. 
+# +# In addition to combining marks associated with Indic scripts, the +# Indic_Positional_Category has non-trivial values for special signs +# associated with Indic_Syllabic_Category=Consonant_Prefixed or +# Indic_Syllabic_Category=Consonant_Preceding_Repha. Those signs +# have General_Category=Lo, rather than being combining marks. +# They occur in initial position in syllabic structure. However, when +# rendered, they appear as marks positioned with respect to another +# base letter (usually above it). Hence, having an explicit value for +# Indic_Positional_Category for those signs can be helpful. +# +# Note that this property is *not* intended as +# a prescriptive property regarding display or font design, +# for a number of reasons. Good font design requires information +# that is outside the context of a character encoding standard, +# and is best handled in other venues. For Indic dependent +# vowels and similar characters, in particular: +# +# 1. Matra placement may vary somewhat based on typeface design. +# 2. Matra placement, even within a single script, may vary +# somewhat according to historic period or local conventions. +# 3. Matra placement may be changed by explicit orthographic reform +# decisions. +# 4. Matras may ligate in various ways with a consonant (or even +# other elements of a syllable) instead of occurring in a +# discrete location. +# 5. Matra display may be contextually determined. This is +# notable, for example, in the Tamil script, where the shape +# and placement of -u and -uu vowels depends strongly on +# which consonant they adjoin. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Positional_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. 
+# +# The scripts assessed as containing dependent vowels or similar characters +# in the structural sense used for the Indic_Positional_Category are the +# following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dives Akuru, Dogra, Grantha, Gujarati, +# Gunjala Gondi, Gurmukhi, Hanunoo, Javanese, Kaithi, Kannada, +# Kharoshthi, Khmer, Khojki, Khudawadi, Lao, Lepcha, Limbu, Makasar, +# Malayalam, Marchen, Masaram Gondi, Meetei Mayek, Modi, Myanmar, +# Nandinagari, Newa, New Tai Lue, Oriya, Rejang, Saurashtra, Sharada, +# Siddham, Sinhala, Soyombo, Sundanese, Syloti Nagri, Tagalog, +# Tagbanwa, Tai Tham, Tai Viet, Takri, Tamil, Telugu, Thai, Tibetan, +# Tirhuta, and Zanabazar Square. +# +# All characters for all other scripts not in that list +# take the default value for this property. +# +# See IndicSyllabicCategory.txt for a slightly more extended +# list of Indic scripts, including those which do not have +# positional characters. Currently, those additional +# Indic scripts without positional characters are +# Multani, Phags-pa, and Tai Le. +# +# Notes: +# +# 1. The following characters are all assigned the positional category Right, +# but may have different positions in some cases: +# * U+0BC1 TAMIL VOWEL SIGN U and U+0BC2 TAMIL VOWEL SIGN UU have +# contextually variable placement in Tamil. +# * U+0D41 MALAYALAM VOWEL SIGN U and U+0D42 MALAYALAM VOWEL SIGN UU form +# complex ligatures with consonants in older Malayalam orthography. +# * U+11341 GRANTHA VOWEL SIGN U and U+11342 GRANTHA VOWEL SIGN UU have +# contextually variable placement in Grantha. +# * U+11440 NEWA VOWEL SIGN O and U+11441 NEWA VOWEL SIGN AU have contextually +# variable placement in Newa. +# +# 2. The following characters are all assigned the positional category Top, +# but may have different positions in some cases: +# * U+1143E NEWA VOWEL SIGN E and U+1143F NEWA VOWEL SIGN AI have contextually +# variable placement in Newa. 
+# +# 3. The following characters are all assigned the positional category Bottom, +# but may have different positions in some cases: +# * U+102F MYANMAR VOWEL SIGN U and U+1030 MYANMAR VOWEL SIGN UU have +# contextually variable placement in Myanmar. +# * U+1A69 TAI THAM VOWEL SIGN U and U+1A6A TAI THAM VOWEL SIGN UU have +# contextually variable placement in Tai Tham. +# +# 4. The following character is assigned the positional category Left, but +# may have different positions in different styles: +# * U+119D2 NANDINAGARI VOWEL SIGN I has stylistically variable placement +# in Nandinagari. + + +# ================================================ + +# Property: Indic_Positional_Category +# +# All code points not explicitly listed for Indic_Positional_Category +# have the value NA (not applicable). +# +# @missing: 0000..10FFFF; NA + +# ------------------------------------------------ + +# Indic_Positional_Category=Right + +0903 ; Right # Mc DEVANAGARI SIGN VISARGA +093B ; Right # Mc DEVANAGARI VOWEL SIGN OOE +093E ; Right # Mc DEVANAGARI VOWEL SIGN AA +0940 ; Right # Mc DEVANAGARI VOWEL SIGN II +0949..094C ; Right # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094F ; Right # Mc DEVANAGARI VOWEL SIGN AW +0982..0983 ; Right # Mc [2] BENGALI SIGN ANUSVARA..BENGALI SIGN VISARGA +09BE ; Right # Mc BENGALI VOWEL SIGN AA +09C0 ; Right # Mc BENGALI VOWEL SIGN II +09D7 ; Right # Mc BENGALI AU LENGTH MARK +0A03 ; Right # Mc GURMUKHI SIGN VISARGA +0A3E ; Right # Mc GURMUKHI VOWEL SIGN AA +0A40 ; Right # Mc GURMUKHI VOWEL SIGN II +0A83 ; Right # Mc GUJARATI SIGN VISARGA +0ABE ; Right # Mc GUJARATI VOWEL SIGN AA +0AC0 ; Right # Mc GUJARATI VOWEL SIGN II +0ACB..0ACC ; Right # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0B02..0B03 ; Right # Mc [2] ORIYA SIGN ANUSVARA..ORIYA SIGN VISARGA +0B3E ; Right # Mc ORIYA VOWEL SIGN AA +0B40 ; Right # Mc ORIYA VOWEL SIGN II +0BBE..0BBF ; Right # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC1..0BC2 ; Right 
# Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BD7 ; Right # Mc TAMIL AU LENGTH MARK +0C01..0C03 ; Right # Mc [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN VISARGA +0C41..0C44 ; Right # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C82..0C83 ; Right # Mc [2] KANNADA SIGN ANUSVARA..KANNADA SIGN VISARGA +0CBE ; Right # Mc KANNADA VOWEL SIGN AA +0CC1..0CC4 ; Right # Mc [4] KANNADA VOWEL SIGN U..KANNADA VOWEL SIGN VOCALIC RR +0CD5..0CD6 ; Right # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0D02..0D03 ; Right # Mc [2] MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA +0D3E..0D40 ; Right # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D42 ; Right # Mn [2] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN UU +0D57 ; Right # Mc MALAYALAM AU LENGTH MARK +0D82..0D83 ; Right # Mc [2] SINHALA SIGN ANUSVARAYA..SINHALA SIGN VISARGAYA +0DCF..0DD1 ; Right # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD8 ; Right # Mc SINHALA VOWEL SIGN GAETTA-PILLA +0DDF ; Right # Mc SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Right # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Right # Lo THAI CHARACTER SARA A +0E32..0E33 ; Right # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E45 ; Right # Lo THAI CHARACTER LAKKHANGYAO +0EB0 ; Right # Lo LAO VOWEL SIGN A +0EB2..0EB3 ; Right # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0F3E ; Right # Mc TIBETAN SIGN YAR TSHES +0F7F ; Right # Mc TIBETAN SIGN RNAM BCAD +102B..102C ; Right # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +1038 ; Right # Mc MYANMAR SIGN VISARGA +103B ; Right # Mc MYANMAR CONSONANT SIGN MEDIAL YA +1056..1057 ; Right # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1062..1064 ; Right # Mc [3] MYANMAR VOWEL SIGN SGAW KAREN EU..MYANMAR TONE MARK SGAW KAREN KE PHO +1067..106D ; Right # Mc [7] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1083 ; Right # Mc 
MYANMAR VOWEL SIGN SHAN AA +1087..108C ; Right # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108F ; Right # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109C ; Right # Mc [3] MYANMAR SIGN KHAMTI TONE-1..MYANMAR VOWEL SIGN AITON A +17B6 ; Right # Mc KHMER VOWEL SIGN AA +17C7..17C8 ; Right # Mc [2] KHMER SIGN REAHMUK..KHMER SIGN YUUKALEAPINTU +1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI +1929..192B ; Right # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1930..1931 ; Right # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Right # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +19B0..19B4 ; Right # Lo [5] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN UU +19B8..19B9 ; Right # Lo [2] NEW TAI LUE VOWEL SIGN OA..NEW TAI LUE VOWEL SIGN UE +19BB..19C0 ; Right # Lo [6] NEW TAI LUE VOWEL SIGN AAY..NEW TAI LUE VOWEL SIGN IY +19C8..19C9 ; Right # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A1A ; Right # Mc BUGINESE VOWEL SIGN O +1A57 ; Right # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A61 ; Right # Mc TAI THAM VOWEL SIGN A +1A63..1A64 ; Right # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A6D ; Right # Mc TAI THAM VOWEL SIGN OY +1B04 ; Right # Mc BALINESE SIGN BISAH +1B35 ; Right # Mc BALINESE VOWEL SIGN TEDUNG +1B44 ; Right # Mc BALINESE ADEG ADEG +1B82 ; Right # Mc SUNDANESE SIGN PANGWISAD +1BA1 ; Right # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA7 ; Right # Mc SUNDANESE VOWEL SIGN PANOLONG +1BAA ; Right # Mc SUNDANESE SIGN PAMAAEH +1BE7 ; Right # Mc BATAK VOWEL SIGN E +1BEA..1BEC ; Right # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BEE ; Right # Mc BATAK VOWEL SIGN U +1BF2..1BF3 ; Right # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +1C24..1C26 ; Right # Mc [3] LEPCHA SUBJOINED LETTER YA..LEPCHA VOWEL SIGN AA +1C2A..1C2B ; Right # Mc [2] LEPCHA VOWEL SIGN U..LEPCHA VOWEL SIGN UU +1CE1 ; Right # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF7 
; Right # Mc VEDIC SIGN ATIKRAMA +A823..A824 ; Right # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A827 ; Right # Mc SYLOTI NAGRI VOWEL SIGN OO +A880..A881 ; Right # Mc [2] SAURASHTRA SIGN ANUSVARA..SAURASHTRA SIGN VISARGA +A8B4..A8C3 ; Right # Mc [16] SAURASHTRA CONSONANT SIGN HAARU..SAURASHTRA VOWEL SIGN AU +A952..A953 ; Right # Mc [2] REJANG CONSONANT SIGN H..REJANG VIRAMA +A983 ; Right # Mc JAVANESE SIGN WIGNYAN +A9B4..A9B5 ; Right # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +AA33 ; Right # Mc CHAM CONSONANT SIGN YA +AA4D ; Right # Mc CHAM CONSONANT SIGN FINAL H +AA7B ; Right # Mc MYANMAR SIGN PAO KAREN TONE +AA7D ; Right # Mc MYANMAR SIGN TAI LAING TONE-5 +AAB1 ; Right # Lo TAI VIET VOWEL AA +AABA ; Right # Lo TAI VIET VOWEL UA +AABD ; Right # Lo TAI VIET VOWEL AN +AAEF ; Right # Mc MEETEI MAYEK VOWEL SIGN AAU +AAF5 ; Right # Mc MEETEI MAYEK VOWEL SIGN VISARGA +ABE3..ABE4 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE6..ABE7 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE9..ABEA ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +ABEC ; Right # Mc MEETEI MAYEK LUM IYEK +11000 ; Right # Mc BRAHMI SIGN CANDRABINDU +11002 ; Right # Mc BRAHMI SIGN VISARGA +11082 ; Right # Mc KAITHI SIGN VISARGA +110B0 ; Right # Mc KAITHI VOWEL SIGN AA +110B2 ; Right # Mc KAITHI VOWEL SIGN II +110B7..110B8 ; Right # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11145..11146 ; Right # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +11182 ; Right # Mc SHARADA SIGN VISARGA +111B3 ; Right # Mc SHARADA VOWEL SIGN AA +111B5 ; Right # Mc SHARADA VOWEL SIGN II +111C0 ; Right # Mc SHARADA SIGN VIRAMA +1122C..1122E ; Right # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +11235 ; Right # Mc KHOJKI SIGN VIRAMA +112E0 ; Right # Mc KHUDAWADI VOWEL SIGN AA +112E2 ; Right # Mc KHUDAWADI VOWEL SIGN II +11302..11303 ; Right # Mc [2] GRANTHA SIGN 
ANUSVARA..GRANTHA SIGN VISARGA +1133E..1133F ; Right # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11341..11344 ; Right # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +1134D ; Right # Mc GRANTHA SIGN VIRAMA +11357 ; Right # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Right # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435 ; Right # Mc NEWA VOWEL SIGN AA +11437 ; Right # Mc NEWA VOWEL SIGN II +11440..11441 ; Right # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +11445 ; Right # Mc NEWA SIGN VISARGA +114B0 ; Right # Mc TIRHUTA VOWEL SIGN AA +114B2 ; Right # Mc TIRHUTA VOWEL SIGN II +114BD ; Right # Mc TIRHUTA VOWEL SIGN SHORT O +114C1 ; Right # Mc TIRHUTA SIGN VISARGA +115AF ; Right # Mc SIDDHAM VOWEL SIGN AA +115B1 ; Right # Mc SIDDHAM VOWEL SIGN II +115BE ; Right # Mc SIDDHAM SIGN VISARGA +11630..11632 ; Right # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +1163B..1163C ; Right # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +1163E ; Right # Mc MODI SIGN VISARGA +116AC ; Right # Mc TAKRI SIGN VISARGA +116AF ; Right # Mc TAKRI VOWEL SIGN II +116B6 ; Right # Mc TAKRI SIGN VIRAMA +11720..11721 ; Right # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +1182C ; Right # Mc DOGRA VOWEL SIGN AA +1182E ; Right # Mc DOGRA VOWEL SIGN II +11838 ; Right # Mc DOGRA SIGN VISARGA +11930..11934 ; Right # Mc [5] DIVES AKURU VOWEL SIGN AA..DIVES AKURU VOWEL SIGN UU +1193D ; Right # Mc DIVES AKURU SIGN HALANTA +11940 ; Right # Mc DIVES AKURU MEDIAL YA +119D1 ; Right # Mc NANDINAGARI VOWEL SIGN AA +119D3 ; Right # Mc NANDINAGARI VOWEL SIGN II +119DC..119DF ; Right # Mc [4] NANDINAGARI VOWEL SIGN O..NANDINAGARI SIGN VISARGA +11A39 ; Right # Mc ZANABAZAR SQUARE SIGN VISARGA +11A57..11A58 ; Right # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A97 ; Right # Mc SOYOMBO SIGN VISARGA +11C2F ; Right # Mc BHAIKSUKI VOWEL SIGN AA +11C3E ; Right # Mc BHAIKSUKI SIGN VISARGA +11CA9 ; Right # Mc MARCHEN SUBJOINED LETTER YA +11CB4 ; Right # Mc 
MARCHEN VOWEL SIGN O +11D46 ; Right # Lo MASARAM GONDI REPHA +11D8A..11D8E ; Right # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D93..11D94 ; Right # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11D96 ; Right # Mc GUNJALA GONDI SIGN VISARGA +11EF6 ; Right # Mc MAKASAR VOWEL SIGN O + +# Indic_Positional_Category=Left + +093F ; Left # Mc DEVANAGARI VOWEL SIGN I +094E ; Left # Mc DEVANAGARI VOWEL SIGN PRISHTHAMATRA E +09BF ; Left # Mc BENGALI VOWEL SIGN I +09C7..09C8 ; Left # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +0A3F ; Left # Mc GURMUKHI VOWEL SIGN I +0ABF ; Left # Mc GUJARATI VOWEL SIGN I +0B47 ; Left # Mc ORIYA VOWEL SIGN E +0BC6..0BC8 ; Left # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0D46..0D48 ; Left # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0DD9 ; Left # Mc SINHALA VOWEL SIGN KOMBUVA +0DDB ; Left # Mc SINHALA VOWEL SIGN KOMBU DEKA +0F3F ; Left # Mc TIBETAN SIGN MAR TSHES +1031 ; Left # Mc MYANMAR VOWEL SIGN E +1084 ; Left # Mc MYANMAR VOWEL SIGN SHAN E +17C1..17C3 ; Left # Mc [3] KHMER VOWEL SIGN E..KHMER VOWEL SIGN AI +1A19 ; Left # Mc BUGINESE VOWEL SIGN E +1A55 ; Left # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A6E..1A72 ; Left # Mc [5] TAI THAM VOWEL SIGN E..TAI THAM VOWEL SIGN THAM AI +1B3E..1B3F ; Left # Mc [2] BALINESE VOWEL SIGN TALING..BALINESE VOWEL SIGN TALING REPA +1BA6 ; Left # Mc SUNDANESE VOWEL SIGN PANAELAENG +1C27..1C28 ; Left # Mc [2] LEPCHA VOWEL SIGN I..LEPCHA VOWEL SIGN O +1C34..1C35 ; Left # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A9BA..A9BB ; Left # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +AA2F..AA30 ; Left # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA34 ; Left # Mc CHAM CONSONANT SIGN RA +AAEB ; Left # Mc MEETEI MAYEK VOWEL SIGN II +AAEE ; Left # Mc MEETEI MAYEK VOWEL SIGN AU +110B1 ; Left # Mc KAITHI VOWEL SIGN I +1112C ; Left # Mc CHAKMA VOWEL SIGN E +111B4 ; Left # Mc SHARADA VOWEL SIGN I +111CE ; Left # 
Mc SHARADA VOWEL SIGN PRISHTHAMATRA E +112E1 ; Left # Mc KHUDAWADI VOWEL SIGN I +11347..11348 ; Left # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +11436 ; Left # Mc NEWA VOWEL SIGN I +114B1 ; Left # Mc TIRHUTA VOWEL SIGN I +114B9 ; Left # Mc TIRHUTA VOWEL SIGN E +115B0 ; Left # Mc SIDDHAM VOWEL SIGN I +115B8 ; Left # Mc SIDDHAM VOWEL SIGN E +116AE ; Left # Mc TAKRI VOWEL SIGN I +11726 ; Left # Mc AHOM VOWEL SIGN E +1182D ; Left # Mc DOGRA VOWEL SIGN I +11935 ; Left # Mc DIVES AKURU VOWEL SIGN E +11937 ; Left # Mc DIVES AKURU VOWEL SIGN AI +119D2 ; Left # Mc NANDINAGARI VOWEL SIGN I +119E4 ; Left # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E +11CB1 ; Left # Mc MARCHEN VOWEL SIGN I +11EF5 ; Left # Mc MAKASAR VOWEL SIGN E + +# Indic_Positional_Category=Visual_Order_Left + +# These are dependent vowels that occur to the left of the consonant +# letter in a syllable, but which occur in scripts using the visual order +# model, instead of the logical order model. Because of the different +# model, these left-side vowels occur first in the backing store (before +# the consonant letter) and are not reordered during text rendering. 
+# +# [Derivation: Logical_Order_Exception=Yes] + +0E40..0E44 ; Visual_Order_Left # Lo [5] THAI CHARACTER SARA E..THAI CHARACTER SARA AI MAIMALAI +0EC0..0EC4 ; Visual_Order_Left # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +19B5..19B7 ; Visual_Order_Left # Lo [3] NEW TAI LUE VOWEL SIGN E..NEW TAI LUE VOWEL SIGN O +19BA ; Visual_Order_Left # Lo NEW TAI LUE VOWEL SIGN AY +AAB5..AAB6 ; Visual_Order_Left # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB9 ; Visual_Order_Left # Lo TAI VIET VOWEL UEA +AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL AY + +# Indic_Positional_Category=Left_And_Right + +09CB..09CC ; Left_And_Right # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +0B4B ; Left_And_Right # Mc ORIYA VOWEL SIGN O +0BCA..0BCC ; Left_And_Right # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0D4A..0D4C ; Left_And_Right # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0DDC ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA +0DDE ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA +17C0 ; Left_And_Right # Mc KHMER VOWEL SIGN IE +17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU +1B40..1B41 ; Left_And_Right # Mc [2] BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1134B..1134C ; Left_And_Right # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +114BC ; Left_And_Right # Mc TIRHUTA VOWEL SIGN O +114BE ; Left_And_Right # Mc TIRHUTA VOWEL SIGN AU +115BA ; Left_And_Right # Mc SIDDHAM VOWEL SIGN O +11938 ; Left_And_Right # Mc DIVES AKURU VOWEL SIGN O + +# Indic_Positional_Category=Top + +0900..0902 ; Top # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +093A ; Top # Mn DEVANAGARI VOWEL SIGN OE +0945..0948 ; Top # Mn [4] DEVANAGARI VOWEL SIGN CANDRA E..DEVANAGARI VOWEL SIGN AI +0951 ; Top # Mn DEVANAGARI STRESS SIGN UDATTA +0953..0955 ; Top # Mn [3] DEVANAGARI GRAVE ACCENT..DEVANAGARI VOWEL SIGN CANDRA LONG E +0981 ; Top # Mn 
BENGALI SIGN CANDRABINDU +09FE ; Top # Mn BENGALI SANDHI MARK +0A01..0A02 ; Top # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A47..0A48 ; Top # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Top # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0A70..0A71 ; Top # Mn [2] GURMUKHI TIPPI..GURMUKHI ADDAK +0A81..0A82 ; Top # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0AC5 ; Top # Mn GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Top # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AFA..0AFF ; Top # Mn [6] GUJARATI SIGN SUKUN..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B01 ; Top # Mn ORIYA SIGN CANDRABINDU +0B3F ; Top # Mn ORIYA VOWEL SIGN I +0B55..0B56 ; Top # Mn [2] ORIYA SIGN OVERLINE..ORIYA AI LENGTH MARK +0B82 ; Top # Mn TAMIL SIGN ANUSVARA +0BC0 ; Top # Mn TAMIL VOWEL SIGN II +0BCD ; Top # Mn TAMIL SIGN VIRAMA +0C00 ; Top # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C04 ; Top # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C3E..0C40 ; Top # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C46..0C47 ; Top # Mn [2] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN EE +0C4A..0C4D ; Top # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA +0C55 ; Top # Mn TELUGU LENGTH MARK +0C81 ; Top # Mn KANNADA SIGN CANDRABINDU +0CBF ; Top # Mn KANNADA VOWEL SIGN I +0CC6 ; Top # Mn KANNADA VOWEL SIGN E +0CCC..0CCD ; Top # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA +0D00..0D01 ; Top # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D3B..0D3C ; Top # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0D4D ; Top # Mn MALAYALAM SIGN VIRAMA +0D4E ; Top # Lo MALAYALAM LETTER DOT REPH +0D81 ; Top # Mn SINHALA SIGN CANDRABINDU +0DCA ; Top # Mn SINHALA SIGN AL-LAKUNA +0DD2..0DD3 ; Top # Mn [2] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN DIGA IS-PILLA +0E31 ; Top # Mn THAI CHARACTER MAI HAN-AKAT +0E34..0E37 ; Top # Mn [4] THAI CHARACTER SARA I..THAI CHARACTER SARA UEE +0E47..0E4E ; 
Top # Mn [8] THAI CHARACTER MAITAIKHU..THAI CHARACTER YAMAKKAN +0EB1 ; Top # Mn LAO VOWEL SIGN MAI KAN +0EB4..0EB7 ; Top # Mn [4] LAO VOWEL SIGN I..LAO VOWEL SIGN YY +0EBB ; Top # Mn LAO VOWEL SIGN MAI KON +0EC8..0ECD ; Top # Mn [6] LAO TONE MAI EK..LAO NIGGAHITA +0F39 ; Top # Mn TIBETAN MARK TSA -PHRU +0F72 ; Top # Mn TIBETAN VOWEL SIGN I +0F7A..0F7E ; Top # Mn [5] TIBETAN VOWEL SIGN E..TIBETAN SIGN RJES SU NGA RO +0F80 ; Top # Mn TIBETAN VOWEL SIGN REVERSED I +0F82..0F83 ; Top # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +0F86..0F87 ; Top # Mn [2] TIBETAN SIGN LCI RTAGS..TIBETAN SIGN YANG RTAGS +102D..102E ; Top # Mn [2] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN II +1032..1036 ; Top # Mn [5] MYANMAR VOWEL SIGN AI..MYANMAR SIGN ANUSVARA +103A ; Top # Mn MYANMAR SIGN ASAT +1071..1074 ; Top # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1085..1086 ; Top # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109D ; Top # Mn MYANMAR VOWEL SIGN AITON AI +1712 ; Top # Mn TAGALOG VOWEL SIGN I +1732 ; Top # Mn HANUNOO VOWEL SIGN I +1752 ; Top # Mn BUHID VOWEL SIGN I +1772 ; Top # Mn TAGBANWA VOWEL SIGN I +17B7..17BA ; Top # Mn [4] KHMER VOWEL SIGN I..KHMER VOWEL SIGN YY +17C6 ; Top # Mn KHMER SIGN NIKAHIT +17C9..17D1 ; Top # Mn [9] KHMER SIGN MUUSIKATOAN..KHMER SIGN VIRIAM +17D3 ; Top # Mn KHMER SIGN BATHAMASAT +17DD ; Top # Mn KHMER SIGN ATTHACAN +1920..1921 ; Top # Mn [2] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN I +1927..1928 ; Top # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Top # Mn LIMBU SIGN KEMPHRENG +1A17 ; Top # Mn BUGINESE VOWEL SIGN I +1A1B ; Top # Mn BUGINESE VOWEL SIGN AE +1A58..1A5A ; Top # Mn [3] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN LOW PA +1A62 ; Top # Mn TAI THAM VOWEL SIGN MAI SAT +1A65..1A68 ; Top # Mn [4] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN UUE +1A6B ; Top # Mn TAI THAM VOWEL SIGN O +1A73..1A7C ; Top # Mn [10] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN KHUEN-LUE 
KARAN +1B00..1B03 ; Top # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG +1B34 ; Top # Mn BALINESE SIGN REREKAN +1B36..1B37 ; Top # Mn [2] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN ULU SARI +1B42 ; Top # Mn BALINESE VOWEL SIGN PEPET +1B6B ; Top # Mn BALINESE MUSICAL SYMBOL COMBINING TEGEH +1B6D..1B73 ; Top # Mn [7] BALINESE MUSICAL SYMBOL COMBINING KEMPUL..BALINESE MUSICAL SYMBOL COMBINING GONG +1B80..1B81 ; Top # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR +1BA4 ; Top # Mn SUNDANESE VOWEL SIGN PANGHULU +1BA8..1BA9 ; Top # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE6 ; Top # Mn BATAK SIGN TOMPI +1BE8..1BE9 ; Top # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BED ; Top # Mn BATAK VOWEL SIGN KARO O +1BEF..1BF1 ; Top # Mn [3] BATAK VOWEL SIGN U FOR SIMALUNGUN SA..BATAK CONSONANT SIGN H +1C2D..1C33 ; Top # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +1C36 ; Top # Mn LEPCHA SIGN RAN +1CD0..1CD2 ; Top # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CDA..1CDB ; Top # Mn [2] VEDIC TONE DOUBLE SVARITA..VEDIC TONE TRIPLE SVARITA +1CE0 ; Top # Mn VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CF4 ; Top # Mn VEDIC TONE CANDRA ABOVE +1DFB ; Top # Mn COMBINING DELETION MARK +20F0 ; Top # Mn COMBINING ASTERISK ABOVE +A802 ; Top # Mn SYLOTI NAGRI SIGN DVISVARA +A806 ; Top # Mn SYLOTI NAGRI SIGN HASANTA +A80B ; Top # Mn SYLOTI NAGRI SIGN ANUSVARA +A826 ; Top # Mn SYLOTI NAGRI VOWEL SIGN E +A8C5 ; Top # Mn SAURASHTRA SIGN CANDRABINDU +A8E0..A8F1 ; Top # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +A8FF ; Top # Mn DEVANAGARI VOWEL SIGN AY +A94A ; Top # Mn REJANG VOWEL SIGN AI +A94F..A951 ; Top # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A980..A982 ; Top # Mn [3] JAVANESE SIGN PANYANGGA..JAVANESE SIGN LAYAR +A9B3 ; Top # Mn JAVANESE SIGN CECAK TELU +A9B6..A9B7 ; Top # Mn [2] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN WULU MELIK +A9BC ; Top # Mn JAVANESE 
VOWEL SIGN PEPET +A9E5 ; Top # Mn MYANMAR SIGN SHAN SAW +AA29..AA2C ; Top # Mn [4] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN EI +AA2E ; Top # Mn CHAM VOWEL SIGN OE +AA31 ; Top # Mn CHAM VOWEL SIGN AU +AA43 ; Top # Mn CHAM CONSONANT SIGN FINAL NG +AA4C ; Top # Mn CHAM CONSONANT SIGN FINAL M +AA7C ; Top # Mn MYANMAR SIGN TAI LAING TONE-2 +AAB0 ; Top # Mn TAI VIET MAI KANG +AAB2..AAB3 ; Top # Mn [2] TAI VIET VOWEL I..TAI VIET VOWEL UE +AAB7..AAB8 ; Top # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AABE..AABF ; Top # Mn [2] TAI VIET VOWEL AM..TAI VIET TONE MAI EK +AAC1 ; Top # Mn TAI VIET TONE MAI THO +AAED ; Top # Mn MEETEI MAYEK VOWEL SIGN AAI +ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP +10A05 ; Top # Mn KHAROSHTHI VOWEL SIGN E +10A0F ; Top # Mn KHAROSHTHI SIGN VISARGA +10A38 ; Top # Mn KHAROSHTHI SIGN BAR ABOVE +11001 ; Top # Mn BRAHMI SIGN ANUSVARA +11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II +11042..11046 ; Top # Mn [5] BRAHMI VOWEL SIGN E..BRAHMI VIRAMA +11080..11081 ; Top # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI VOWEL SIGN AI +11100..11102 ; Top # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA +11127..11129 ; Top # Mn [3] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN II +1112D ; Top # Mn CHAKMA VOWEL SIGN AI +11130 ; Top # Mn CHAKMA VOWEL SIGN OI +11134 ; Top # Mn CHAKMA MAAYYAA +11180..11181 ; Top # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +111BC..111BE ; Top # Mn [3] SHARADA VOWEL SIGN E..SHARADA VOWEL SIGN O +111C2..111C3 ; Top # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA +111CB ; Top # Mn SHARADA VOWEL MODIFIER MARK +111CF ; Top # Mn SHARADA SIGN INVERTED CANDRABINDU +11230..11231 ; Top # Mn [2] KHOJKI VOWEL SIGN E..KHOJKI VOWEL SIGN AI +11234 ; Top # Mn KHOJKI SIGN ANUSVARA +11236..11237 ; Top # Mn [2] KHOJKI SIGN NUKTA..KHOJKI SIGN SHADDA +1123E ; Top # Mn KHOJKI SIGN SUKUN +112DF ; Top # Mn KHUDAWADI SIGN ANUSVARA +112E5..112E8 ; Top # 
Mn [4] KHUDAWADI VOWEL SIGN E..KHUDAWADI VOWEL SIGN AU +11300..11301 ; Top # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11340 ; Top # Mn GRANTHA VOWEL SIGN II +11366..1136C ; Top # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Top # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA +1143E..1143F ; Top # Mn [2] NEWA VOWEL SIGN E..NEWA VOWEL SIGN AI +11443..11444 ; Top # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +1145E ; Top # Mn NEWA SANDHI MARK +114BA ; Top # Mn TIRHUTA VOWEL SIGN SHORT E +114BF..114C0 ; Top # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Top # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +11639..1163A ; Top # Mn [2] MODI VOWEL SIGN E..MODI VOWEL SIGN AI +1163D ; Top # Mn MODI SIGN ANUSVARA +11640 ; Top # Mn MODI SIGN ARDHACANDRA +116AB ; Top # Mn TAKRI SIGN ANUSVARA +116AD ; Top # Mn TAKRI VOWEL SIGN AA +116B2..116B5 ; Top # Mn [4] TAKRI VOWEL SIGN E..TAKRI VOWEL SIGN AU +1171F ; Top # Mn AHOM CONSONANT SIGN MEDIAL LIGATING RA +11722..11723 ; Top # Mn [2] AHOM VOWEL SIGN I..AHOM VOWEL SIGN II +11727 ; Top # Mn AHOM VOWEL SIGN AW +11729..1172B ; Top # Mn [3] AHOM VOWEL SIGN AI..AHOM SIGN KILLER +11833..11837 ; Top # Mn [5] DOGRA VOWEL SIGN E..DOGRA SIGN ANUSVARA +1193B..1193C ; Top # Mn [2] DIVES AKURU SIGN ANUSVARA..DIVES AKURU SIGN CANDRABINDU +1193F ; Top # Lo DIVES AKURU PREFIXED NASAL SIGN +11941 ; Top # Lo DIVES AKURU INITIAL RA +119DA..119DB ; Top # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI +11A01 ; Top # Mn ZANABAZAR SQUARE VOWEL SIGN I +11A04..11A09 ; Top # Mn [6] ZANABAZAR SQUARE VOWEL SIGN E..ZANABAZAR SQUARE VOWEL SIGN REVERSED I +11A35..11A38 ; Top # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A3A ; Top # Lo ZANABAZAR SQUARE CLUSTER-INITIAL LETTER RA +11A51 ; Top # Mn SOYOMBO VOWEL SIGN I +11A54..11A56 ; Top # Mn [3] SOYOMBO VOWEL SIGN E..SOYOMBO VOWEL SIGN OE 
+11A84..11A89 ; Top # Lo [6] SOYOMBO SIGN JIHVAMULIYA..SOYOMBO CLUSTER-INITIAL LETTER SA +11A96 ; Top # Mn SOYOMBO SIGN ANUSVARA +11A98 ; Top # Mn SOYOMBO GEMINATION MARK +11C30..11C31 ; Top # Mn [2] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN II +11C38..11C3D ; Top # Mn [6] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI SIGN ANUSVARA +11CB3 ; Top # Mn MARCHEN VOWEL SIGN E +11CB5..11CB6 ; Top # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D31..11D35 ; Top # Mn [5] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN UU +11D3A ; Top # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Top # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F..11D41 ; Top # Mn [3] MASARAM GONDI VOWEL SIGN AU..MASARAM GONDI SIGN VISARGA +11D43 ; Top # Mn MASARAM GONDI SIGN CANDRA +11D90..11D91 ; Top # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI +11D95 ; Top # Mn GUNJALA GONDI SIGN ANUSVARA +11EF3 ; Top # Mn MAKASAR VOWEL SIGN I + +# Indic_Positional_Category=Bottom + +093C ; Bottom # Mn DEVANAGARI SIGN NUKTA +0941..0944 ; Bottom # Mn [4] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN VOCALIC RR +094D ; Bottom # Mn DEVANAGARI SIGN VIRAMA +0952 ; Bottom # Mn DEVANAGARI STRESS SIGN ANUDATTA +0956..0957 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN UE..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BC ; Bottom # Mn BENGALI SIGN NUKTA +09C1..09C4 ; Bottom # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09CD ; Bottom # Mn BENGALI SIGN VIRAMA +09E2..09E3 ; Bottom # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3C ; Bottom # Mn GURMUKHI SIGN NUKTA +0A41..0A42 ; Bottom # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A4D ; Bottom # Mn GURMUKHI SIGN VIRAMA +0A51 ; Bottom # Mn GURMUKHI SIGN UDAAT +0A75 ; Bottom # Mn GURMUKHI SIGN YAKASH +0ABC ; Bottom # Mn GUJARATI SIGN NUKTA +0AC1..0AC4 ; Bottom # Mn [4] GUJARATI VOWEL SIGN U..GUJARATI VOWEL 
SIGN VOCALIC RR +0ACD ; Bottom # Mn GUJARATI SIGN VIRAMA +0AE2..0AE3 ; Bottom # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3C ; Bottom # Mn ORIYA SIGN NUKTA +0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B4D ; Bottom # Mn ORIYA SIGN VIRAMA +0B62..0B63 ; Bottom # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0C56 ; Bottom # Mn TELUGU AI LENGTH MARK +0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBC ; Bottom # Mn KANNADA SIGN NUKTA +0CE2..0CE3 ; Bottom # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D43..0D44 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC R..MALAYALAM VOWEL SIGN VOCALIC RR +0D62..0D63 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DD4 ; Bottom # Mn SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Bottom # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0E38..0E3A ; Bottom # Mn [3] THAI CHARACTER SARA U..THAI CHARACTER PHINTHU +0EB8..0EBA ; Bottom # Mn [3] LAO VOWEL SIGN U..LAO SIGN PALI VIRAMA +0EBC ; Bottom # Mn LAO SEMIVOWEL SIGN LO +0F18..0F19 ; Bottom # Mn [2] TIBETAN ASTROLOGICAL SIGN -KHYUD PA..TIBETAN ASTROLOGICAL SIGN SDONG TSHUGS +0F35 ; Bottom # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Bottom # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0F71 ; Bottom # Mn TIBETAN VOWEL SIGN AA +0F74..0F75 ; Bottom # Mn [2] TIBETAN VOWEL SIGN U..TIBETAN VOWEL SIGN UU +0F84 ; Bottom # Mn TIBETAN MARK HALANTA +0F8D..0F97 ; Bottom # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Bottom # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +0FC6 ; Bottom # Mn TIBETAN SYMBOL PADMA GDAN +102F..1030 ; Bottom # Mn [2] MYANMAR VOWEL SIGN U..MYANMAR VOWEL SIGN UU +1037 ; Bottom # Mn MYANMAR SIGN DOT BELOW +103D..103E ; Bottom # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +1058..1059 ; Bottom # Mn [2] MYANMAR VOWEL 
SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +105E..1060 ; Bottom # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Bottom # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +108D ; Bottom # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +1713..1714 ; Bottom # Mn [2] TAGALOG VOWEL SIGN U..TAGALOG SIGN VIRAMA +1733..1734 ; Bottom # Mn [2] HANUNOO VOWEL SIGN U..HANUNOO SIGN PAMUDPOD +1753 ; Bottom # Mn BUHID VOWEL SIGN U +1773 ; Bottom # Mn TAGBANWA VOWEL SIGN U +17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA +1922 ; Bottom # Mn LIMBU VOWEL SIGN U +1932 ; Bottom # Mn LIMBU SMALL LETTER ANUSVARA +1939 ; Bottom # Mn LIMBU SIGN MUKPHRENG +193B ; Bottom # Mn LIMBU SIGN SA-I +1A18 ; Bottom # Mn BUGINESE VOWEL SIGN U +1A56 ; Bottom # Mn TAI THAM CONSONANT SIGN MEDIAL LA +1A5B..1A5E ; Bottom # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1A69..1A6A ; Bottom # Mn [2] TAI THAM VOWEL SIGN U..TAI THAM VOWEL SIGN UU +1A6C ; Bottom # Mn TAI THAM VOWEL SIGN OA BELOW +1A7F ; Bottom # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1B38..1B3A ; Bottom # Mn [3] BALINESE VOWEL SIGN SUKU..BALINESE VOWEL SIGN RA REPA +1B6C ; Bottom # Mn BALINESE MUSICAL SYMBOL COMBINING ENDEP +1BA2..1BA3 ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BA5 ; Bottom # Mn SUNDANESE VOWEL SIGN PANYUKU +1BAC..1BAD ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C2C ; Bottom # Mn LEPCHA VOWEL SIGN E +1C37 ; Bottom # Mn LEPCHA SIGN NUKTA +1CD5..1CD9 ; Bottom # Mn [5] VEDIC TONE YAJURVEDIC AGGRAVATED INDEPENDENT SVARITA..VEDIC TONE YAJURVEDIC KATHAKA INDEPENDENT SVARITA SCHROEDER +1CDC..1CDF ; Bottom # Mn [4] VEDIC TONE KATHAKA ANUDATTA..VEDIC TONE THREE DOTS BELOW +1CED ; Bottom # Mn VEDIC SIGN TIRYAK +A825 ; Bottom # Mn SYLOTI NAGRI VOWEL SIGN U +A82C ; Bottom # Mn SYLOTI NAGRI SIGN ALTERNATE HASANTA +A8C4 ; Bottom # Mn SAURASHTRA SIGN VIRAMA 
+A92B..A92D ; Bottom # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +A947..A949 ; Bottom # Mn [3] REJANG VOWEL SIGN I..REJANG VOWEL SIGN E +A94B..A94E ; Bottom # Mn [4] REJANG VOWEL SIGN O..REJANG VOWEL SIGN EA +A9B8..A9B9 ; Bottom # Mn [2] JAVANESE VOWEL SIGN SUKU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BD ; Bottom # Mn JAVANESE CONSONANT SIGN KERET +AA2D ; Bottom # Mn CHAM VOWEL SIGN U +AA32 ; Bottom # Mn CHAM VOWEL SIGN UE +AA35..AA36 ; Bottom # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +AAB4 ; Bottom # Mn TAI VIET VOWEL U +AAEC ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UU +ABE8 ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK +10A02..10A03 ; Bottom # Mn [2] KHAROSHTHI VOWEL SIGN U..KHAROSHTHI VOWEL SIGN VOCALIC R +10A0C..10A0E ; Bottom # Mn [3] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN ANUSVARA +10A39..10A3A ; Bottom # Mn [2] KHAROSHTHI SIGN CAUDA..KHAROSHTHI SIGN DOT BELOW +1103C..11041 ; Bottom # Mn [6] BRAHMI VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL +110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU +110B9..110BA ; Bottom # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +1112A..1112B ; Bottom # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU +11131..11132 ; Bottom # Mn [2] CHAKMA O MARK..CHAKMA AU MARK +11173 ; Bottom # Mn MAHAJANI SIGN NUKTA +111B6..111BB ; Bottom # Mn [6] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN VOCALIC LL +111C9..111CA ; Bottom # Mn [2] SHARADA SANDHI MARK..SHARADA SIGN NUKTA +111CC ; Bottom # Mn SHARADA EXTRA SHORT VOWEL MARK +1122F ; Bottom # Mn KHOJKI VOWEL SIGN U +112E3..112E4 ; Bottom # Mn [2] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN UU +112E9..112EA ; Bottom # Mn [2] KHUDAWADI SIGN NUKTA..KHUDAWADI SIGN VIRAMA +1133B..1133C ; Bottom # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +11438..1143D ; Bottom # Mn [6] NEWA VOWEL SIGN U..NEWA VOWEL SIGN VOCALIC LL +11442 ; Bottom # Mn NEWA SIGN VIRAMA +11446 ; Bottom # Mn NEWA SIGN NUKTA +114B3..114B8 ; 
Bottom # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114C2..114C3 ; Bottom # Mn [2] TIRHUTA SIGN VIRAMA..TIRHUTA SIGN NUKTA +115B2..115B5 ; Bottom # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115BF..115C0 ; Bottom # Mn [2] SIDDHAM SIGN VIRAMA..SIDDHAM SIGN NUKTA +115DC..115DD ; Bottom # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11633..11638 ; Bottom # Mn [6] MODI VOWEL SIGN U..MODI VOWEL SIGN VOCALIC LL +1163F ; Bottom # Mn MODI SIGN VIRAMA +116B0..116B1 ; Bottom # Mn [2] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN UU +116B7 ; Bottom # Mn TAKRI SIGN NUKTA +1171D ; Bottom # Mn AHOM CONSONANT SIGN MEDIAL LA +11724..11725 ; Bottom # Mn [2] AHOM VOWEL SIGN U..AHOM VOWEL SIGN UU +11728 ; Bottom # Mn AHOM VOWEL SIGN O +1182F..11832 ; Bottom # Mn [4] DOGRA VOWEL SIGN U..DOGRA VOWEL SIGN VOCALIC RR +11839..1183A ; Bottom # Mn [2] DOGRA SIGN VIRAMA..DOGRA SIGN NUKTA +11943 ; Bottom # Mn DIVES AKURU SIGN NUKTA +119D4..119D7 ; Bottom # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR +119E0 ; Bottom # Mn NANDINAGARI SIGN VIRAMA +11A02..11A03 ; Bottom # Mn [2] ZANABAZAR SQUARE VOWEL SIGN UE..ZANABAZAR SQUARE VOWEL SIGN U +11A0A ; Bottom # Mn ZANABAZAR SQUARE VOWEL LENGTH MARK +11A33..11A34 ; Bottom # Mn [2] ZANABAZAR SQUARE FINAL CONSONANT MARK..ZANABAZAR SQUARE SIGN VIRAMA +11A3B..11A3E ; Bottom # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11A52..11A53 ; Bottom # Mn [2] SOYOMBO VOWEL SIGN UE..SOYOMBO VOWEL SIGN U +11A59..11A5B ; Bottom # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11A8A..11A95 ; Bottom # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A +11C32..11C36 ; Bottom # Mn [5] BHAIKSUKI VOWEL SIGN U..BHAIKSUKI VOWEL SIGN VOCALIC L +11C3F ; Bottom # Mn BHAIKSUKI SIGN VIRAMA +11C92..11CA7 ; Bottom # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CAA..11CB0 ; Bottom # Mn [7] MARCHEN 
SUBJOINED LETTER RA..MARCHEN VOWEL SIGN AA +11CB2 ; Bottom # Mn MARCHEN VOWEL SIGN U +11D36 ; Bottom # Mn MASARAM GONDI VOWEL SIGN VOCALIC R +11D42 ; Bottom # Mn MASARAM GONDI SIGN NUKTA +11D44 ; Bottom # Mn MASARAM GONDI SIGN HALANTA +11D47 ; Bottom # Mn MASARAM GONDI RA-KARA +11EF4 ; Bottom # Mn MAKASAR VOWEL SIGN U + +# Indic_Positional_Category=Top_And_Bottom + +0C48 ; Top_And_Bottom # Mn TELUGU VOWEL SIGN AI +0F73 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN II +0F76..0F79 ; Top_And_Bottom # Mn [4] TIBETAN VOWEL SIGN VOCALIC R..TIBETAN VOWEL SIGN VOCALIC LL +0F81 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN REVERSED II +1B3C ; Top_And_Bottom # Mn BALINESE VOWEL SIGN LA LENGA +1112E..1112F ; Top_And_Bottom # Mn [2] CHAKMA VOWEL SIGN O..CHAKMA VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Right + +0AC9 ; Top_And_Right # Mc GUJARATI VOWEL SIGN CANDRA O +0B57 ; Top_And_Right # Mc ORIYA AU LENGTH MARK +0CC0 ; Top_And_Right # Mc KANNADA VOWEL SIGN II +0CC7..0CC8 ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +1925..1926 ; Top_And_Right # Mc [2] LIMBU VOWEL SIGN OO..LIMBU VOWEL SIGN AU +1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG +111BF ; Top_And_Right # Mc SHARADA VOWEL SIGN AU +11232..11233 ; Top_And_Right # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Left + +0B48 ; Top_And_Left # Mc ORIYA VOWEL SIGN AI +0DDA ; Top_And_Left # Mc SINHALA VOWEL SIGN DIGA KOMBUVA +17BE ; Top_And_Left # Mc KHMER VOWEL SIGN OE +1C29 ; Top_And_Left # Mc LEPCHA VOWEL SIGN OO +114BB ; Top_And_Left # Mc TIRHUTA VOWEL SIGN AI +115B9 ; Top_And_Left # Mc SIDDHAM VOWEL SIGN AI + +# Indic_Positional_Category=Top_And_Left_And_Right + +0B4C ; Top_And_Left_And_Right # Mc ORIYA VOWEL SIGN AU +0DDD ; Top_And_Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA +17BF ; Top_And_Left_And_Right # Mc KHMER VOWEL SIGN YA +115BB ; 
Top_And_Left_And_Right # Mc SIDDHAM VOWEL SIGN AU + +# Indic_Positional_Category=Bottom_And_Right + +1B3B ; Bottom_And_Right # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +A9BE ; Bottom_And_Right # Mc JAVANESE CONSONANT SIGN PENGKAL +A9C0 ; Bottom_And_Right # Mc JAVANESE PANGKON +11942 ; Bottom_And_Right # Mc DIVES AKURU MEDIAL RA + +# Indic_Positional_Category=Bottom_And_Left + +A9BF ; Bottom_And_Left # Mc JAVANESE CONSONANT SIGN CAKRA + +# Indic_Positional_Category=Top_And_Bottom_And_Right + +1B3D ; Top_And_Bottom_And_Right # Mc BALINESE VOWEL SIGN LA LENGA TEDUNG + +# Indic_Positional_Category=Top_And_Bottom_And_Left + +103C ; Top_And_Bottom_And_Left # Mc MYANMAR CONSONANT SIGN MEDIAL RA +1171E ; Top_And_Bottom_And_Left # Mn AHOM CONSONANT SIGN MEDIAL RA + +# Indic_Positional_Category=Overstruck + +1CD4 ; Overstruck # Mn VEDIC SIGN YAJURVEDIC MIDLINE SVARITA +1CE2..1CE8 ; Overstruck # Mn [7] VEDIC SIGN VISARGA SVARITA..VEDIC SIGN VISARGA ANUDATTA WITH TAIL +10A01 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN I +10A06 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN O + +# EOF diff --git a/data/13.0.0-indic-syllabic-category.txt b/data/13.0.0-indic-syllabic-category.txt new file mode 100644 index 0000000..8297578 --- /dev/null +++ b/data/13.0.0-indic-syllabic-category.txt @@ -0,0 +1,1310 @@ +# IndicSyllabicCategory-13.0.0.txt +# Date: 2019-07-22, 19:55:00 GMT [KW, RP] +# © 2019 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Syllabic_Category enumerated property +# +# Scope: This property is aimed at two general problem +# areas involving the analysis and processing of Indic scripts: +# +# 1. Specification of syllabic structure. +# 2. Specification of segmentation rules. 
+# +# Both of these problem areas may benefit from having defined subtypes +# of Indic script characters which are relevant to how Indic +# syllables (or aksaras) are constructed. Note that rules for +# syllabic structure in Indic scripts may differ significantly +# from how phonological syllables are defined. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Syllabic_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. +# +# The scripts assessed as Indic in the structural sense used for the +# Indic_Syllabic_Category are the following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dives Akuru, Dogra, Grantha, Gujarati, +# Gunjala Gondi, Gurmukhi, Hanunoo, Javanese, Kaithi, Kannada, +# Kayah Li, Kharoshthi, Khmer, Khojki, Khudawadi, Lao, Lepcha, Limbu, +# Mahajani, Makasar, Malayalam, Marchen, Masaram Gondi, Meetei Mayek, +# Modi, Multani, Myanmar, Nandinagari, Newa, New Tai Lue, Oriya, +# Phags-pa, Rejang, Saurashtra, Sharada, Siddham, Sinhala, Soyombo, +# Sundanese, Syloti Nagri, Tagalog, Tagbanwa, Tai Le, Tai Tham, +# Tai Viet, Takri, Tamil, Telugu, Thai, Tibetan, Tirhuta, and +# Zanabazar Square. +# +# All characters for all other scripts not in that list +# take the default value for this property, unless they +# are individually listed in this data file. +# + +# ================================================ + +# Property: Indic_Syllabic_Category +# +# All code points not explicitly listed for Indic_Syllabic_Category +# have the value Other. 
+# +# @missing: 0000..10FFFF; Other + +# ================================================ + +# Indic_Syllabic_Category=Bindu + +# Bindu/Anusvara (nasalization or -n) + +# [Not derivable] + +0900..0902 ; Bindu # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +0981 ; Bindu # Mn BENGALI SIGN CANDRABINDU +0982 ; Bindu # Mc BENGALI SIGN ANUSVARA +09FC ; Bindu # Lo BENGALI LETTER VEDIC ANUSVARA +0A01..0A02 ; Bindu # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A70 ; Bindu # Mn GURMUKHI TIPPI +0A81..0A82 ; Bindu # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0B01 ; Bindu # Mn ORIYA SIGN CANDRABINDU +0B02 ; Bindu # Mc ORIYA SIGN ANUSVARA +0B82 ; Bindu # Mn TAMIL SIGN ANUSVARA +0C00 ; Bindu # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C01..0C02 ; Bindu # Mc [2] TELUGU SIGN CANDRABINDU..TELUGU SIGN ANUSVARA +0C04 ; Bindu # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C80 ; Bindu # Lo KANNADA SIGN SPACING CANDRABINDU +0C81 ; Bindu # Mn KANNADA SIGN CANDRABINDU +0C82 ; Bindu # Mc KANNADA SIGN ANUSVARA +0D00..0D01 ; Bindu # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D02 ; Bindu # Mc MALAYALAM SIGN ANUSVARA +0D04 ; Bindu # Lo MALAYALAM LETTER VEDIC ANUSVARA +0D81 ; Bindu # Mn SINHALA SIGN CANDRABINDU +0D82 ; Bindu # Mc SINHALA SIGN ANUSVARAYA +0E4D ; Bindu # Mn THAI CHARACTER NIKHAHIT +0ECD ; Bindu # Mn LAO NIGGAHITA +0F7E ; Bindu # Mn TIBETAN SIGN RJES SU NGA RO +0F82..0F83 ; Bindu # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +1036 ; Bindu # Mn MYANMAR SIGN ANUSVARA +17C6 ; Bindu # Mn KHMER SIGN NIKAHIT +1932 ; Bindu # Mn LIMBU SMALL LETTER ANUSVARA +1A74 ; Bindu # Mn TAI THAM SIGN MAI KANG +1B00..1B02 ; Bindu # Mn [3] BALINESE SIGN ULU RICEM..BALINESE SIGN CECEK +1B80 ; Bindu # Mn SUNDANESE SIGN PANYECEK +1C34..1C35 ; Bindu # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A80B ; Bindu # Mn SYLOTI NAGRI SIGN ANUSVARA +A873 ; Bindu # Lo PHAGS-PA LETTER CANDRABINDU 
+A880 ; Bindu # Mc SAURASHTRA SIGN ANUSVARA +A8C5 ; Bindu # Mn SAURASHTRA SIGN CANDRABINDU +A8F2..A8F3 ; Bindu # Lo [2] DEVANAGARI SIGN SPACING CANDRABINDU..DEVANAGARI SIGN CANDRABINDU VIRAMA +A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK +10A0E ; Bindu # Mn KHAROSHTHI SIGN ANUSVARA +11000 ; Bindu # Mc BRAHMI SIGN CANDRABINDU +11001 ; Bindu # Mn BRAHMI SIGN ANUSVARA +11080..11081 ; Bindu # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +11100..11101 ; Bindu # Mn [2] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN ANUSVARA +11180..11181 ; Bindu # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +111CF ; Bindu # Mn SHARADA SIGN INVERTED CANDRABINDU +11234 ; Bindu # Mn KHOJKI SIGN ANUSVARA +112DF ; Bindu # Mn KHUDAWADI SIGN ANUSVARA +11300..11301 ; Bindu # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11302 ; Bindu # Mc GRANTHA SIGN ANUSVARA +1135E..1135F ; Bindu # Lo [2] GRANTHA LETTER VEDIC ANUSVARA..GRANTHA LETTER VEDIC DOUBLE ANUSVARA +11443..11444 ; Bindu # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +1145F ; Bindu # Lo NEWA LETTER VEDIC ANUSVARA +114BF..114C0 ; Bindu # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Bindu # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +1163D ; Bindu # Mn MODI SIGN ANUSVARA +116AB ; Bindu # Mn TAKRI SIGN ANUSVARA +11837 ; Bindu # Mn DOGRA SIGN ANUSVARA +1193B..1193C ; Bindu # Mn [2] DIVES AKURU SIGN ANUSVARA..DIVES AKURU SIGN CANDRABINDU +119DE ; Bindu # Mc NANDINAGARI SIGN ANUSVARA +11A35..11A38 ; Bindu # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A96 ; Bindu # Mn SOYOMBO SIGN ANUSVARA +11C3C..11C3D ; Bindu # Mn [2] BHAIKSUKI SIGN CANDRABINDU..BHAIKSUKI SIGN ANUSVARA +11CB5..11CB6 ; Bindu # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D40 ; Bindu # Mn MASARAM GONDI SIGN ANUSVARA +11D95 ; Bindu # Mn GUNJALA GONDI SIGN ANUSVARA + +# ================================================ + +# 
Indic_Syllabic_Category=Visarga + +# Visarga (-h) +# Excludes letters for jihvamuliya and upadhmaniya, which are +# related, but structured somewhat differently. + +# [Not derivable] + +0903 ; Visarga # Mc DEVANAGARI SIGN VISARGA +0983 ; Visarga # Mc BENGALI SIGN VISARGA +0A03 ; Visarga # Mc GURMUKHI SIGN VISARGA +0A83 ; Visarga # Mc GUJARATI SIGN VISARGA +0B03 ; Visarga # Mc ORIYA SIGN VISARGA +0C03 ; Visarga # Mc TELUGU SIGN VISARGA +0C83 ; Visarga # Mc KANNADA SIGN VISARGA +0D03 ; Visarga # Mc MALAYALAM SIGN VISARGA +0D83 ; Visarga # Mc SINHALA SIGN VISARGAYA +0F7F ; Visarga # Mc TIBETAN SIGN RNAM BCAD +1038 ; Visarga # Mc MYANMAR SIGN VISARGA +17C7 ; Visarga # Mc KHMER SIGN REAHMUK +1B04 ; Visarga # Mc BALINESE SIGN BISAH +1B82 ; Visarga # Mc SUNDANESE SIGN PANGWISAD +A881 ; Visarga # Mc SAURASHTRA SIGN VISARGA +A983 ; Visarga # Mc JAVANESE SIGN WIGNYAN +AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA +10A0F ; Visarga # Mn KHAROSHTHI SIGN VISARGA +11002 ; Visarga # Mc BRAHMI SIGN VISARGA +11082 ; Visarga # Mc KAITHI SIGN VISARGA +11102 ; Visarga # Mn CHAKMA SIGN VISARGA +11182 ; Visarga # Mc SHARADA SIGN VISARGA +11303 ; Visarga # Mc GRANTHA SIGN VISARGA +11445 ; Visarga # Mc NEWA SIGN VISARGA +114C1 ; Visarga # Mc TIRHUTA SIGN VISARGA +115BE ; Visarga # Mc SIDDHAM SIGN VISARGA +1163E ; Visarga # Mc MODI SIGN VISARGA +116AC ; Visarga # Mc TAKRI SIGN VISARGA +11838 ; Visarga # Mc DOGRA SIGN VISARGA +119DF ; Visarga # Mc NANDINAGARI SIGN VISARGA +11A39 ; Visarga # Mc ZANABAZAR SQUARE SIGN VISARGA +11A97 ; Visarga # Mc SOYOMBO SIGN VISARGA +11C3E ; Visarga # Mc BHAIKSUKI SIGN VISARGA +11D41 ; Visarga # Mn MASARAM GONDI SIGN VISARGA +11D96 ; Visarga # Mc GUNJALA GONDI SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Avagraha + +# Avagraha (elision of initial a- in sandhi) + +# [Not derivable] + +093D ; Avagraha # Lo DEVANAGARI SIGN AVAGRAHA +09BD ; Avagraha # Lo BENGALI SIGN AVAGRAHA +0ABD ; Avagraha # Lo GUJARATI 
SIGN AVAGRAHA +0B3D ; Avagraha # Lo ORIYA SIGN AVAGRAHA +0C3D ; Avagraha # Lo TELUGU SIGN AVAGRAHA +0CBD ; Avagraha # Lo KANNADA SIGN AVAGRAHA +0D3D ; Avagraha # Lo MALAYALAM SIGN AVAGRAHA +0F85 ; Avagraha # Po TIBETAN MARK PALUTA +17DC ; Avagraha # Lo KHMER SIGN AVAKRAHASANYA +1BBA ; Avagraha # Lo SUNDANESE AVAGRAHA +111C1 ; Avagraha # Lo SHARADA SIGN AVAGRAHA +1133D ; Avagraha # Lo GRANTHA SIGN AVAGRAHA +11447 ; Avagraha # Lo NEWA SIGN AVAGRAHA +114C4 ; Avagraha # Lo TIRHUTA SIGN AVAGRAHA +119E1 ; Avagraha # Lo NANDINAGARI SIGN AVAGRAHA +11A9D ; Avagraha # Lo SOYOMBO MARK PLUTA +11C40 ; Avagraha # Lo BHAIKSUKI SIGN AVAGRAHA + +# ================================================ + +# Indic_Syllabic_Category=Nukta + +# Nukta (diacritic for borrowed consonants or other consonant +# modifications). Note that while the resulting sound is typically a +# consonant, the base letter a nukta follows may be an independent +# vowel. For example, is used to transcribe ARABIC LETTER +# AIN. + +# [Not derivable] + +093C ; Nukta # Mn DEVANAGARI SIGN NUKTA +09BC ; Nukta # Mn BENGALI SIGN NUKTA +0A3C ; Nukta # Mn GURMUKHI SIGN NUKTA +0ABC ; Nukta # Mn GUJARATI SIGN NUKTA +0AFD..0AFF ; Nukta # Mn [3] GUJARATI SIGN THREE-DOT NUKTA ABOVE..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0CBC ; Nukta # Mn KANNADA SIGN NUKTA +0F39 ; Nukta # Mn TIBETAN MARK TSA -PHRU +1B34 ; Nukta # Mn BALINESE SIGN REREKAN +1BE6 ; Nukta # Mn BATAK SIGN TOMPI +1C37 ; Nukta # Mn LEPCHA SIGN NUKTA +A9B3 ; Nukta # Mn JAVANESE SIGN CECAK TELU +10A38..10A3A ; Nukta # Mn [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW +110BA ; Nukta # Mn KAITHI SIGN NUKTA +11173 ; Nukta # Mn MAHAJANI SIGN NUKTA +111CA ; Nukta # Mn SHARADA SIGN NUKTA +11236 ; Nukta # Mn KHOJKI SIGN NUKTA +112E9 ; Nukta # Mn KHUDAWADI SIGN NUKTA +1133B..1133C ; Nukta # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +11446 ; Nukta # Mn NEWA SIGN NUKTA +114C3 ; Nukta # Mn TIRHUTA SIGN NUKTA +115C0 ; Nukta # Mn 
SIDDHAM SIGN NUKTA +116B7 ; Nukta # Mn TAKRI SIGN NUKTA +1183A ; Nukta # Mn DOGRA SIGN NUKTA +11943 ; Nukta # Mn DIVES AKURU SIGN NUKTA +11D42 ; Nukta # Mn MASARAM GONDI SIGN NUKTA + +# ================================================ + +# Indic_Syllabic_Category=Virama + +# Virama (killing of inherent vowel in consonant sequence +# or consonant stacker) +# Only includes characters that can act both as visible killer viramas +# and consonant stackers. Separate property values exist for characters +# that can only act as pure killers or only as consonant stackers. + +# [Derivation: (ccc=9) - (InSC=Pure_Killer) - (InSC=Invisible_Stacker) +# - (InSC=Number_Joiner) - 2D7F] + +094D ; Virama # Mn DEVANAGARI SIGN VIRAMA +09CD ; Virama # Mn BENGALI SIGN VIRAMA +0A4D ; Virama # Mn GURMUKHI SIGN VIRAMA +0ACD ; Virama # Mn GUJARATI SIGN VIRAMA +0B4D ; Virama # Mn ORIYA SIGN VIRAMA +0BCD ; Virama # Mn TAMIL SIGN VIRAMA +0C4D ; Virama # Mn TELUGU SIGN VIRAMA +0CCD ; Virama # Mn KANNADA SIGN VIRAMA +0D4D ; Virama # Mn MALAYALAM SIGN VIRAMA +0DCA ; Virama # Mn SINHALA SIGN AL-LAKUNA +1B44 ; Virama # Mc BALINESE ADEG ADEG +A806 ; Virama # Mn SYLOTI NAGRI SIGN HASANTA +A8C4 ; Virama # Mn SAURASHTRA SIGN VIRAMA +A9C0 ; Virama # Mc JAVANESE PANGKON +11046 ; Virama # Mn BRAHMI VIRAMA +110B9 ; Virama # Mn KAITHI SIGN VIRAMA +111C0 ; Virama # Mc SHARADA SIGN VIRAMA +11235 ; Virama # Mc KHOJKI SIGN VIRAMA +1134D ; Virama # Mc GRANTHA SIGN VIRAMA +11442 ; Virama # Mn NEWA SIGN VIRAMA +114C2 ; Virama # Mn TIRHUTA SIGN VIRAMA +115BF ; Virama # Mn SIDDHAM SIGN VIRAMA +1163F ; Virama # Mn MODI SIGN VIRAMA +116B6 ; Virama # Mc TAKRI SIGN VIRAMA +11839 ; Virama # Mn DOGRA SIGN VIRAMA +119E0 ; Virama # Mn NANDINAGARI SIGN VIRAMA +11C3F ; Virama # Mn BHAIKSUKI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Pure_Killer + +# Pure killer (killing of inherent vowel in consonant sequence, +# with no consonant stacking behavior) + +# [Not derivable] + 
+0D3B..0D3C ; Pure_Killer # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0E3A ; Pure_Killer # Mn THAI CHARACTER PHINTHU +0E4E ; Pure_Killer # Mn THAI CHARACTER YAMAKKAN +0EBA ; Pure_Killer # Mn LAO SIGN PALI VIRAMA +0F84 ; Pure_Killer # Mn TIBETAN MARK HALANTA +103A ; Pure_Killer # Mn MYANMAR SIGN ASAT +1714 ; Pure_Killer # Mn TAGALOG SIGN VIRAMA +1734 ; Pure_Killer # Mn HANUNOO SIGN PAMUDPOD +17D1 ; Pure_Killer # Mn KHMER SIGN VIRIAM +1A7A ; Pure_Killer # Mn TAI THAM SIGN RA HAAM +1BAA ; Pure_Killer # Mc SUNDANESE SIGN PAMAAEH +1BF2..1BF3 ; Pure_Killer # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +A82C ; Pure_Killer # Mn SYLOTI NAGRI SIGN ALTERNATE HASANTA +A953 ; Pure_Killer # Mc REJANG VIRAMA +ABED ; Pure_Killer # Mn MEETEI MAYEK APUN IYEK +11134 ; Pure_Killer # Mn CHAKMA MAAYYAA +112EA ; Pure_Killer # Mn KHUDAWADI SIGN VIRAMA +1172B ; Pure_Killer # Mn AHOM SIGN KILLER +1193D ; Pure_Killer # Mc DIVES AKURU SIGN HALANTA +11A34 ; Pure_Killer # Mn ZANABAZAR SQUARE SIGN VIRAMA +11D44 ; Pure_Killer # Mn MASARAM GONDI SIGN HALANTA + +# ================================================ + +# Indic_Syllabic_Category=Invisible_Stacker + +# Invisible stacker (invisible consonant stacker virama). +# +# Note that in some scripts, such as Kharoshthi and Masaram Gondi, an invisible +# stacker may have a second function, changing the shape and/or location of the +# consonant preceding it, even when there is no consonant following the +# invisible stacker. 
+ +# [Not derivable] + +1039 ; Invisible_Stacker # Mn MYANMAR SIGN VIRAMA +17D2 ; Invisible_Stacker # Mn KHMER SIGN COENG +1A60 ; Invisible_Stacker # Mn TAI THAM SIGN SAKOT +1BAB ; Invisible_Stacker # Mn SUNDANESE SIGN VIRAMA +AAF6 ; Invisible_Stacker # Mn MEETEI MAYEK VIRAMA +10A3F ; Invisible_Stacker # Mn KHAROSHTHI VIRAMA +11133 ; Invisible_Stacker # Mn CHAKMA VIRAMA +1193E ; Invisible_Stacker # Mn DIVES AKURU VIRAMA +11A47 ; Invisible_Stacker # Mn ZANABAZAR SQUARE SUBJOINER +11A99 ; Invisible_Stacker # Mn SOYOMBO SUBJOINER +11D45 ; Invisible_Stacker # Mn MASARAM GONDI VIRAMA +11D97 ; Invisible_Stacker # Mn GUNJALA GONDI VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Independent + +# Independent Vowels (contrasted with matras) + +# [Not derivable] + +0904..0914 ; Vowel_Independent # Lo [17] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER AU +0960..0961 ; Vowel_Independent # Lo [2] DEVANAGARI LETTER VOCALIC RR..DEVANAGARI LETTER VOCALIC LL +0972..0977 ; Vowel_Independent # Lo [6] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER UUE +0985..098C ; Vowel_Independent # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L +098F..0990 ; Vowel_Independent # Lo [2] BENGALI LETTER E..BENGALI LETTER AI +0993..0994 ; Vowel_Independent # Lo [2] BENGALI LETTER O..BENGALI LETTER AU +09E0..09E1 ; Vowel_Independent # Lo [2] BENGALI LETTER VOCALIC RR..BENGALI LETTER VOCALIC LL +0A05..0A0A ; Vowel_Independent # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU +0A0F..0A10 ; Vowel_Independent # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI +0A13..0A14 ; Vowel_Independent # Lo [2] GURMUKHI LETTER OO..GURMUKHI LETTER AU +0A85..0A8D ; Vowel_Independent # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E +0A8F..0A91 ; Vowel_Independent # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O +0A93..0A94 ; Vowel_Independent # Lo [2] GUJARATI LETTER O..GUJARATI LETTER AU +0AE0..0AE1 ; Vowel_Independent # Lo [2] GUJARATI LETTER VOCALIC RR..GUJARATI LETTER 
VOCALIC LL +0B05..0B0C ; Vowel_Independent # Lo [8] ORIYA LETTER A..ORIYA LETTER VOCALIC L +0B0F..0B10 ; Vowel_Independent # Lo [2] ORIYA LETTER E..ORIYA LETTER AI +0B13..0B14 ; Vowel_Independent # Lo [2] ORIYA LETTER O..ORIYA LETTER AU +0B60..0B61 ; Vowel_Independent # Lo [2] ORIYA LETTER VOCALIC RR..ORIYA LETTER VOCALIC LL +0B85..0B8A ; Vowel_Independent # Lo [6] TAMIL LETTER A..TAMIL LETTER UU +0B8E..0B90 ; Vowel_Independent # Lo [3] TAMIL LETTER E..TAMIL LETTER AI +0B92..0B94 ; Vowel_Independent # Lo [3] TAMIL LETTER O..TAMIL LETTER AU +0C05..0C0C ; Vowel_Independent # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L +0C0E..0C10 ; Vowel_Independent # Lo [3] TELUGU LETTER E..TELUGU LETTER AI +0C12..0C14 ; Vowel_Independent # Lo [3] TELUGU LETTER O..TELUGU LETTER AU +0C60..0C61 ; Vowel_Independent # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL +0C85..0C8C ; Vowel_Independent # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L +0C8E..0C90 ; Vowel_Independent # Lo [3] KANNADA LETTER E..KANNADA LETTER AI +0C92..0C94 ; Vowel_Independent # Lo [3] KANNADA LETTER O..KANNADA LETTER AU +0CE0..0CE1 ; Vowel_Independent # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL +0D05..0D0C ; Vowel_Independent # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L +0D0E..0D10 ; Vowel_Independent # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI +0D12..0D14 ; Vowel_Independent # Lo [3] MALAYALAM LETTER O..MALAYALAM LETTER AU +0D5F..0D61 ; Vowel_Independent # Lo [3] MALAYALAM LETTER ARCHAIC II..MALAYALAM LETTER VOCALIC LL +0D85..0D96 ; Vowel_Independent # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA +1021..102A ; Vowel_Independent # Lo [10] MYANMAR LETTER A..MYANMAR LETTER AU +1052..1055 ; Vowel_Independent # Lo [4] MYANMAR LETTER VOCALIC R..MYANMAR LETTER VOCALIC LL +1700..1702 ; Vowel_Independent # Lo [3] TAGALOG LETTER A..TAGALOG LETTER U +1720..1722 ; Vowel_Independent # Lo [3] HANUNOO LETTER A..HANUNOO LETTER U +1740..1742 ; Vowel_Independent # Lo 
[3] BUHID LETTER A..BUHID LETTER U +1760..1762 ; Vowel_Independent # Lo [3] TAGBANWA LETTER A..TAGBANWA LETTER U +17A3..17B3 ; Vowel_Independent # Lo [17] KHMER INDEPENDENT VOWEL QAQ..KHMER INDEPENDENT VOWEL QAU +1A4D..1A52 ; Vowel_Independent # Lo [6] TAI THAM LETTER I..TAI THAM LETTER OO +1B05..1B12 ; Vowel_Independent # Lo [14] BALINESE LETTER AKARA..BALINESE LETTER OKARA TEDUNG +1B83..1B89 ; Vowel_Independent # Lo [7] SUNDANESE LETTER A..SUNDANESE LETTER EU +1BE4..1BE5 ; Vowel_Independent # Lo [2] BATAK LETTER I..BATAK LETTER U +A800..A801 ; Vowel_Independent # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I +A803..A805 ; Vowel_Independent # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O +A882..A891 ; Vowel_Independent # Lo [16] SAURASHTRA LETTER A..SAURASHTRA LETTER AU +A8FE ; Vowel_Independent # Lo DEVANAGARI LETTER AY +A984..A988 ; Vowel_Independent # Lo [5] JAVANESE LETTER A..JAVANESE LETTER U +A98C..A98E ; Vowel_Independent # Lo [3] JAVANESE LETTER E..JAVANESE LETTER O +AA00..AA05 ; Vowel_Independent # Lo [6] CHAM LETTER A..CHAM LETTER O +AAE0..AAE1 ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER E..MEETEI MAYEK LETTER O +ABCE..ABCF ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER UN..MEETEI MAYEK LETTER I +ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA +11005..11012 ; Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU +11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER A..KAITHI LETTER AU +11103..11106 ; Vowel_Independent # Lo [4] CHAKMA LETTER AA..CHAKMA LETTER E +11183..11190 ; Vowel_Independent # Lo [14] SHARADA LETTER A..SHARADA LETTER AU +11200..11207 ; Vowel_Independent # Lo [8] KHOJKI LETTER A..KHOJKI LETTER AU +11280..11283 ; Vowel_Independent # Lo [4] MULTANI LETTER A..MULTANI LETTER E +112B0..112B9 ; Vowel_Independent # Lo [10] KHUDAWADI LETTER A..KHUDAWADI LETTER AU +11305..1130C ; Vowel_Independent # Lo [8] GRANTHA LETTER A..GRANTHA LETTER VOCALIC L +1130F..11310 ; Vowel_Independent # Lo [2] GRANTHA LETTER 
EE..GRANTHA LETTER AI +11313..11314 ; Vowel_Independent # Lo [2] GRANTHA LETTER OO..GRANTHA LETTER AU +11360..11361 ; Vowel_Independent # Lo [2] GRANTHA LETTER VOCALIC RR..GRANTHA LETTER VOCALIC LL +11400..1140D ; Vowel_Independent # Lo [14] NEWA LETTER A..NEWA LETTER AU +11481..1148E ; Vowel_Independent # Lo [14] TIRHUTA LETTER A..TIRHUTA LETTER AU +11580..1158D ; Vowel_Independent # Lo [14] SIDDHAM LETTER A..SIDDHAM LETTER AU +115D8..115DB ; Vowel_Independent # Lo [4] SIDDHAM LETTER THREE-CIRCLE ALTERNATE I..SIDDHAM LETTER ALTERNATE U +11600..1160D ; Vowel_Independent # Lo [14] MODI LETTER A..MODI LETTER AU +11680..11689 ; Vowel_Independent # Lo [10] TAKRI LETTER A..TAKRI LETTER AU +11800..11809 ; Vowel_Independent # Lo [10] DOGRA LETTER A..DOGRA LETTER AU +11900..11906 ; Vowel_Independent # Lo [7] DIVES AKURU LETTER A..DIVES AKURU LETTER E +11909 ; Vowel_Independent # Lo DIVES AKURU LETTER O +119A0..119A7 ; Vowel_Independent # Lo [8] NANDINAGARI LETTER A..NANDINAGARI LETTER VOCALIC RR +119AA..119AD ; Vowel_Independent # Lo [4] NANDINAGARI LETTER E..NANDINAGARI LETTER AU +11A00 ; Vowel_Independent # Lo ZANABAZAR SQUARE LETTER A +11A50 ; Vowel_Independent # Lo SOYOMBO LETTER A +11C00..11C08 ; Vowel_Independent # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L +11C0A..11C0D ; Vowel_Independent # Lo [4] BHAIKSUKI LETTER E..BHAIKSUKI LETTER AU +11D00..11D06 ; Vowel_Independent # Lo [7] MASARAM GONDI LETTER A..MASARAM GONDI LETTER E +11D08..11D09 ; Vowel_Independent # Lo [2] MASARAM GONDI LETTER AI..MASARAM GONDI LETTER O +11D0B ; Vowel_Independent # Lo MASARAM GONDI LETTER AU +11D60..11D65 ; Vowel_Independent # Lo [6] GUNJALA GONDI LETTER A..GUNJALA GONDI LETTER UU +11D67..11D68 ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER EE..GUNJALA GONDI LETTER AI +11D6A..11D6B ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER OO..GUNJALA GONDI LETTER AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Dependent + +# Dependent 
Vowels (contrasted with independent vowels and/or with +# complex placement). Known as matras in Indic scripts. Also +# includes vowel modifiers that follow dependent (and sometimes +# independent) vowels. + +# [Not derivable] + +093A ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN OE +093B ; Vowel_Dependent # Mc DEVANAGARI VOWEL SIGN OOE +093E..0940 ; Vowel_Dependent # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II +0941..0948 ; Vowel_Dependent # Mn [8] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN AI +0949..094C ; Vowel_Dependent # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094E..094F ; Vowel_Dependent # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA E..DEVANAGARI VOWEL SIGN AW +0955..0957 ; Vowel_Dependent # Mn [3] DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Vowel_Dependent # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BE..09C0 ; Vowel_Dependent # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II +09C1..09C4 ; Vowel_Dependent # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09C7..09C8 ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +09CB..09CC ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +09D7 ; Vowel_Dependent # Mc BENGALI AU LENGTH MARK +09E2..09E3 ; Vowel_Dependent # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3E..0A40 ; Vowel_Dependent # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II +0A41..0A42 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A47..0A48 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0ABE..0AC0 ; Vowel_Dependent # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL SIGN II +0AC1..0AC5 ; Vowel_Dependent # Mn [5] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN 
E..GUJARATI VOWEL SIGN AI +0AC9 ; Vowel_Dependent # Mc GUJARATI VOWEL SIGN CANDRA O +0ACB..0ACC ; Vowel_Dependent # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0AE2..0AE3 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3E ; Vowel_Dependent # Mc ORIYA VOWEL SIGN AA +0B3F ; Vowel_Dependent # Mn ORIYA VOWEL SIGN I +0B40 ; Vowel_Dependent # Mc ORIYA VOWEL SIGN II +0B41..0B44 ; Vowel_Dependent # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B47..0B48 ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI +0B4B..0B4C ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU +0B55..0B56 ; Vowel_Dependent # Mn [2] ORIYA SIGN OVERLINE..ORIYA AI LENGTH MARK +0B57 ; Vowel_Dependent # Mc ORIYA AU LENGTH MARK +0B62..0B63 ; Vowel_Dependent # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BBE..0BBF ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC0 ; Vowel_Dependent # Mn TAMIL VOWEL SIGN II +0BC1..0BC2 ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BC6..0BC8 ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0BCA..0BCC ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0BD7 ; Vowel_Dependent # Mc TAMIL AU LENGTH MARK +0C3E..0C40 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C41..0C44 ; Vowel_Dependent # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C46..0C48 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI +0C4A..0C4C ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C55..0C56 ; Vowel_Dependent # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK +0C62..0C63 ; Vowel_Dependent # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBE ; Vowel_Dependent # Mc KANNADA VOWEL SIGN AA +0CBF ; Vowel_Dependent # Mn KANNADA VOWEL SIGN I +0CC0..0CC4 ; Vowel_Dependent # Mc [5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN 
VOCALIC RR +0CC6 ; Vowel_Dependent # Mn KANNADA VOWEL SIGN E +0CC7..0CC8 ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +0CCC ; Vowel_Dependent # Mn KANNADA VOWEL SIGN AU +0CD5..0CD6 ; Vowel_Dependent # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CE2..0CE3 ; Vowel_Dependent # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D3E..0D40 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D44 ; Vowel_Dependent # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D46..0D48 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0D4A..0D4C ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0D57 ; Vowel_Dependent # Mc MALAYALAM AU LENGTH MARK +0D62..0D63 ; Vowel_Dependent # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DCF..0DD1 ; Vowel_Dependent # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD2..0DD4 ; Vowel_Dependent # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Vowel_Dependent # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0DD8..0DDF ; Vowel_Dependent # Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Vowel_Dependent # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Vowel_Dependent # Lo THAI CHARACTER SARA A +0E31 ; Vowel_Dependent # Mn THAI CHARACTER MAI HAN-AKAT +0E32..0E33 ; Vowel_Dependent # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E34..0E39 ; Vowel_Dependent # Mn [6] THAI CHARACTER SARA I..THAI CHARACTER SARA UU +0E40..0E45 ; Vowel_Dependent # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO +0E47 ; Vowel_Dependent # Mn THAI CHARACTER MAITAIKHU +0EB0 ; Vowel_Dependent # Lo LAO VOWEL SIGN A +0EB1 ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KAN +0EB2..0EB3 
; Vowel_Dependent # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0EB4..0EB9 ; Vowel_Dependent # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU +0EBB ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KON +0EC0..0EC4 ; Vowel_Dependent # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +0F71..0F7D ; Vowel_Dependent # Mn [13] TIBETAN VOWEL SIGN AA..TIBETAN VOWEL SIGN OO +0F80..0F81 ; Vowel_Dependent # Mn [2] TIBETAN VOWEL SIGN REVERSED I..TIBETAN VOWEL SIGN REVERSED II +102B..102C ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +102D..1030 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN UU +1031 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN E +1032..1035 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +1056..1057 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1058..1059 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1062 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1071..1074 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1083..1084 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E +1085..1086 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109C ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN AITON A +109D ; Vowel_Dependent # Mn MYANMAR VOWEL SIGN AITON AI +1712..1713 ; Vowel_Dependent # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U +1732..1733 ; Vowel_Dependent # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1752..1753 ; Vowel_Dependent # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U +1772..1773 ; Vowel_Dependent # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U +17B6 ; Vowel_Dependent # Mc KHMER VOWEL SIGN AA +17B7..17BD ; Vowel_Dependent # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL 
SIGN UA +17BE..17C5 ; Vowel_Dependent # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU +17C8 ; Vowel_Dependent # Mc KHMER SIGN YUUKALEAPINTU +1920..1922 ; Vowel_Dependent # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U +1923..1926 ; Vowel_Dependent # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU +1927..1928 ; Vowel_Dependent # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Vowel_Dependent # Mn LIMBU SIGN KEMPHRENG +19B0..19C0 ; Vowel_Dependent # Lo [17] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN IY +1A17..1A18 ; Vowel_Dependent # Mn [2] BUGINESE VOWEL SIGN I..BUGINESE VOWEL SIGN U +1A19..1A1A ; Vowel_Dependent # Mc [2] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN O +1A1B ; Vowel_Dependent # Mn BUGINESE VOWEL SIGN AE +1A61 ; Vowel_Dependent # Mc TAI THAM VOWEL SIGN A +1A62 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN MAI SAT +1A63..1A64 ; Vowel_Dependent # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A65..1A6C ; Vowel_Dependent # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW +1A6D..1A72 ; Vowel_Dependent # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI +1A73 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN OA ABOVE +1B35 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN TEDUNG +1B36..1B3A ; Vowel_Dependent # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA +1B3B ; Vowel_Dependent # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +1B3C ; Vowel_Dependent # Mn BALINESE VOWEL SIGN LA LENGA +1B3D..1B41 ; Vowel_Dependent # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1B42 ; Vowel_Dependent # Mn BALINESE VOWEL SIGN PEPET +1B43 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN PEPET TEDUNG +1BA4..1BA5 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PANGHULU..SUNDANESE VOWEL SIGN PANYUKU +1BA6..1BA7 ; Vowel_Dependent # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL SIGN PANOLONG +1BA8..1BA9 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG 
+1BE7 ; Vowel_Dependent # Mc BATAK VOWEL SIGN E +1BE8..1BE9 ; Vowel_Dependent # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BEA..1BEC ; Vowel_Dependent # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BED ; Vowel_Dependent # Mn BATAK VOWEL SIGN KARO O +1BEE ; Vowel_Dependent # Mc BATAK VOWEL SIGN U +1BEF ; Vowel_Dependent # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +1C26..1C2B ; Vowel_Dependent # Mc [6] LEPCHA VOWEL SIGN AA..LEPCHA VOWEL SIGN UU +1C2C ; Vowel_Dependent # Mn LEPCHA VOWEL SIGN E +A802 ; Vowel_Dependent # Mn SYLOTI NAGRI SIGN DVISVARA +A823..A824 ; Vowel_Dependent # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A825..A826 ; Vowel_Dependent # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E +A827 ; Vowel_Dependent # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Vowel_Dependent # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A8FF ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN AY +A947..A94E ; Vowel_Dependent # Mn [8] REJANG VOWEL SIGN I..REJANG VOWEL SIGN EA +A9B4..A9B5 ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9B6..A9B9 ; Vowel_Dependent # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BA..A9BB ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +A9BC ; Vowel_Dependent # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Vowel_Dependent # Mn MYANMAR SIGN SHAN SAW +AA29..AA2E ; Vowel_Dependent # Mn [6] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN OE +AA2F..AA30 ; Vowel_Dependent # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA31..AA32 ; Vowel_Dependent # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE +AAB0 ; Vowel_Dependent # Mn TAI VIET MAI KANG +AAB1 ; Vowel_Dependent # Lo TAI VIET VOWEL AA +AAB2..AAB4 ; Vowel_Dependent # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U +AAB5..AAB6 ; Vowel_Dependent # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB7..AAB8 ; Vowel_Dependent # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AAB9..AABD ; 
Vowel_Dependent # Lo [5] TAI VIET VOWEL UEA..TAI VIET VOWEL AN +AABE ; Vowel_Dependent # Mn TAI VIET VOWEL AM +AAEB ; Vowel_Dependent # Mc MEETEI MAYEK VOWEL SIGN II +AAEC..AAED ; Vowel_Dependent # Mn [2] MEETEI MAYEK VOWEL SIGN UU..MEETEI MAYEK VOWEL SIGN AAI +AAEE..AAEF ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN AU..MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE5 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN ANAP +ABE6..ABE7 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE8 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +10A01..10A03 ; Vowel_Dependent # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R +10A05..10A06 ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O +10A0C..10A0D ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN DOUBLE RING BELOW +11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +110B0..110B2 ; Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II +110B3..110B6 ; Vowel_Dependent # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI +110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11127..1112B ; Vowel_Dependent # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU +1112C ; Vowel_Dependent # Mc CHAKMA VOWEL SIGN E +1112D..11132 ; Vowel_Dependent # Mn [6] CHAKMA VOWEL SIGN AI..CHAKMA AU MARK +11145..11146 ; Vowel_Dependent # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +111B3..111B5 ; Vowel_Dependent # Mc [3] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN II +111B6..111BE ; Vowel_Dependent # Mn [9] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN O +111BF ; Vowel_Dependent # Mc SHARADA VOWEL SIGN AU +111CB..111CC ; Vowel_Dependent # Mn [2] SHARADA VOWEL MODIFIER MARK..SHARADA 
EXTRA SHORT VOWEL MARK +111CE ; Vowel_Dependent # Mc SHARADA VOWEL SIGN PRISHTHAMATRA E +1122C..1122E ; Vowel_Dependent # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +1122F..11231 ; Vowel_Dependent # Mn [3] KHOJKI VOWEL SIGN U..KHOJKI VOWEL SIGN AI +11232..11233 ; Vowel_Dependent # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU +112E0..112E2 ; Vowel_Dependent # Mc [3] KHUDAWADI VOWEL SIGN AA..KHUDAWADI VOWEL SIGN II +112E3..112E8 ; Vowel_Dependent # Mn [6] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN AU +1133E..1133F ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11340 ; Vowel_Dependent # Mn GRANTHA VOWEL SIGN II +11341..11344 ; Vowel_Dependent # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +11347..11348 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +1134B..1134C ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +11357 ; Vowel_Dependent # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435..11437 ; Vowel_Dependent # Mc [3] NEWA VOWEL SIGN AA..NEWA VOWEL SIGN II +11438..1143F ; Vowel_Dependent # Mn [8] NEWA VOWEL SIGN U..NEWA VOWEL SIGN AI +11440..11441 ; Vowel_Dependent # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +114B0..114B2 ; Vowel_Dependent # Mc [3] TIRHUTA VOWEL SIGN AA..TIRHUTA VOWEL SIGN II +114B3..114B8 ; Vowel_Dependent # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114B9 ; Vowel_Dependent # Mc TIRHUTA VOWEL SIGN E +114BA ; Vowel_Dependent # Mn TIRHUTA VOWEL SIGN SHORT E +114BB..114BE ; Vowel_Dependent # Mc [4] TIRHUTA VOWEL SIGN AI..TIRHUTA VOWEL SIGN AU +115AF..115B1 ; Vowel_Dependent # Mc [3] SIDDHAM VOWEL SIGN AA..SIDDHAM VOWEL SIGN II +115B2..115B5 ; Vowel_Dependent # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115B8..115BB ; Vowel_Dependent # Mc [4] SIDDHAM VOWEL SIGN E..SIDDHAM VOWEL SIGN AU +115DC..115DD ; Vowel_Dependent # Mn [2] SIDDHAM 
VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11630..11632 ; Vowel_Dependent # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +11633..1163A ; Vowel_Dependent # Mn [8] MODI VOWEL SIGN U..MODI VOWEL SIGN AI +1163B..1163C ; Vowel_Dependent # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +11640 ; Vowel_Dependent # Mn MODI SIGN ARDHACANDRA +116AD ; Vowel_Dependent # Mn TAKRI VOWEL SIGN AA +116AE..116AF ; Vowel_Dependent # Mc [2] TAKRI VOWEL SIGN I..TAKRI VOWEL SIGN II +116B0..116B5 ; Vowel_Dependent # Mn [6] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN AU +11720..11721 ; Vowel_Dependent # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +11722..11725 ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN I..AHOM VOWEL SIGN UU +11726 ; Vowel_Dependent # Mc AHOM VOWEL SIGN E +11727..1172A ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN AW..AHOM VOWEL SIGN AM +1182C..1182E ; Vowel_Dependent # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II +1182F..11836 ; Vowel_Dependent # Mn [8] DOGRA VOWEL SIGN U..DOGRA VOWEL SIGN AU +11930..11935 ; Vowel_Dependent # Mc [6] DIVES AKURU VOWEL SIGN AA..DIVES AKURU VOWEL SIGN E +11937..11938 ; Vowel_Dependent # Mc [2] DIVES AKURU VOWEL SIGN AI..DIVES AKURU VOWEL SIGN O +119D1..119D3 ; Vowel_Dependent # Mc [3] NANDINAGARI VOWEL SIGN AA..NANDINAGARI VOWEL SIGN II +119D4..119D7 ; Vowel_Dependent # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR +119DA..119DB ; Vowel_Dependent # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI +119DC..119DD ; Vowel_Dependent # Mc [2] NANDINAGARI VOWEL SIGN O..NANDINAGARI VOWEL SIGN AU +119E4 ; Vowel_Dependent # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E +11A01..11A0A ; Vowel_Dependent # Mn [10] ZANABAZAR SQUARE VOWEL SIGN I..ZANABAZAR SQUARE VOWEL LENGTH MARK +11A51..11A56 ; Vowel_Dependent # Mn [6] SOYOMBO VOWEL SIGN I..SOYOMBO VOWEL SIGN OE +11A57..11A58 ; Vowel_Dependent # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A59..11A5B ; Vowel_Dependent # Mn [3] SOYOMBO VOWEL SIGN VOCALIC 
R..SOYOMBO VOWEL LENGTH MARK +11C2F ; Vowel_Dependent # Mc BHAIKSUKI VOWEL SIGN AA +11C30..11C36 ; Vowel_Dependent # Mn [7] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN VOCALIC L +11C38..11C3B ; Vowel_Dependent # Mn [4] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI VOWEL SIGN AU +11CB0 ; Vowel_Dependent # Mn MARCHEN VOWEL SIGN AA +11CB1 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN I +11CB2..11CB3 ; Vowel_Dependent # Mn [2] MARCHEN VOWEL SIGN U..MARCHEN VOWEL SIGN E +11CB4 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN O +11D31..11D36 ; Vowel_Dependent # Mn [6] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN VOCALIC R +11D3A ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Vowel_Dependent # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN AU +11D43 ; Vowel_Dependent # Mn MASARAM GONDI SIGN CANDRA +11D8A..11D8E ; Vowel_Dependent # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D90..11D91 ; Vowel_Dependent # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI +11D93..11D94 ; Vowel_Dependent # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11EF3..11EF4 ; Vowel_Dependent # Mn [2] MAKASAR VOWEL SIGN I..MAKASAR VOWEL SIGN U +11EF5..11EF6 ; Vowel_Dependent # Mc [2] MAKASAR VOWEL SIGN E..MAKASAR VOWEL SIGN O + +# ================================================ + +# Indic_Syllabic_Category=Vowel + +# (Other) Vowels (reanalyzed as ordinary alphabetic letters or marks) + +# [Not derivable] + +1963..196D ; Vowel # Lo [11] TAI LE LETTER A..TAI LE LETTER AI +A85E..A861 ; Vowel # Lo [4] PHAGS-PA LETTER I..PHAGS-PA LETTER O +A866 ; Vowel # Lo PHAGS-PA LETTER EE +A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO +A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O +11150..11154 ; Vowel # Lo [5] MAHAJANI LETTER A..MAHAJANI LETTER O + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Placeholder 
+ +# Consonant Placeholder +# This includes generic placeholders used for +# Indic script layout (NBSP and dotted circle), as well as a few script- +# specific vowel-holder characters which are not technically +# consonants, but serve instead as bases for placement of vowel marks. + +# [Not derivable] + +002D ; Consonant_Placeholder # Pd HYPHEN-MINUS +00A0 ; Consonant_Placeholder # Zs NO-BREAK SPACE +00D7 ; Consonant_Placeholder # Sm MULTIPLICATION SIGN +0980 ; Consonant_Placeholder # Lo BENGALI ANJI +0A72..0A73 ; Consonant_Placeholder # Lo [2] GURMUKHI IRI..GURMUKHI URA +104B ; Consonant_Placeholder # Po MYANMAR SIGN SECTION +104E ; Consonant_Placeholder # Po MYANMAR SYMBOL AFOREMENTIONED +1900 ; Consonant_Placeholder # Lo LIMBU VOWEL-CARRIER LETTER +1CFA ; Consonant_Placeholder # Lo VEDIC SIGN DOUBLE ANUSVARA ANTARGOMUKHA +2010..2014 ; Consonant_Placeholder # Pd [5] HYPHEN..EM DASH +25CC ; Consonant_Placeholder # So DOTTED CIRCLE +AA74..AA76 ; Consonant_Placeholder # Lo [3] MYANMAR LOGOGRAM KHAMTI OAY..MYANMAR LOGOGRAM KHAMTI HM +11A3F ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL HEAD MARK +11A45 ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL DOUBLE-LINED HEAD MARK +11EF2 ; Consonant_Placeholder # Lo MAKASAR ANGKA + +# ================================================ + +# Indic_Syllabic_Category=Consonant + +# Consonant (ordinary abugida consonants, with inherent vowels) + +# [Not derivable] + +0915..0939 ; Consonant # Lo [37] DEVANAGARI LETTER KA..DEVANAGARI LETTER HA +0958..095F ; Consonant # Lo [8] DEVANAGARI LETTER QA..DEVANAGARI LETTER YYA +0978..097F ; Consonant # Lo [8] DEVANAGARI LETTER MARWARI DDA..DEVANAGARI LETTER BBA +0995..09A8 ; Consonant # Lo [20] BENGALI LETTER KA..BENGALI LETTER NA +09AA..09B0 ; Consonant # Lo [7] BENGALI LETTER PA..BENGALI LETTER RA +09B2 ; Consonant # Lo BENGALI LETTER LA +09B6..09B9 ; Consonant # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA +09DC..09DD ; Consonant # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA 
+09DF ; Consonant # Lo BENGALI LETTER YYA +09F0..09F1 ; Consonant # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH LOWER DIAGONAL +0A15..0A28 ; Consonant # Lo [20] GURMUKHI LETTER KA..GURMUKHI LETTER NA +0A2A..0A30 ; Consonant # Lo [7] GURMUKHI LETTER PA..GURMUKHI LETTER RA +0A32..0A33 ; Consonant # Lo [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA +0A35..0A36 ; Consonant # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA +0A38..0A39 ; Consonant # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA +0A59..0A5C ; Consonant # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA +0A5E ; Consonant # Lo GURMUKHI LETTER FA +0A95..0AA8 ; Consonant # Lo [20] GUJARATI LETTER KA..GUJARATI LETTER NA +0AAA..0AB0 ; Consonant # Lo [7] GUJARATI LETTER PA..GUJARATI LETTER RA +0AB2..0AB3 ; Consonant # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA +0AB5..0AB9 ; Consonant # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA +0AF9 ; Consonant # Lo GUJARATI LETTER ZHA +0B15..0B28 ; Consonant # Lo [20] ORIYA LETTER KA..ORIYA LETTER NA +0B2A..0B30 ; Consonant # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA +0B32..0B33 ; Consonant # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA +0B35..0B39 ; Consonant # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA +0B5C..0B5D ; Consonant # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA +0B5F ; Consonant # Lo ORIYA LETTER YYA +0B71 ; Consonant # Lo ORIYA LETTER WA +0B95 ; Consonant # Lo TAMIL LETTER KA +0B99..0B9A ; Consonant # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA +0B9C ; Consonant # Lo TAMIL LETTER JA +0B9E..0B9F ; Consonant # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA +0BA3..0BA4 ; Consonant # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA +0BA8..0BAA ; Consonant # Lo [3] TAMIL LETTER NA..TAMIL LETTER PA +0BAE..0BB9 ; Consonant # Lo [12] TAMIL LETTER MA..TAMIL LETTER HA +0C15..0C28 ; Consonant # Lo [20] TELUGU LETTER KA..TELUGU LETTER NA +0C2A..0C39 ; Consonant # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C58..0C5A ; Consonant # Lo [3] TELUGU LETTER TSA..TELUGU LETTER 
RRRA +0C95..0CA8 ; Consonant # Lo [20] KANNADA LETTER KA..KANNADA LETTER NA +0CAA..0CB3 ; Consonant # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA +0CB5..0CB9 ; Consonant # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA +0CDE ; Consonant # Lo KANNADA LETTER FA +0D15..0D3A ; Consonant # Lo [38] MALAYALAM LETTER KA..MALAYALAM LETTER TTTA +0D9A..0DB1 ; Consonant # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA +0DB3..0DBB ; Consonant # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA +0DBD ; Consonant # Lo SINHALA LETTER DANTAJA LAYANNA +0DC0..0DC6 ; Consonant # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA +0E01..0E2E ; Consonant # Lo [46] THAI CHARACTER KO KAI..THAI CHARACTER HO NOKHUK +0E81..0E82 ; Consonant # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG +0E84 ; Consonant # Lo LAO LETTER KHO TAM +0E86..0E8A ; Consonant # Lo [5] LAO LETTER PALI GHA..LAO LETTER SO TAM +0E8C..0EA3 ; Consonant # Lo [24] LAO LETTER PALI JHA..LAO LETTER LO LING +0EA5 ; Consonant # Lo LAO LETTER LO LOOT +0EA7..0EAE ; Consonant # Lo [8] LAO LETTER WO..LAO LETTER HO TAM +0EDC..0EDF ; Consonant # Lo [4] LAO HO NO..LAO LETTER KHMU NYO +0F40..0F47 ; Consonant # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA +0F49..0F6C ; Consonant # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA +1000..1020 ; Consonant # Lo [33] MYANMAR LETTER KA..MYANMAR LETTER LLA +103F ; Consonant # Lo MYANMAR LETTER GREAT SA +1050..1051 ; Consonant # Lo [2] MYANMAR LETTER SHA..MYANMAR LETTER SSA +105A..105D ; Consonant # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE +1061 ; Consonant # Lo MYANMAR LETTER SGAW KAREN SHA +1065..1066 ; Consonant # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER WESTERN PWO KAREN PWA +106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA +1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA +108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA +1703..170C 
; Consonant # Lo [10] TAGALOG LETTER KA..TAGALOG LETTER YA +170E..1711 ; Consonant # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1723..1731 ; Consonant # Lo [15] HANUNOO LETTER KA..HANUNOO LETTER HA +1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA +1763..176C ; Consonant # Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA +176E..1770 ; Consonant # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA +1780..17A2 ; Consonant # Lo [35] KHMER LETTER KA..KHMER LETTER QA +1901..191E ; Consonant # Lo [30] LIMBU LETTER KA..LIMBU LETTER TRA +1950..1962 ; Consonant # Lo [19] TAI LE LETTER KA..TAI LE LETTER NA +1980..19AB ; Consonant # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI LUE LETTER LOW SUA +1A00..1A16 ; Consonant # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA +1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA +1A53..1A54 ; Consonant # Lo [2] TAI THAM LETTER LAE..TAI THAM LETTER GREAT SA +1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA +1B45..1B4B ; Consonant # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA +1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA +1BBB..1BBD ; Consonant # Lo [3] SUNDANESE LETTER REU..SUNDANESE LETTER BHA +1BC0..1BE3 ; Consonant # Lo [36] BATAK LETTER A..BATAK LETTER MBA +1C00..1C23 ; Consonant # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A +1C4D..1C4F ; Consonant # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA +A807..A80A ; Consonant # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO +A80C..A822 ; Consonant # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO +A840..A85D ; Consonant # Lo [30] PHAGS-PA LETTER KA..PHAGS-PA LETTER A +A862..A865 ; Consonant # Lo [4] PHAGS-PA LETTER QA..PHAGS-PA LETTER GGA +A869..A870 ; Consonant # Lo [8] PHAGS-PA LETTER TTA..PHAGS-PA LETTER ASPIRATED FA +A872 ; Consonant # Lo PHAGS-PA SUPERFIXED LETTER RA +A892..A8B3 ; Consonant 
# Lo [34] SAURASHTRA LETTER KA..SAURASHTRA LETTER LLA +A90A..A921 ; Consonant # Lo [24] KAYAH LI LETTER KA..KAYAH LI LETTER CA +A930..A946 ; Consonant # Lo [23] REJANG LETTER KA..REJANG LETTER A +A989..A98B ; Consonant # Lo [3] JAVANESE LETTER PA CEREK..JAVANESE LETTER NGA LELET RASWADI +A98F..A9B2 ; Consonant # Lo [36] JAVANESE LETTER KA..JAVANESE LETTER HA +A9E0..A9E4 ; Consonant # Lo [5] MYANMAR LETTER SHAN GHA..MYANMAR LETTER SHAN BHA +A9E7..A9EF ; Consonant # Lo [9] MYANMAR LETTER TAI LAING NYA..MYANMAR LETTER TAI LAING NNA +A9FA..A9FE ; Consonant # Lo [5] MYANMAR LETTER TAI LAING LLA..MYANMAR LETTER TAI LAING BHA +AA06..AA28 ; Consonant # Lo [35] CHAM LETTER KA..CHAM LETTER HA +AA60..AA6F ; Consonant # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA +AA71..AA73 ; Consonant # Lo [3] MYANMAR LETTER KHAMTI XA..MYANMAR LETTER KHAMTI RA +AA7A ; Consonant # Lo MYANMAR LETTER AITON RA +AA7E..AA7F ; Consonant # Lo [2] MYANMAR LETTER SHWE PALAUNG CHA..MYANMAR LETTER SHWE PALAUNG SHA +AA80..AAAF ; Consonant # Lo [48] TAI VIET LETTER LOW KO..TAI VIET LETTER HIGH O +AAE2..AAEA ; Consonant # Lo [9] MEETEI MAYEK LETTER CHA..MEETEI MAYEK LETTER SSA +ABC0..ABCD ; Consonant # Lo [14] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER HUK +ABD0 ; Consonant # Lo MEETEI MAYEK LETTER PHAM +ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTER BHAM +10A00 ; Consonant # Lo KHAROSHTHI LETTER A +10A10..10A13 ; Consonant # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA +10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA +10A19..10A35 ; Consonant # Lo [29] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER VHA +11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER OLD TAMIL NNNA +1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA +11107..11126 ; Consonant # Lo [32] CHAKMA LETTER KAA..CHAKMA LETTER HAA +11144 ; Consonant # Lo CHAKMA LETTER LHAA +11147 ; Consonant # Lo CHAKMA LETTER VAA +11155..11172 ; 
Consonant # Lo [30] MAHAJANI LETTER KA..MAHAJANI LETTER RRA +11191..111B2 ; Consonant # Lo [34] SHARADA LETTER KA..SHARADA LETTER HA +11208..11211 ; Consonant # Lo [10] KHOJKI LETTER KA..KHOJKI LETTER JJA +11213..1122B ; Consonant # Lo [25] KHOJKI LETTER NYA..KHOJKI LETTER LLA +11284..11286 ; Consonant # Lo [3] MULTANI LETTER KA..MULTANI LETTER GA +11288 ; Consonant # Lo MULTANI LETTER GHA +1128A..1128D ; Consonant # Lo [4] MULTANI LETTER CA..MULTANI LETTER JJA +1128F..1129D ; Consonant # Lo [15] MULTANI LETTER NYA..MULTANI LETTER BA +1129F..112A8 ; Consonant # Lo [10] MULTANI LETTER BHA..MULTANI LETTER RHA +112BA..112DE ; Consonant # Lo [37] KHUDAWADI LETTER KA..KHUDAWADI LETTER HA +11315..11328 ; Consonant # Lo [20] GRANTHA LETTER KA..GRANTHA LETTER NA +1132A..11330 ; Consonant # Lo [7] GRANTHA LETTER PA..GRANTHA LETTER RA +11332..11333 ; Consonant # Lo [2] GRANTHA LETTER LA..GRANTHA LETTER LLA +11335..11339 ; Consonant # Lo [5] GRANTHA LETTER VA..GRANTHA LETTER HA +1140E..11434 ; Consonant # Lo [39] NEWA LETTER KA..NEWA LETTER HA +1148F..114AF ; Consonant # Lo [33] TIRHUTA LETTER KA..TIRHUTA LETTER HA +1158E..115AE ; Consonant # Lo [33] SIDDHAM LETTER KA..SIDDHAM LETTER HA +1160E..1162F ; Consonant # Lo [34] MODI LETTER KA..MODI LETTER LLA +1168A..116AA ; Consonant # Lo [33] TAKRI LETTER KA..TAKRI LETTER RRA +116B8 ; Consonant # Lo TAKRI LETTER ARCHAIC KHA +11700..1171A ; Consonant # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA +1180A..1182B ; Consonant # Lo [34] DOGRA LETTER KA..DOGRA LETTER RRA +1190C..11913 ; Consonant # Lo [8] DIVES AKURU LETTER KA..DIVES AKURU LETTER JA +11915..11916 ; Consonant # Lo [2] DIVES AKURU LETTER NYA..DIVES AKURU LETTER TTA +11918..1192F ; Consonant # Lo [24] DIVES AKURU LETTER DDA..DIVES AKURU LETTER ZA +119AE..119D0 ; Consonant # Lo [35] NANDINAGARI LETTER KA..NANDINAGARI LETTER RRA +11A0B..11A32 ; Consonant # Lo [40] ZANABAZAR SQUARE LETTER KA..ZANABAZAR SQUARE LETTER KSSA +11A5C..11A83 ; Consonant # Lo [40] SOYOMBO LETTER 
KA..SOYOMBO LETTER KSSA +11C0E..11C2E ; Consonant # Lo [33] BHAIKSUKI LETTER KA..BHAIKSUKI LETTER HA +11C72..11C8F ; Consonant # Lo [30] MARCHEN LETTER KA..MARCHEN LETTER A +11D0C..11D30 ; Consonant # Lo [37] MASARAM GONDI LETTER KA..MASARAM GONDI LETTER TRA +11D6C..11D89 ; Consonant # Lo [30] GUNJALA GONDI LETTER YA..GUNJALA GONDI LETTER SA +11EE0..11EF1 ; Consonant # Lo [18] MAKASAR LETTER KA..MAKASAR LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Dead + +# Dead Consonant (special consonant with killed vowel) + +# [Not derivable] + +09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0D54..0D56 ; Consonant_Dead # Lo [3] MALAYALAM LETTER CHILLU M..MALAYALAM LETTER CHILLU LLL +0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K +1CF2..1CF3 ; Consonant_Dead # Lo [2] VEDIC SIGN ARDHAVISARGA..VEDIC SIGN ROTATED ARDHAVISARGA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_With_Stacker + +# Consonants that may make stacked ligatures with the next consonant +# without the use of a virama + +# [Not derivable] + +0CF1..0CF2 ; Consonant_With_Stacker # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA +1CF5..1CF6 ; Consonant_With_Stacker # Lo [2] VEDIC SIGN JIHVAMULIYA..VEDIC SIGN UPADHMANIYA +11003..11004 ; Consonant_With_Stacker # Lo [2] BRAHMI SIGN JIHVAMULIYA..BRAHMI SIGN UPADHMANIYA +11460..11461 ; Consonant_With_Stacker # Lo [2] NEWA SIGN JIHVAMULIYA..NEWA SIGN UPADHMANIYA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Prefixed + +# Cluster-initial consonants + +# [Not derivable] + +111C2..111C3 ; Consonant_Prefixed # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA +1193F ; Consonant_Prefixed # Lo DIVES AKURU PREFIXED NASAL SIGN +11A3A ; Consonant_Prefixed # Lo ZANABAZAR SQUARE CLUSTER-INITIAL LETTER RA +11A84..11A89 ; Consonant_Prefixed # Lo [6] SOYOMBO SIGN 
JIHVAMULIYA..SOYOMBO CLUSTER-INITIAL LETTER SA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Preceding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when preceding the main +# consonant. + +# [Not derivable] + +0D4E ; Consonant_Preceding_Repha # Lo MALAYALAM LETTER DOT REPH +11941 ; Consonant_Preceding_Repha # Lo DIVES AKURU INITIAL RA +11D46 ; Consonant_Preceding_Repha # Lo MASARAM GONDI REPHA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Initial_Postfixed + +# Consonants that succeed the main consonant in character sequences, but are +# pronounced before it. + +# [Not derivable] + +1A5A ; Consonant_Initial_Postfixed # Mn TAI THAM CONSONANT SIGN LOW PA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Succeeding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when succeeding the main +# consonant. + +# [Not derivable] + +17CC ; Consonant_Succeeding_Repha # Mn KHMER SIGN ROBAT +1B03 ; Consonant_Succeeding_Repha # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Succeeding_Repha # Mn SUNDANESE SIGN PANGLAYAR +A982 ; Consonant_Succeeding_Repha # Mn JAVANESE SIGN LAYAR + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Subjoined + +# Subjoined Consonant (C2 form subtending a base consonant in Tibetan, etc.) 
+ +# [Not derivable] + +0F8D..0F97 ; Consonant_Subjoined # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Consonant_Subjoined # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +1929..192B ; Consonant_Subjoined # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1A57 ; Consonant_Subjoined # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A5B..1A5E ; Consonant_Subjoined # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1BA1 ; Consonant_Subjoined # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA2..1BA3 ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BAC..1BAD ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C24..1C25 ; Consonant_Subjoined # Mc [2] LEPCHA SUBJOINED LETTER YA..LEPCHA SUBJOINED LETTER RA +A867..A868 ; Consonant_Subjoined # Lo [2] PHAGS-PA SUBJOINED LETTER WA..PHAGS-PA SUBJOINED LETTER YA +A871 ; Consonant_Subjoined # Lo PHAGS-PA SUBJOINED LETTER RA +11C92..11CA7 ; Consonant_Subjoined # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CA9 ; Consonant_Subjoined # Mc MARCHEN SUBJOINED LETTER YA +11CAA..11CAF ; Consonant_Subjoined # Mn [6] MARCHEN SUBJOINED LETTER RA..MARCHEN SUBJOINED LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Medial + +# Medial Consonant (medial liquid, occurring in clusters) + +# [Not derivable] + +0A75 ; Consonant_Medial # Mn GURMUKHI SIGN YAKASH +0EBC ; Consonant_Medial # Mn LAO SEMIVOWEL SIGN LO +0EBD ; Consonant_Medial # Lo LAO SEMIVOWEL SIGN NYO +103B..103C ; Consonant_Medial # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA +103D..103E ; Consonant_Medial # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +105E..1060 ; Consonant_Medial # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT 
SIGN MON MEDIAL LA +1082 ; Consonant_Medial # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +1A55 ; Consonant_Medial # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A56 ; Consonant_Medial # Mn TAI THAM CONSONANT SIGN MEDIAL LA +A8B4 ; Consonant_Medial # Mc SAURASHTRA CONSONANT SIGN HAARU +A9BD ; Consonant_Medial # Mn JAVANESE CONSONANT SIGN KERET +A9BE..A9BF ; Consonant_Medial # Mc [2] JAVANESE CONSONANT SIGN PENGKAL..JAVANESE CONSONANT SIGN CAKRA +AA33..AA34 ; Consonant_Medial # Mc [2] CHAM CONSONANT SIGN YA..CHAM CONSONANT SIGN RA +AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +1171D..1171F ; Consonant_Medial # Mn [3] AHOM CONSONANT SIGN MEDIAL LA..AHOM CONSONANT SIGN MEDIAL LIGATING RA +11940 ; Consonant_Medial # Mc DIVES AKURU MEDIAL YA +11942 ; Consonant_Medial # Mc DIVES AKURU MEDIAL RA +11A3B..11A3E ; Consonant_Medial # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11D47 ; Consonant_Medial # Mn MASARAM GONDI RA-KARA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Final + +# Final Consonant (special final forms which do not take vowels) + +# [Not derivable] + +1930..1931 ; Consonant_Final # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Consonant_Final # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +1939 ; Consonant_Final # Mn LIMBU SIGN MUKPHRENG +19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B +1A58..1A59 ; Consonant_Final # Mn [2] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN FINAL NGA +1BBE..1BBF ; Consonant_Final # Lo [2] SUNDANESE LETTER FINAL K..SUNDANESE LETTER FINAL M +1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H +1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +A94F..A951 ; Consonant_Final # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A952 ; Consonant_Final # Mc 
REJANG CONSONANT SIGN H +AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG +AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG +AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS +AA4C ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL M +AA4D ; Consonant_Final # Mc CHAM CONSONANT SIGN FINAL H +ABDB..ABE2 ; Consonant_Final # Lo [8] MEETEI MAYEK LETTER KOK LONSUM..MEETEI MAYEK LETTER I LONSUM +11A8A..11A95 ; Consonant_Final # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Head_Letter + +# Head Letter (Tibetan) + +# [Not derivable] + +0F88..0F8C ; Consonant_Head_Letter # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN + +# ================================================ + +# Indic_Syllabic_Category=Modifying_Letter + +# Reanalyzed letters not participating in the abugida structure, but +# serving to modify the sound of an adjacent vowel or consonant. +# Note that this is not the same as General_Category=Modifier_Letter. 
+ +# [Not derivable] + +0B83 ; Modifying_Letter # Lo TAMIL SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Tone_Letter + +# Tone Letter (spacing lexical tone mark with status as a letter) + +# [Not derivable] + +1970..1974 ; Tone_Letter # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6 +AAC0 ; Tone_Letter # Lo TAI VIET TONE MAI NUENG +AAC2 ; Tone_Letter # Lo TAI VIET TONE MAI SONG + +# ================================================ + +# Indic_Syllabic_Category=Tone_Mark + +# Tone Mark (nonspacing or spacing lexical tone mark) + +# [Not derivable] + +0E48..0E4B ; Tone_Mark # Mn [4] THAI CHARACTER MAI EK..THAI CHARACTER MAI CHATTAWA +0EC8..0ECB ; Tone_Mark # Mn [4] LAO TONE MAI EK..LAO TONE MAI CATAWA +1037 ; Tone_Mark # Mn MYANMAR SIGN DOT BELOW +1063..1064 ; Tone_Mark # Mc [2] MYANMAR TONE MARK SGAW KAREN HATHI..MYANMAR TONE MARK SGAW KAREN KE PHO +1069..106D ; Tone_Mark # Mc [5] MYANMAR SIGN WESTERN PWO KAREN TONE-1..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1087..108C ; Tone_Mark # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108D ; Tone_Mark # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +108F ; Tone_Mark # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109B ; Tone_Mark # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 +19C8..19C9 ; Tone_Mark # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A75..1A79 ; Tone_Mark # Mn [5] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN TONE-5 +A92B..A92D ; Tone_Mark # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +AA7B ; Tone_Mark # Mc MYANMAR SIGN PAO KAREN TONE +AA7C ; Tone_Mark # Mn MYANMAR SIGN TAI LAING TONE-2 +AA7D ; Tone_Mark # Mc MYANMAR SIGN TAI LAING TONE-5 +AABF ; Tone_Mark # Mn TAI VIET TONE MAI EK +AAC1 ; Tone_Mark # Mn TAI VIET TONE MAI THO +ABEC ; Tone_Mark # Mc MEETEI MAYEK LUM IYEK + +# ================================================ + +# Indic_Syllabic_Category=Gemination_Mark + +# Gemination Mark (doubling of the 
preceding or following consonant) + +# [Not derivable] + +0A71 ; Gemination_Mark # Mn GURMUKHI ADDAK +11237 ; Gemination_Mark # Mn KHOJKI SIGN SHADDA +11A98 ; Gemination_Mark # Mn SOYOMBO GEMINATION MARK + +# ================================================ + +# Indic_Syllabic_Category=Cantillation_Mark + +# Cantillation Mark (recitation marks, such as svara markers for the Samaveda) + +# [Not derivable] + +0951..0952 ; Cantillation_Mark # Mn [2] DEVANAGARI STRESS SIGN UDATTA..DEVANAGARI STRESS SIGN ANUDATTA +0A51 ; Cantillation_Mark # Mn GURMUKHI SIGN UDAAT +0AFA..0AFC ; Cantillation_Mark # Mn [3] GUJARATI SIGN SUKUN..GUJARATI SIGN MADDAH +1CD0..1CD2 ; Cantillation_Mark # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CD4..1CE0 ; Cantillation_Mark # Mn [13] VEDIC SIGN YAJURVEDIC MIDLINE SVARITA..VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CE1 ; Cantillation_Mark # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF4 ; Cantillation_Mark # Mn VEDIC TONE CANDRA ABOVE +1CF7 ; Cantillation_Mark # Mc VEDIC SIGN ATIKRAMA +1CF8..1CF9 ; Cantillation_Mark # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE +20F0 ; Cantillation_Mark # Mn COMBINING ASTERISK ABOVE +A8E0..A8F1 ; Cantillation_Mark # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +1123E ; Cantillation_Mark # Mn KHOJKI SIGN SUKUN +11366..1136C ; Cantillation_Mark # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Cantillation_Mark # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA + +# ================================================ + +# Indic_Syllabic_Category=Register_Shifter + +# Register Shifter (shifts register for consonants, akin to a tone mark) + +# [Not derivable] + +17C9..17CA ; Register_Shifter # Mn [2] KHMER SIGN MUUSIKATOAN..KHMER SIGN TRIISAP + +# ================================================ + +# Indic_Syllabic_Category=Syllable_Modifier + +# Syllable Modifier (miscellaneous combining characters that 
modify +# something in the orthographic syllable they succeed) + +# [Not derivable] + +00B2..00B3 ; Syllable_Modifier # No [2] SUPERSCRIPT TWO..SUPERSCRIPT THREE +09FE ; Syllable_Modifier # Mn BENGALI SANDHI MARK +0F35 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0FC6 ; Syllable_Modifier # Mn TIBETAN SYMBOL PADMA GDAN +17CB ; Syllable_Modifier # Mn KHMER SIGN BANTOC +17CE..17D0 ; Syllable_Modifier # Mn [3] KHMER SIGN KAKABAT..KHMER SIGN SAMYOK SANNYA +17D3 ; Syllable_Modifier # Mn KHMER SIGN BATHAMASAT +17DD ; Syllable_Modifier # Mn KHMER SIGN ATTHACAN +193B ; Syllable_Modifier # Mn LIMBU SIGN SA-I +1A7B..1A7C ; Syllable_Modifier # Mn [2] TAI THAM SIGN MAI SAM..TAI THAM SIGN KHUEN-LUE KARAN +1A7F ; Syllable_Modifier # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1C36 ; Syllable_Modifier # Mn LEPCHA SIGN RAN +1DFB ; Syllable_Modifier # Mn COMBINING DELETION MARK +2074 ; Syllable_Modifier # No SUPERSCRIPT FOUR +2082..2084 ; Syllable_Modifier # No [3] SUBSCRIPT TWO..SUBSCRIPT FOUR +111C9 ; Syllable_Modifier # Mn SHARADA SANDHI MARK +1145E ; Syllable_Modifier # Mn NEWA SANDHI MARK +11A33 ; Syllable_Modifier # Mn ZANABAZAR SQUARE FINAL CONSONANT MARK + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Killer + +# Consonant Killer (signifies that the previous consonant or consonants are +# not pronounced) + +# [Not derivable] + +0E4C ; Consonant_Killer # Mn THAI CHARACTER THANTHAKHAT +17CD ; Consonant_Killer # Mn KHMER SIGN TOANDAKHIAT + +# ================================================ + +# Indic_Syllabic_Category=Non_Joiner + +# Non_Joiner (Zero Width Non-Joiner) + +# [Not derivable] + +200C ; Non_Joiner # Cf ZERO WIDTH NON-JOINER + +# ================================================ + +# Indic_Syllabic_Category=Joiner + +# Joiner (Zero Width Joiner) + +# [Not derivable] + +200D ; Joiner # Cf ZERO WIDTH JOINER + +# 
================================================ + +# Indic_Syllabic_Category=Number_Joiner + +# Number_Joiner (forms ligatures between numbers for multiplication) + +# [Not derivable] + +1107F ; Number_Joiner # Mn BRAHMI NUMBER JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number + +# Number (can be used as vowel-holders like consonant placeholders) +# Note: A number may even hold subjoined consonants which may in turn +# have been formed using a virama or a stacker, e.g. the sequence +# where THAI THAM LETTER LOW TA is subjoined to +# TAI THAM THAM DIGIT THREE using an invisible stacker. + +# [Not derivable] + +0030..0039 ; Number # Nd [10] DIGIT ZERO..DIGIT NINE +0966..096F ; Number # Nd [10] DEVANAGARI DIGIT ZERO..DEVANAGARI DIGIT NINE +09E6..09EF ; Number # Nd [10] BENGALI DIGIT ZERO..BENGALI DIGIT NINE +0A66..0A6F ; Number # Nd [10] GURMUKHI DIGIT ZERO..GURMUKHI DIGIT NINE +0AE6..0AEF ; Number # Nd [10] GUJARATI DIGIT ZERO..GUJARATI DIGIT NINE +0B66..0B6F ; Number # Nd [10] ORIYA DIGIT ZERO..ORIYA DIGIT NINE +0BE6..0BEF ; Number # Nd [10] TAMIL DIGIT ZERO..TAMIL DIGIT NINE +0C66..0C6F ; Number # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE +0CE6..0CEF ; Number # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE +0D66..0D6F ; Number # Nd [10] MALAYALAM DIGIT ZERO..MALAYALAM DIGIT NINE +0DE6..0DEF ; Number # Nd [10] SINHALA LITH DIGIT ZERO..SINHALA LITH DIGIT NINE +0E50..0E59 ; Number # Nd [10] THAI DIGIT ZERO..THAI DIGIT NINE +0ED0..0ED9 ; Number # Nd [10] LAO DIGIT ZERO..LAO DIGIT NINE +0F20..0F29 ; Number # Nd [10] TIBETAN DIGIT ZERO..TIBETAN DIGIT NINE +0F2A..0F33 ; Number # No [10] TIBETAN DIGIT HALF ONE..TIBETAN DIGIT HALF ZERO +1040..1049 ; Number # Nd [10] MYANMAR DIGIT ZERO..MYANMAR DIGIT NINE +1090..1099 ; Number # Nd [10] MYANMAR SHAN DIGIT ZERO..MYANMAR SHAN DIGIT NINE +17E0..17E9 ; Number # Nd [10] KHMER DIGIT ZERO..KHMER DIGIT NINE +1946..194F ; Number # Nd [10] LIMBU DIGIT ZERO..LIMBU DIGIT NINE 
+19D0..19D9 ; Number # Nd [10] NEW TAI LUE DIGIT ZERO..NEW TAI LUE DIGIT NINE +19DA ; Number # No NEW TAI LUE THAM DIGIT ONE +1A80..1A89 ; Number # Nd [10] TAI THAM HORA DIGIT ZERO..TAI THAM HORA DIGIT NINE +1A90..1A99 ; Number # Nd [10] TAI THAM THAM DIGIT ZERO..TAI THAM THAM DIGIT NINE +1B50..1B59 ; Number # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE +1BB0..1BB9 ; Number # Nd [10] SUNDANESE DIGIT ZERO..SUNDANESE DIGIT NINE +1C40..1C49 ; Number # Nd [10] LEPCHA DIGIT ZERO..LEPCHA DIGIT NINE +A8D0..A8D9 ; Number # Nd [10] SAURASHTRA DIGIT ZERO..SAURASHTRA DIGIT NINE +A900..A909 ; Number # Nd [10] KAYAH LI DIGIT ZERO..KAYAH LI DIGIT NINE +A9D0..A9D9 ; Number # Nd [10] JAVANESE DIGIT ZERO..JAVANESE DIGIT NINE +A9F0..A9F9 ; Number # Nd [10] MYANMAR TAI LAING DIGIT ZERO..MYANMAR TAI LAING DIGIT NINE +AA50..AA59 ; Number # Nd [10] CHAM DIGIT ZERO..CHAM DIGIT NINE +ABF0..ABF9 ; Number # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE +10A40..10A48 ; Number # No [9] KHAROSHTHI DIGIT ONE..KHAROSHTHI FRACTION ONE HALF +11066..1106F ; Number # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11136..1113F ; Number # Nd [10] CHAKMA DIGIT ZERO..CHAKMA DIGIT NINE +111D0..111D9 ; Number # Nd [10] SHARADA DIGIT ZERO..SHARADA DIGIT NINE +111E1..111F4 ; Number # No [20] SINHALA ARCHAIC DIGIT ONE..SINHALA ARCHAIC NUMBER ONE THOUSAND +112F0..112F9 ; Number # Nd [10] KHUDAWADI DIGIT ZERO..KHUDAWADI DIGIT NINE +11450..11459 ; Number # Nd [10] NEWA DIGIT ZERO..NEWA DIGIT NINE +114D0..114D9 ; Number # Nd [10] TIRHUTA DIGIT ZERO..TIRHUTA DIGIT NINE +11650..11659 ; Number # Nd [10] MODI DIGIT ZERO..MODI DIGIT NINE +116C0..116C9 ; Number # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE +11730..11739 ; Number # Nd [10] AHOM DIGIT ZERO..AHOM DIGIT NINE +1173A..1173B ; Number # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY +11950..11959 ; Number # Nd [10] DIVES AKURU DIGIT ZERO..DIVES AKURU DIGIT NINE +11C50..11C59 ; Number # Nd [10] BHAIKSUKI DIGIT ZERO..BHAIKSUKI DIGIT NINE +11C5A..11C6C 
; Number # No [19] BHAIKSUKI NUMBER ONE..BHAIKSUKI HUNDREDS UNIT MARK +11D50..11D59 ; Number # Nd [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE +11DA0..11DA9 ; Number # Nd [10] GUNJALA GONDI DIGIT ZERO..GUNJALA GONDI DIGIT NINE + +# ================================================ + +# Indic_Syllabic_Category=Brahmi_Joining_Number + +# Brahmi Joining Number (similar to Number in that in can be used as +# vowel-holders like Consonant_Placeholder, but may also be joined by +# a Number_Joiner of the same script, e.g. in Brahmi) + +# [Not derivable] + +11052..11065 ; Brahmi_Joining_Number # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND + +# EOF diff --git a/data/14.0.0-indic-positional-category.txt b/data/14.0.0-indic-positional-category.txt new file mode 100644 index 0000000..69109ac --- /dev/null +++ b/data/14.0.0-indic-positional-category.txt @@ -0,0 +1,796 @@ +# IndicPositionalCategory-14.0.0.txt +# Date: 2021-05-22, 01:01:00 GMT [KW, RP] +# © 2021 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Positional_Category enumerated property +# +# Scope: This property is aimed at the problem of +# the specification of syllabic structure for Indic scripts. +# Because dependent vowels (matras), visible viramas, and other +# characters are placed in notional slots around the consonant (or +# consonant cluster) core of an Indic syllable, there may be +# cooccurrence constraints or other interactions. Also, it may be +# desirable, in cases where more than one such character may occur in +# sequence, as for example, in a top slot and a bottom slot, to +# specify preferred orders for spelling. 
As such, this property +# is designed primarily to supplement the Indic_Syllabic_Category +# property. +# +# In addition to combining marks associated with Indic scripts, the +# Indic_Positional_Category has non-trivial values for special signs +# associated with Indic_Syllabic_Category=Consonant_Prefixed +# or Indic_Syllabic_Category=Consonant_Preceding_Repha. Those signs +# have General_Category=Lo, rather than being combining marks. +# They occur in initial position in syllabic structure. However, when +# rendered, they appear as marks positioned with respect to another +# base letter (usually above it). Hence, having an explicit value for +# Indic_Positional_Category for those signs can be helpful. +# +# Note that this property is *not* intended as +# a prescriptive property regarding display or font design, +# for a number of reasons. Good font design requires information +# that is outside the context of a character encoding standard, +# and is best handled in other venues. For Indic dependent +# vowels and similar characters, in particular: +# +# 1. Matra placement may vary somewhat based on typeface design. +# 2. Matra placement, even within a single script, may vary +# somewhat according to historic period or local conventions. +# 3. Matra placement may be changed by explicit orthographic reform +# decisions. +# 4. Matras may ligate in various ways with a consonant (or even +# other elements of a syllable) instead of occurring in a +# discrete location. +# 5. Matra display may be contextually determined. This is +# notable, for example, in the Tamil script, where the shape +# and placement of -u and -uu vowels depends strongly on +# which consonant they adjoin. 
+# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Positional_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. +# +# The scripts assessed as containing dependent vowels or similar characters +# in the structural sense used for the Indic_Positional_Category are the +# following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dives Akuru, Dogra, Grantha, Gujarati, +# Gunjala Gondi, Gurmukhi, Hanunoo, Javanese, Kaithi, Kannada, +# Kharoshthi, Khmer, Khojki, Khudawadi, Lao, Lepcha, Limbu, Makasar, +# Malayalam, Marchen, Masaram Gondi, Meetei Mayek, Modi, Myanmar, +# Nandinagari, Newa, New Tai Lue, Oriya, Rejang, Saurashtra, Sharada, +# Siddham, Sinhala, Soyombo, Sundanese, Syloti Nagri, Tagalog, +# Tagbanwa, Tai Tham, Tai Viet, Takri, Tamil, Telugu, Thai, Tibetan, +# Tirhuta, and Zanabazar Square. +# +# All characters for all other scripts not in that list +# take the default value for this property. +# +# See IndicSyllabicCategory.txt for a slightly more extended +# list of Indic scripts, including those which do not have +# positional characters. Currently, those additional +# Indic scripts without positional characters are +# Multani, Phags-pa, and Tai Le. +# +# Notes: +# +# 1. The following characters are all assigned the positional category Right, +# but may have different positions in some cases: +# * U+0BC1 TAMIL VOWEL SIGN U and U+0BC2 TAMIL VOWEL SIGN UU have +# contextually variable placement in Tamil. +# * U+0D41 MALAYALAM VOWEL SIGN U and U+0D42 MALAYALAM VOWEL SIGN UU form +# complex ligatures with consonants in older Malayalam orthography. 
+# * U+11341 GRANTHA VOWEL SIGN U and U+11342 GRANTHA VOWEL SIGN UU have +# contextually variable placement in Grantha. +# * U+11440 NEWA VOWEL SIGN O and U+11441 NEWA VOWEL SIGN AU have contextually +# variable placement in Newa. +# +# 2. The following characters are all assigned the positional category Top, +# but may have different positions in some cases: +# * U+1143E NEWA VOWEL SIGN E and U+1143F NEWA VOWEL SIGN AI have contextually +# variable placement in Newa. +# +# 3. The following characters are all assigned the positional category Bottom, +# but may have different positions in some cases: +# * U+102F MYANMAR VOWEL SIGN U and U+1030 MYANMAR VOWEL SIGN UU have +# contextually variable placement in Myanmar. +# * U+1A69 TAI THAM VOWEL SIGN U and U+1A6A TAI THAM VOWEL SIGN UU have +# contextually variable placement in Tai Tham. +# +# 4. The following character is assigned the positional category Left, but +# may have different positions in different styles: +# * U+119D2 NANDINAGARI VOWEL SIGN I has stylistically variable placement +# in Nandinagari. + + +# ================================================ + +# Property: Indic_Positional_Category +# +# All code points not explicitly listed for Indic_Positional_Category +# have the value NA (not applicable). 
+# +# @missing: 0000..10FFFF; NA + +# ------------------------------------------------ + +# Indic_Positional_Category=Right + +0903 ; Right # Mc DEVANAGARI SIGN VISARGA +093B ; Right # Mc DEVANAGARI VOWEL SIGN OOE +093E ; Right # Mc DEVANAGARI VOWEL SIGN AA +0940 ; Right # Mc DEVANAGARI VOWEL SIGN II +0949..094C ; Right # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094F ; Right # Mc DEVANAGARI VOWEL SIGN AW +0982..0983 ; Right # Mc [2] BENGALI SIGN ANUSVARA..BENGALI SIGN VISARGA +09BE ; Right # Mc BENGALI VOWEL SIGN AA +09C0 ; Right # Mc BENGALI VOWEL SIGN II +09D7 ; Right # Mc BENGALI AU LENGTH MARK +0A03 ; Right # Mc GURMUKHI SIGN VISARGA +0A3E ; Right # Mc GURMUKHI VOWEL SIGN AA +0A40 ; Right # Mc GURMUKHI VOWEL SIGN II +0A83 ; Right # Mc GUJARATI SIGN VISARGA +0ABE ; Right # Mc GUJARATI VOWEL SIGN AA +0AC0 ; Right # Mc GUJARATI VOWEL SIGN II +0ACB..0ACC ; Right # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0B02..0B03 ; Right # Mc [2] ORIYA SIGN ANUSVARA..ORIYA SIGN VISARGA +0B3E ; Right # Mc ORIYA VOWEL SIGN AA +0B40 ; Right # Mc ORIYA VOWEL SIGN II +0BBE..0BBF ; Right # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC1..0BC2 ; Right # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BD7 ; Right # Mc TAMIL AU LENGTH MARK +0C01..0C03 ; Right # Mc [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN VISARGA +0C41..0C44 ; Right # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C82..0C83 ; Right # Mc [2] KANNADA SIGN ANUSVARA..KANNADA SIGN VISARGA +0CBE ; Right # Mc KANNADA VOWEL SIGN AA +0CC1..0CC4 ; Right # Mc [4] KANNADA VOWEL SIGN U..KANNADA VOWEL SIGN VOCALIC RR +0CD5..0CD6 ; Right # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0D02..0D03 ; Right # Mc [2] MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA +0D3E..0D40 ; Right # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D42 ; Right # Mn [2] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN UU +0D57 ; Right # Mc MALAYALAM AU LENGTH MARK +0D82..0D83 ; Right # 
Mc [2] SINHALA SIGN ANUSVARAYA..SINHALA SIGN VISARGAYA +0DCF..0DD1 ; Right # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD8 ; Right # Mc SINHALA VOWEL SIGN GAETTA-PILLA +0DDF ; Right # Mc SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Right # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Right # Lo THAI CHARACTER SARA A +0E32..0E33 ; Right # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E45 ; Right # Lo THAI CHARACTER LAKKHANGYAO +0EB0 ; Right # Lo LAO VOWEL SIGN A +0EB2..0EB3 ; Right # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0F3E ; Right # Mc TIBETAN SIGN YAR TSHES +0F7F ; Right # Mc TIBETAN SIGN RNAM BCAD +102B..102C ; Right # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +1038 ; Right # Mc MYANMAR SIGN VISARGA +103B ; Right # Mc MYANMAR CONSONANT SIGN MEDIAL YA +1056..1057 ; Right # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1062..1064 ; Right # Mc [3] MYANMAR VOWEL SIGN SGAW KAREN EU..MYANMAR TONE MARK SGAW KAREN KE PHO +1067..106D ; Right # Mc [7] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1083 ; Right # Mc MYANMAR VOWEL SIGN SHAN AA +1087..108C ; Right # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108F ; Right # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109C ; Right # Mc [3] MYANMAR SIGN KHAMTI TONE-1..MYANMAR VOWEL SIGN AITON A +1715 ; Right # Mc TAGALOG SIGN PAMUDPOD +1734 ; Right # Mc HANUNOO SIGN PAMUDPOD +17B6 ; Right # Mc KHMER VOWEL SIGN AA +17C7..17C8 ; Right # Mc [2] KHMER SIGN REAHMUK..KHMER SIGN YUUKALEAPINTU +1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI +1929..192B ; Right # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1930..1931 ; Right # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Right # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +19B0..19B4 ; Right # Lo [5] NEW TAI LUE VOWEL SIGN VOWEL 
SHORTENER..NEW TAI LUE VOWEL SIGN UU +19B8..19B9 ; Right # Lo [2] NEW TAI LUE VOWEL SIGN OA..NEW TAI LUE VOWEL SIGN UE +19BB..19C0 ; Right # Lo [6] NEW TAI LUE VOWEL SIGN AAY..NEW TAI LUE VOWEL SIGN IY +19C8..19C9 ; Right # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A1A ; Right # Mc BUGINESE VOWEL SIGN O +1A57 ; Right # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A61 ; Right # Mc TAI THAM VOWEL SIGN A +1A63..1A64 ; Right # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A6D ; Right # Mc TAI THAM VOWEL SIGN OY +1B04 ; Right # Mc BALINESE SIGN BISAH +1B35 ; Right # Mc BALINESE VOWEL SIGN TEDUNG +1B44 ; Right # Mc BALINESE ADEG ADEG +1B82 ; Right # Mc SUNDANESE SIGN PANGWISAD +1BA1 ; Right # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA7 ; Right # Mc SUNDANESE VOWEL SIGN PANOLONG +1BAA ; Right # Mc SUNDANESE SIGN PAMAAEH +1BE7 ; Right # Mc BATAK VOWEL SIGN E +1BEA..1BEC ; Right # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BEE ; Right # Mc BATAK VOWEL SIGN U +1BF2..1BF3 ; Right # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +1C24..1C26 ; Right # Mc [3] LEPCHA SUBJOINED LETTER YA..LEPCHA VOWEL SIGN AA +1C2A..1C2B ; Right # Mc [2] LEPCHA VOWEL SIGN U..LEPCHA VOWEL SIGN UU +1CE1 ; Right # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF7 ; Right # Mc VEDIC SIGN ATIKRAMA +A823..A824 ; Right # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A827 ; Right # Mc SYLOTI NAGRI VOWEL SIGN OO +A880..A881 ; Right # Mc [2] SAURASHTRA SIGN ANUSVARA..SAURASHTRA SIGN VISARGA +A8B4..A8C3 ; Right # Mc [16] SAURASHTRA CONSONANT SIGN HAARU..SAURASHTRA VOWEL SIGN AU +A952..A953 ; Right # Mc [2] REJANG CONSONANT SIGN H..REJANG VIRAMA +A983 ; Right # Mc JAVANESE SIGN WIGNYAN +A9B4..A9B5 ; Right # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +AA33 ; Right # Mc CHAM CONSONANT SIGN YA +AA4D ; Right # Mc CHAM CONSONANT SIGN FINAL H +AA7B ; Right # Mc MYANMAR SIGN PAO KAREN TONE +AA7D ; Right # Mc MYANMAR SIGN TAI LAING TONE-5 +AAB1 ; Right # 
Lo TAI VIET VOWEL AA +AABA ; Right # Lo TAI VIET VOWEL UA +AABD ; Right # Lo TAI VIET VOWEL AN +AAEF ; Right # Mc MEETEI MAYEK VOWEL SIGN AAU +AAF5 ; Right # Mc MEETEI MAYEK VOWEL SIGN VISARGA +ABE3..ABE4 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE6..ABE7 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE9..ABEA ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +ABEC ; Right # Mc MEETEI MAYEK LUM IYEK +11000 ; Right # Mc BRAHMI SIGN CANDRABINDU +11002 ; Right # Mc BRAHMI SIGN VISARGA +11082 ; Right # Mc KAITHI SIGN VISARGA +110B0 ; Right # Mc KAITHI VOWEL SIGN AA +110B2 ; Right # Mc KAITHI VOWEL SIGN II +110B7..110B8 ; Right # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11145..11146 ; Right # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +11182 ; Right # Mc SHARADA SIGN VISARGA +111B3 ; Right # Mc SHARADA VOWEL SIGN AA +111B5 ; Right # Mc SHARADA VOWEL SIGN II +111C0 ; Right # Mc SHARADA SIGN VIRAMA +1122C..1122E ; Right # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +11235 ; Right # Mc KHOJKI SIGN VIRAMA +112E0 ; Right # Mc KHUDAWADI VOWEL SIGN AA +112E2 ; Right # Mc KHUDAWADI VOWEL SIGN II +11302..11303 ; Right # Mc [2] GRANTHA SIGN ANUSVARA..GRANTHA SIGN VISARGA +1133E..1133F ; Right # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11341..11344 ; Right # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +1134D ; Right # Mc GRANTHA SIGN VIRAMA +11357 ; Right # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Right # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435 ; Right # Mc NEWA VOWEL SIGN AA +11437 ; Right # Mc NEWA VOWEL SIGN II +11440..11441 ; Right # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +11445 ; Right # Mc NEWA SIGN VISARGA +114B0 ; Right # Mc TIRHUTA VOWEL SIGN AA +114B2 ; Right # Mc TIRHUTA VOWEL SIGN II +114BD ; Right # Mc TIRHUTA VOWEL SIGN SHORT O +114C1 ; Right # Mc TIRHUTA SIGN VISARGA +115AF ; 
Right # Mc SIDDHAM VOWEL SIGN AA +115B1 ; Right # Mc SIDDHAM VOWEL SIGN II +115BE ; Right # Mc SIDDHAM SIGN VISARGA +11630..11632 ; Right # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +1163B..1163C ; Right # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +1163E ; Right # Mc MODI SIGN VISARGA +116AC ; Right # Mc TAKRI SIGN VISARGA +116AF ; Right # Mc TAKRI VOWEL SIGN II +116B6 ; Right # Mc TAKRI SIGN VIRAMA +11720..11721 ; Right # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +1182C ; Right # Mc DOGRA VOWEL SIGN AA +1182E ; Right # Mc DOGRA VOWEL SIGN II +11838 ; Right # Mc DOGRA SIGN VISARGA +11930..11934 ; Right # Mc [5] DIVES AKURU VOWEL SIGN AA..DIVES AKURU VOWEL SIGN UU +1193D ; Right # Mc DIVES AKURU SIGN HALANTA +11940 ; Right # Mc DIVES AKURU MEDIAL YA +119D1 ; Right # Mc NANDINAGARI VOWEL SIGN AA +119D3 ; Right # Mc NANDINAGARI VOWEL SIGN II +119DC..119DF ; Right # Mc [4] NANDINAGARI VOWEL SIGN O..NANDINAGARI SIGN VISARGA +11A39 ; Right # Mc ZANABAZAR SQUARE SIGN VISARGA +11A57..11A58 ; Right # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A97 ; Right # Mc SOYOMBO SIGN VISARGA +11C2F ; Right # Mc BHAIKSUKI VOWEL SIGN AA +11C3E ; Right # Mc BHAIKSUKI SIGN VISARGA +11CA9 ; Right # Mc MARCHEN SUBJOINED LETTER YA +11CB4 ; Right # Mc MARCHEN VOWEL SIGN O +11D46 ; Right # Lo MASARAM GONDI REPHA +11D8A..11D8E ; Right # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D93..11D94 ; Right # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11D96 ; Right # Mc GUNJALA GONDI SIGN VISARGA +11EF6 ; Right # Mc MAKASAR VOWEL SIGN O + +# Indic_Positional_Category=Left + +093F ; Left # Mc DEVANAGARI VOWEL SIGN I +094E ; Left # Mc DEVANAGARI VOWEL SIGN PRISHTHAMATRA E +09BF ; Left # Mc BENGALI VOWEL SIGN I +09C7..09C8 ; Left # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +0A3F ; Left # Mc GURMUKHI VOWEL SIGN I +0ABF ; Left # Mc GUJARATI VOWEL SIGN I +0B47 ; Left # Mc ORIYA VOWEL SIGN E +0BC6..0BC8 ; Left # Mc [3] TAMIL VOWEL SIGN 
E..TAMIL VOWEL SIGN AI +0D46..0D48 ; Left # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0DD9 ; Left # Mc SINHALA VOWEL SIGN KOMBUVA +0DDB ; Left # Mc SINHALA VOWEL SIGN KOMBU DEKA +0F3F ; Left # Mc TIBETAN SIGN MAR TSHES +1031 ; Left # Mc MYANMAR VOWEL SIGN E +1084 ; Left # Mc MYANMAR VOWEL SIGN SHAN E +17C1..17C3 ; Left # Mc [3] KHMER VOWEL SIGN E..KHMER VOWEL SIGN AI +1A19 ; Left # Mc BUGINESE VOWEL SIGN E +1A55 ; Left # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A6E..1A72 ; Left # Mc [5] TAI THAM VOWEL SIGN E..TAI THAM VOWEL SIGN THAM AI +1B3E..1B3F ; Left # Mc [2] BALINESE VOWEL SIGN TALING..BALINESE VOWEL SIGN TALING REPA +1BA6 ; Left # Mc SUNDANESE VOWEL SIGN PANAELAENG +1C27..1C28 ; Left # Mc [2] LEPCHA VOWEL SIGN I..LEPCHA VOWEL SIGN O +1C34..1C35 ; Left # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A9BA..A9BB ; Left # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +AA2F..AA30 ; Left # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA34 ; Left # Mc CHAM CONSONANT SIGN RA +AAEB ; Left # Mc MEETEI MAYEK VOWEL SIGN II +AAEE ; Left # Mc MEETEI MAYEK VOWEL SIGN AU +110B1 ; Left # Mc KAITHI VOWEL SIGN I +1112C ; Left # Mc CHAKMA VOWEL SIGN E +111B4 ; Left # Mc SHARADA VOWEL SIGN I +111CE ; Left # Mc SHARADA VOWEL SIGN PRISHTHAMATRA E +112E1 ; Left # Mc KHUDAWADI VOWEL SIGN I +11347..11348 ; Left # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +11436 ; Left # Mc NEWA VOWEL SIGN I +114B1 ; Left # Mc TIRHUTA VOWEL SIGN I +114B9 ; Left # Mc TIRHUTA VOWEL SIGN E +115B0 ; Left # Mc SIDDHAM VOWEL SIGN I +115B8 ; Left # Mc SIDDHAM VOWEL SIGN E +116AE ; Left # Mc TAKRI VOWEL SIGN I +11726 ; Left # Mc AHOM VOWEL SIGN E +1182D ; Left # Mc DOGRA VOWEL SIGN I +11935 ; Left # Mc DIVES AKURU VOWEL SIGN E +11937 ; Left # Mc DIVES AKURU VOWEL SIGN AI +119D2 ; Left # Mc NANDINAGARI VOWEL SIGN I +119E4 ; Left # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E +11CB1 ; Left # Mc MARCHEN VOWEL SIGN I +11EF5 ; Left # Mc MAKASAR VOWEL SIGN 
E + +# Indic_Positional_Category=Visual_Order_Left + +# These are dependent vowels that occur to the left of the consonant +# letter in a syllable, but which occur in scripts using the visual order +# model, instead of the logical order model. Because of the different +# model, these left-side vowels occur first in the backing store (before +# the consonant letter) and are not reordered during text rendering. +# +# [Derivation: Logical_Order_Exception=Yes] + +0E40..0E44 ; Visual_Order_Left # Lo [5] THAI CHARACTER SARA E..THAI CHARACTER SARA AI MAIMALAI +0EC0..0EC4 ; Visual_Order_Left # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +19B5..19B7 ; Visual_Order_Left # Lo [3] NEW TAI LUE VOWEL SIGN E..NEW TAI LUE VOWEL SIGN O +19BA ; Visual_Order_Left # Lo NEW TAI LUE VOWEL SIGN AY +AAB5..AAB6 ; Visual_Order_Left # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB9 ; Visual_Order_Left # Lo TAI VIET VOWEL UEA +AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL AY + +# Indic_Positional_Category=Left_And_Right + +09CB..09CC ; Left_And_Right # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +0B4B ; Left_And_Right # Mc ORIYA VOWEL SIGN O +0BCA..0BCC ; Left_And_Right # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0D4A..0D4C ; Left_And_Right # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0DDC ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA +0DDE ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA +17C0 ; Left_And_Right # Mc KHMER VOWEL SIGN IE +17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU +1B40..1B41 ; Left_And_Right # Mc [2] BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1134B..1134C ; Left_And_Right # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +114BC ; Left_And_Right # Mc TIRHUTA VOWEL SIGN O +114BE ; Left_And_Right # Mc TIRHUTA VOWEL SIGN AU +115BA ; Left_And_Right # Mc SIDDHAM VOWEL SIGN O +11938 ; Left_And_Right # Mc DIVES AKURU VOWEL SIGN 
O + +# Indic_Positional_Category=Top + +0900..0902 ; Top # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +093A ; Top # Mn DEVANAGARI VOWEL SIGN OE +0945..0948 ; Top # Mn [4] DEVANAGARI VOWEL SIGN CANDRA E..DEVANAGARI VOWEL SIGN AI +0951 ; Top # Mn DEVANAGARI STRESS SIGN UDATTA +0953..0955 ; Top # Mn [3] DEVANAGARI GRAVE ACCENT..DEVANAGARI VOWEL SIGN CANDRA LONG E +0981 ; Top # Mn BENGALI SIGN CANDRABINDU +09FE ; Top # Mn BENGALI SANDHI MARK +0A01..0A02 ; Top # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A47..0A48 ; Top # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Top # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0A70..0A71 ; Top # Mn [2] GURMUKHI TIPPI..GURMUKHI ADDAK +0A81..0A82 ; Top # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0AC5 ; Top # Mn GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Top # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AFA..0AFF ; Top # Mn [6] GUJARATI SIGN SUKUN..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B01 ; Top # Mn ORIYA SIGN CANDRABINDU +0B3F ; Top # Mn ORIYA VOWEL SIGN I +0B55..0B56 ; Top # Mn [2] ORIYA SIGN OVERLINE..ORIYA AI LENGTH MARK +0B82 ; Top # Mn TAMIL SIGN ANUSVARA +0BC0 ; Top # Mn TAMIL VOWEL SIGN II +0BCD ; Top # Mn TAMIL SIGN VIRAMA +0C00 ; Top # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C04 ; Top # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C3E..0C40 ; Top # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C46..0C47 ; Top # Mn [2] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN EE +0C4A..0C4D ; Top # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA +0C55 ; Top # Mn TELUGU LENGTH MARK +0C81 ; Top # Mn KANNADA SIGN CANDRABINDU +0CBF ; Top # Mn KANNADA VOWEL SIGN I +0CC6 ; Top # Mn KANNADA VOWEL SIGN E +0CCC..0CCD ; Top # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA +0D00..0D01 ; Top # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D3B..0D3C ; Top # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN 
CIRCULAR VIRAMA +0D4D ; Top # Mn MALAYALAM SIGN VIRAMA +0D4E ; Top # Lo MALAYALAM LETTER DOT REPH +0D81 ; Top # Mn SINHALA SIGN CANDRABINDU +0DCA ; Top # Mn SINHALA SIGN AL-LAKUNA +0DD2..0DD3 ; Top # Mn [2] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN DIGA IS-PILLA +0E31 ; Top # Mn THAI CHARACTER MAI HAN-AKAT +0E34..0E37 ; Top # Mn [4] THAI CHARACTER SARA I..THAI CHARACTER SARA UEE +0E47..0E4E ; Top # Mn [8] THAI CHARACTER MAITAIKHU..THAI CHARACTER YAMAKKAN +0EB1 ; Top # Mn LAO VOWEL SIGN MAI KAN +0EB4..0EB7 ; Top # Mn [4] LAO VOWEL SIGN I..LAO VOWEL SIGN YY +0EBB ; Top # Mn LAO VOWEL SIGN MAI KON +0EC8..0ECD ; Top # Mn [6] LAO TONE MAI EK..LAO NIGGAHITA +0F39 ; Top # Mn TIBETAN MARK TSA -PHRU +0F72 ; Top # Mn TIBETAN VOWEL SIGN I +0F7A..0F7E ; Top # Mn [5] TIBETAN VOWEL SIGN E..TIBETAN SIGN RJES SU NGA RO +0F80 ; Top # Mn TIBETAN VOWEL SIGN REVERSED I +0F82..0F83 ; Top # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +0F86..0F87 ; Top # Mn [2] TIBETAN SIGN LCI RTAGS..TIBETAN SIGN YANG RTAGS +102D..102E ; Top # Mn [2] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN II +1032..1036 ; Top # Mn [5] MYANMAR VOWEL SIGN AI..MYANMAR SIGN ANUSVARA +103A ; Top # Mn MYANMAR SIGN ASAT +1071..1074 ; Top # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1085..1086 ; Top # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109D ; Top # Mn MYANMAR VOWEL SIGN AITON AI +1712 ; Top # Mn TAGALOG VOWEL SIGN I +1732 ; Top # Mn HANUNOO VOWEL SIGN I +1752 ; Top # Mn BUHID VOWEL SIGN I +1772 ; Top # Mn TAGBANWA VOWEL SIGN I +17B7..17BA ; Top # Mn [4] KHMER VOWEL SIGN I..KHMER VOWEL SIGN YY +17C6 ; Top # Mn KHMER SIGN NIKAHIT +17C9..17D1 ; Top # Mn [9] KHMER SIGN MUUSIKATOAN..KHMER SIGN VIRIAM +17D3 ; Top # Mn KHMER SIGN BATHAMASAT +17DD ; Top # Mn KHMER SIGN ATTHACAN +1920..1921 ; Top # Mn [2] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN I +1927..1928 ; Top # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Top # Mn LIMBU SIGN KEMPHRENG 
+1A17 ; Top # Mn BUGINESE VOWEL SIGN I +1A1B ; Top # Mn BUGINESE VOWEL SIGN AE +1A58..1A5A ; Top # Mn [3] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN LOW PA +1A62 ; Top # Mn TAI THAM VOWEL SIGN MAI SAT +1A65..1A68 ; Top # Mn [4] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN UUE +1A6B ; Top # Mn TAI THAM VOWEL SIGN O +1A73..1A7C ; Top # Mn [10] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN KHUEN-LUE KARAN +1B00..1B03 ; Top # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG +1B34 ; Top # Mn BALINESE SIGN REREKAN +1B36..1B37 ; Top # Mn [2] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN ULU SARI +1B42 ; Top # Mn BALINESE VOWEL SIGN PEPET +1B6B ; Top # Mn BALINESE MUSICAL SYMBOL COMBINING TEGEH +1B6D..1B73 ; Top # Mn [7] BALINESE MUSICAL SYMBOL COMBINING KEMPUL..BALINESE MUSICAL SYMBOL COMBINING GONG +1B80..1B81 ; Top # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR +1BA4 ; Top # Mn SUNDANESE VOWEL SIGN PANGHULU +1BA8..1BA9 ; Top # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE6 ; Top # Mn BATAK SIGN TOMPI +1BE8..1BE9 ; Top # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BED ; Top # Mn BATAK VOWEL SIGN KARO O +1BEF..1BF1 ; Top # Mn [3] BATAK VOWEL SIGN U FOR SIMALUNGUN SA..BATAK CONSONANT SIGN H +1C2D..1C33 ; Top # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +1C36 ; Top # Mn LEPCHA SIGN RAN +1CD0..1CD2 ; Top # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CDA..1CDB ; Top # Mn [2] VEDIC TONE DOUBLE SVARITA..VEDIC TONE TRIPLE SVARITA +1CE0 ; Top # Mn VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CF4 ; Top # Mn VEDIC TONE CANDRA ABOVE +1DFB ; Top # Mn COMBINING DELETION MARK +20F0 ; Top # Mn COMBINING ASTERISK ABOVE +A802 ; Top # Mn SYLOTI NAGRI SIGN DVISVARA +A806 ; Top # Mn SYLOTI NAGRI SIGN HASANTA +A80B ; Top # Mn SYLOTI NAGRI SIGN ANUSVARA +A826 ; Top # Mn SYLOTI NAGRI VOWEL SIGN E +A8C5 ; Top # Mn SAURASHTRA SIGN CANDRABINDU +A8E0..A8F1 ; Top # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING 
DEVANAGARI SIGN AVAGRAHA +A8FF ; Top # Mn DEVANAGARI VOWEL SIGN AY +A94A ; Top # Mn REJANG VOWEL SIGN AI +A94F..A951 ; Top # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A980..A982 ; Top # Mn [3] JAVANESE SIGN PANYANGGA..JAVANESE SIGN LAYAR +A9B3 ; Top # Mn JAVANESE SIGN CECAK TELU +A9B6..A9B7 ; Top # Mn [2] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN WULU MELIK +A9BC ; Top # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Top # Mn MYANMAR SIGN SHAN SAW +AA29..AA2C ; Top # Mn [4] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN EI +AA2E ; Top # Mn CHAM VOWEL SIGN OE +AA31 ; Top # Mn CHAM VOWEL SIGN AU +AA43 ; Top # Mn CHAM CONSONANT SIGN FINAL NG +AA4C ; Top # Mn CHAM CONSONANT SIGN FINAL M +AA7C ; Top # Mn MYANMAR SIGN TAI LAING TONE-2 +AAB0 ; Top # Mn TAI VIET MAI KANG +AAB2..AAB3 ; Top # Mn [2] TAI VIET VOWEL I..TAI VIET VOWEL UE +AAB7..AAB8 ; Top # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AABE..AABF ; Top # Mn [2] TAI VIET VOWEL AM..TAI VIET TONE MAI EK +AAC1 ; Top # Mn TAI VIET TONE MAI THO +AAED ; Top # Mn MEETEI MAYEK VOWEL SIGN AAI +ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP +10A05 ; Top # Mn KHAROSHTHI VOWEL SIGN E +10A0F ; Top # Mn KHAROSHTHI SIGN VISARGA +10A38 ; Top # Mn KHAROSHTHI SIGN BAR ABOVE +11001 ; Top # Mn BRAHMI SIGN ANUSVARA +11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II +11042..11046 ; Top # Mn [5] BRAHMI VOWEL SIGN E..BRAHMI VIRAMA +11070 ; Top # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11073..11074 ; Top # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +11080..11081 ; Top # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI VOWEL SIGN AI +11100..11102 ; Top # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA +11127..11129 ; Top # Mn [3] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN II +1112D ; Top # Mn CHAKMA VOWEL SIGN AI +11130 ; Top # Mn CHAKMA VOWEL SIGN OI +11134 ; Top # Mn CHAKMA MAAYYAA +11180..11181 ; Top # Mn [2] SHARADA SIGN 
CANDRABINDU..SHARADA SIGN ANUSVARA +111BC..111BE ; Top # Mn [3] SHARADA VOWEL SIGN E..SHARADA VOWEL SIGN O +111C2..111C3 ; Top # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA +111CB ; Top # Mn SHARADA VOWEL MODIFIER MARK +111CF ; Top # Mn SHARADA SIGN INVERTED CANDRABINDU +11230..11231 ; Top # Mn [2] KHOJKI VOWEL SIGN E..KHOJKI VOWEL SIGN AI +11234 ; Top # Mn KHOJKI SIGN ANUSVARA +11236..11237 ; Top # Mn [2] KHOJKI SIGN NUKTA..KHOJKI SIGN SHADDA +1123E ; Top # Mn KHOJKI SIGN SUKUN +112DF ; Top # Mn KHUDAWADI SIGN ANUSVARA +112E5..112E8 ; Top # Mn [4] KHUDAWADI VOWEL SIGN E..KHUDAWADI VOWEL SIGN AU +11300..11301 ; Top # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11340 ; Top # Mn GRANTHA VOWEL SIGN II +11366..1136C ; Top # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Top # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA +1143E..1143F ; Top # Mn [2] NEWA VOWEL SIGN E..NEWA VOWEL SIGN AI +11443..11444 ; Top # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +1145E ; Top # Mn NEWA SANDHI MARK +114BA ; Top # Mn TIRHUTA VOWEL SIGN SHORT E +114BF..114C0 ; Top # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Top # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +11639..1163A ; Top # Mn [2] MODI VOWEL SIGN E..MODI VOWEL SIGN AI +1163D ; Top # Mn MODI SIGN ANUSVARA +11640 ; Top # Mn MODI SIGN ARDHACANDRA +116AB ; Top # Mn TAKRI SIGN ANUSVARA +116AD ; Top # Mn TAKRI VOWEL SIGN AA +116B2..116B5 ; Top # Mn [4] TAKRI VOWEL SIGN E..TAKRI VOWEL SIGN AU +1171F ; Top # Mn AHOM CONSONANT SIGN MEDIAL LIGATING RA +11722..11723 ; Top # Mn [2] AHOM VOWEL SIGN I..AHOM VOWEL SIGN II +11727 ; Top # Mn AHOM VOWEL SIGN AW +11729..1172B ; Top # Mn [3] AHOM VOWEL SIGN AI..AHOM SIGN KILLER +11833..11837 ; Top # Mn [5] DOGRA VOWEL SIGN E..DOGRA SIGN ANUSVARA +1193B..1193C ; Top # Mn [2] DIVES AKURU SIGN ANUSVARA..DIVES AKURU SIGN CANDRABINDU +1193F ; Top # Lo DIVES AKURU 
PREFIXED NASAL SIGN +11941 ; Top # Lo DIVES AKURU INITIAL RA +119DA..119DB ; Top # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI +11A01 ; Top # Mn ZANABAZAR SQUARE VOWEL SIGN I +11A04..11A09 ; Top # Mn [6] ZANABAZAR SQUARE VOWEL SIGN E..ZANABAZAR SQUARE VOWEL SIGN REVERSED I +11A35..11A38 ; Top # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A3A ; Top # Lo ZANABAZAR SQUARE CLUSTER-INITIAL LETTER RA +11A51 ; Top # Mn SOYOMBO VOWEL SIGN I +11A54..11A56 ; Top # Mn [3] SOYOMBO VOWEL SIGN E..SOYOMBO VOWEL SIGN OE +11A84..11A89 ; Top # Lo [6] SOYOMBO SIGN JIHVAMULIYA..SOYOMBO CLUSTER-INITIAL LETTER SA +11A96 ; Top # Mn SOYOMBO SIGN ANUSVARA +11A98 ; Top # Mn SOYOMBO GEMINATION MARK +11C30..11C31 ; Top # Mn [2] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN II +11C38..11C3D ; Top # Mn [6] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI SIGN ANUSVARA +11CB3 ; Top # Mn MARCHEN VOWEL SIGN E +11CB5..11CB6 ; Top # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D31..11D35 ; Top # Mn [5] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN UU +11D3A ; Top # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Top # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F..11D41 ; Top # Mn [3] MASARAM GONDI VOWEL SIGN AU..MASARAM GONDI SIGN VISARGA +11D43 ; Top # Mn MASARAM GONDI SIGN CANDRA +11D90..11D91 ; Top # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI +11D95 ; Top # Mn GUNJALA GONDI SIGN ANUSVARA +11EF3 ; Top # Mn MAKASAR VOWEL SIGN I + +# Indic_Positional_Category=Bottom + +093C ; Bottom # Mn DEVANAGARI SIGN NUKTA +0941..0944 ; Bottom # Mn [4] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN VOCALIC RR +094D ; Bottom # Mn DEVANAGARI SIGN VIRAMA +0952 ; Bottom # Mn DEVANAGARI STRESS SIGN ANUDATTA +0956..0957 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN UE..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BC ; Bottom # Mn BENGALI SIGN NUKTA 
+09C1..09C4 ; Bottom # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09CD ; Bottom # Mn BENGALI SIGN VIRAMA +09E2..09E3 ; Bottom # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3C ; Bottom # Mn GURMUKHI SIGN NUKTA +0A41..0A42 ; Bottom # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A4D ; Bottom # Mn GURMUKHI SIGN VIRAMA +0A51 ; Bottom # Mn GURMUKHI SIGN UDAAT +0A75 ; Bottom # Mn GURMUKHI SIGN YAKASH +0ABC ; Bottom # Mn GUJARATI SIGN NUKTA +0AC1..0AC4 ; Bottom # Mn [4] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN VOCALIC RR +0ACD ; Bottom # Mn GUJARATI SIGN VIRAMA +0AE2..0AE3 ; Bottom # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3C ; Bottom # Mn ORIYA SIGN NUKTA +0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B4D ; Bottom # Mn ORIYA SIGN VIRAMA +0B62..0B63 ; Bottom # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0C3C ; Bottom # Mn TELUGU SIGN NUKTA +0C56 ; Bottom # Mn TELUGU AI LENGTH MARK +0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBC ; Bottom # Mn KANNADA SIGN NUKTA +0CE2..0CE3 ; Bottom # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D43..0D44 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC R..MALAYALAM VOWEL SIGN VOCALIC RR +0D62..0D63 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DD4 ; Bottom # Mn SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Bottom # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0E38..0E3A ; Bottom # Mn [3] THAI CHARACTER SARA U..THAI CHARACTER PHINTHU +0EB8..0EBA ; Bottom # Mn [3] LAO VOWEL SIGN U..LAO SIGN PALI VIRAMA +0EBC ; Bottom # Mn LAO SEMIVOWEL SIGN LO +0F18..0F19 ; Bottom # Mn [2] TIBETAN ASTROLOGICAL SIGN -KHYUD PA..TIBETAN ASTROLOGICAL SIGN SDONG TSHUGS +0F35 ; Bottom # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Bottom # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0F71 ; Bottom # Mn TIBETAN VOWEL SIGN AA +0F74..0F75 ; 
Bottom # Mn [2] TIBETAN VOWEL SIGN U..TIBETAN VOWEL SIGN UU +0F84 ; Bottom # Mn TIBETAN MARK HALANTA +0F8D..0F97 ; Bottom # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Bottom # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +0FC6 ; Bottom # Mn TIBETAN SYMBOL PADMA GDAN +102F..1030 ; Bottom # Mn [2] MYANMAR VOWEL SIGN U..MYANMAR VOWEL SIGN UU +1037 ; Bottom # Mn MYANMAR SIGN DOT BELOW +103D..103E ; Bottom # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +1058..1059 ; Bottom # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +105E..1060 ; Bottom # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Bottom # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +108D ; Bottom # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +1713..1714 ; Bottom # Mn [2] TAGALOG VOWEL SIGN U..TAGALOG SIGN VIRAMA +1733 ; Bottom # Mn HANUNOO VOWEL SIGN U +1753 ; Bottom # Mn BUHID VOWEL SIGN U +1773 ; Bottom # Mn TAGBANWA VOWEL SIGN U +17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA +1922 ; Bottom # Mn LIMBU VOWEL SIGN U +1932 ; Bottom # Mn LIMBU SMALL LETTER ANUSVARA +1939 ; Bottom # Mn LIMBU SIGN MUKPHRENG +193B ; Bottom # Mn LIMBU SIGN SA-I +1A18 ; Bottom # Mn BUGINESE VOWEL SIGN U +1A56 ; Bottom # Mn TAI THAM CONSONANT SIGN MEDIAL LA +1A5B..1A5E ; Bottom # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1A69..1A6A ; Bottom # Mn [2] TAI THAM VOWEL SIGN U..TAI THAM VOWEL SIGN UU +1A6C ; Bottom # Mn TAI THAM VOWEL SIGN OA BELOW +1A7F ; Bottom # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1B38..1B3A ; Bottom # Mn [3] BALINESE VOWEL SIGN SUKU..BALINESE VOWEL SIGN RA REPA +1B6C ; Bottom # Mn BALINESE MUSICAL SYMBOL COMBINING ENDEP +1BA2..1BA3 ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BA5 ; Bottom # Mn SUNDANESE VOWEL SIGN PANYUKU +1BAC..1BAD ; Bottom # Mn [2] 
SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C2C ; Bottom # Mn LEPCHA VOWEL SIGN E +1C37 ; Bottom # Mn LEPCHA SIGN NUKTA +1CD5..1CD9 ; Bottom # Mn [5] VEDIC TONE YAJURVEDIC AGGRAVATED INDEPENDENT SVARITA..VEDIC TONE YAJURVEDIC KATHAKA INDEPENDENT SVARITA SCHROEDER +1CDC..1CDF ; Bottom # Mn [4] VEDIC TONE KATHAKA ANUDATTA..VEDIC TONE THREE DOTS BELOW +1CED ; Bottom # Mn VEDIC SIGN TIRYAK +A825 ; Bottom # Mn SYLOTI NAGRI VOWEL SIGN U +A82C ; Bottom # Mn SYLOTI NAGRI SIGN ALTERNATE HASANTA +A8C4 ; Bottom # Mn SAURASHTRA SIGN VIRAMA +A92B..A92D ; Bottom # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +A947..A949 ; Bottom # Mn [3] REJANG VOWEL SIGN I..REJANG VOWEL SIGN E +A94B..A94E ; Bottom # Mn [4] REJANG VOWEL SIGN O..REJANG VOWEL SIGN EA +A9B8..A9B9 ; Bottom # Mn [2] JAVANESE VOWEL SIGN SUKU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BD ; Bottom # Mn JAVANESE CONSONANT SIGN KERET +AA2D ; Bottom # Mn CHAM VOWEL SIGN U +AA32 ; Bottom # Mn CHAM VOWEL SIGN UE +AA35..AA36 ; Bottom # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +AAB4 ; Bottom # Mn TAI VIET VOWEL U +AAEC ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UU +ABE8 ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK +10A02..10A03 ; Bottom # Mn [2] KHAROSHTHI VOWEL SIGN U..KHAROSHTHI VOWEL SIGN VOCALIC R +10A0C..10A0E ; Bottom # Mn [3] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN ANUSVARA +10A39..10A3A ; Bottom # Mn [2] KHAROSHTHI SIGN CAUDA..KHAROSHTHI SIGN DOT BELOW +1103C..11041 ; Bottom # Mn [6] BRAHMI VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL +110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU +110B9..110BA ; Bottom # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +110C2 ; Bottom # Mn KAITHI VOWEL SIGN VOCALIC R +1112A..1112B ; Bottom # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU +11131..11132 ; Bottom # Mn [2] CHAKMA O MARK..CHAKMA AU MARK +11173 ; Bottom # Mn MAHAJANI SIGN NUKTA +111B6..111BB ; Bottom # Mn [6] 
SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN VOCALIC LL +111C9..111CA ; Bottom # Mn [2] SHARADA SANDHI MARK..SHARADA SIGN NUKTA +111CC ; Bottom # Mn SHARADA EXTRA SHORT VOWEL MARK +1122F ; Bottom # Mn KHOJKI VOWEL SIGN U +112E3..112E4 ; Bottom # Mn [2] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN UU +112E9..112EA ; Bottom # Mn [2] KHUDAWADI SIGN NUKTA..KHUDAWADI SIGN VIRAMA +1133B..1133C ; Bottom # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +11438..1143D ; Bottom # Mn [6] NEWA VOWEL SIGN U..NEWA VOWEL SIGN VOCALIC LL +11442 ; Bottom # Mn NEWA SIGN VIRAMA +11446 ; Bottom # Mn NEWA SIGN NUKTA +114B3..114B8 ; Bottom # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114C2..114C3 ; Bottom # Mn [2] TIRHUTA SIGN VIRAMA..TIRHUTA SIGN NUKTA +115B2..115B5 ; Bottom # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115BF..115C0 ; Bottom # Mn [2] SIDDHAM SIGN VIRAMA..SIDDHAM SIGN NUKTA +115DC..115DD ; Bottom # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11633..11638 ; Bottom # Mn [6] MODI VOWEL SIGN U..MODI VOWEL SIGN VOCALIC LL +1163F ; Bottom # Mn MODI SIGN VIRAMA +116B0..116B1 ; Bottom # Mn [2] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN UU +116B7 ; Bottom # Mn TAKRI SIGN NUKTA +1171D ; Bottom # Mn AHOM CONSONANT SIGN MEDIAL LA +11724..11725 ; Bottom # Mn [2] AHOM VOWEL SIGN U..AHOM VOWEL SIGN UU +11728 ; Bottom # Mn AHOM VOWEL SIGN O +1182F..11832 ; Bottom # Mn [4] DOGRA VOWEL SIGN U..DOGRA VOWEL SIGN VOCALIC RR +11839..1183A ; Bottom # Mn [2] DOGRA SIGN VIRAMA..DOGRA SIGN NUKTA +11943 ; Bottom # Mn DIVES AKURU SIGN NUKTA +119D4..119D7 ; Bottom # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR +119E0 ; Bottom # Mn NANDINAGARI SIGN VIRAMA +11A02..11A03 ; Bottom # Mn [2] ZANABAZAR SQUARE VOWEL SIGN UE..ZANABAZAR SQUARE VOWEL SIGN U +11A0A ; Bottom # Mn ZANABAZAR SQUARE VOWEL LENGTH MARK +11A33..11A34 ; Bottom # Mn [2] ZANABAZAR SQUARE FINAL CONSONANT MARK..ZANABAZAR SQUARE SIGN VIRAMA +11A3B..11A3E ; Bottom # 
Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11A52..11A53 ; Bottom # Mn [2] SOYOMBO VOWEL SIGN UE..SOYOMBO VOWEL SIGN U +11A59..11A5B ; Bottom # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11A8A..11A95 ; Bottom # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A +11C32..11C36 ; Bottom # Mn [5] BHAIKSUKI VOWEL SIGN U..BHAIKSUKI VOWEL SIGN VOCALIC L +11C3F ; Bottom # Mn BHAIKSUKI SIGN VIRAMA +11C92..11CA7 ; Bottom # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CAA..11CB0 ; Bottom # Mn [7] MARCHEN SUBJOINED LETTER RA..MARCHEN VOWEL SIGN AA +11CB2 ; Bottom # Mn MARCHEN VOWEL SIGN U +11D36 ; Bottom # Mn MASARAM GONDI VOWEL SIGN VOCALIC R +11D42 ; Bottom # Mn MASARAM GONDI SIGN NUKTA +11D44 ; Bottom # Mn MASARAM GONDI SIGN HALANTA +11D47 ; Bottom # Mn MASARAM GONDI RA-KARA +11EF4 ; Bottom # Mn MAKASAR VOWEL SIGN U + +# Indic_Positional_Category=Top_And_Bottom + +0C48 ; Top_And_Bottom # Mn TELUGU VOWEL SIGN AI +0F73 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN II +0F76..0F79 ; Top_And_Bottom # Mn [4] TIBETAN VOWEL SIGN VOCALIC R..TIBETAN VOWEL SIGN VOCALIC LL +0F81 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN REVERSED II +1B3C ; Top_And_Bottom # Mn BALINESE VOWEL SIGN LA LENGA +1112E..1112F ; Top_And_Bottom # Mn [2] CHAKMA VOWEL SIGN O..CHAKMA VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Right + +0AC9 ; Top_And_Right # Mc GUJARATI VOWEL SIGN CANDRA O +0B57 ; Top_And_Right # Mc ORIYA AU LENGTH MARK +0CC0 ; Top_And_Right # Mc KANNADA VOWEL SIGN II +0CC7..0CC8 ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +1925..1926 ; Top_And_Right # Mc [2] LIMBU VOWEL SIGN OO..LIMBU VOWEL SIGN AU +1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG +111BF ; Top_And_Right # Mc SHARADA VOWEL SIGN AU +11232..11233 ; Top_And_Right # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL 
SIGN AU + +# Indic_Positional_Category=Top_And_Left + +0B48 ; Top_And_Left # Mc ORIYA VOWEL SIGN AI +0DDA ; Top_And_Left # Mc SINHALA VOWEL SIGN DIGA KOMBUVA +17BE ; Top_And_Left # Mc KHMER VOWEL SIGN OE +1C29 ; Top_And_Left # Mc LEPCHA VOWEL SIGN OO +114BB ; Top_And_Left # Mc TIRHUTA VOWEL SIGN AI +115B9 ; Top_And_Left # Mc SIDDHAM VOWEL SIGN AI + +# Indic_Positional_Category=Top_And_Left_And_Right + +0B4C ; Top_And_Left_And_Right # Mc ORIYA VOWEL SIGN AU +0DDD ; Top_And_Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA +17BF ; Top_And_Left_And_Right # Mc KHMER VOWEL SIGN YA +115BB ; Top_And_Left_And_Right # Mc SIDDHAM VOWEL SIGN AU + +# Indic_Positional_Category=Bottom_And_Right + +1B3B ; Bottom_And_Right # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +A9BE ; Bottom_And_Right # Mc JAVANESE CONSONANT SIGN PENGKAL +A9C0 ; Bottom_And_Right # Mc JAVANESE PANGKON +11942 ; Bottom_And_Right # Mc DIVES AKURU MEDIAL RA + +# Indic_Positional_Category=Bottom_And_Left + +A9BF ; Bottom_And_Left # Mc JAVANESE CONSONANT SIGN CAKRA + +# Indic_Positional_Category=Top_And_Bottom_And_Right + +1B3D ; Top_And_Bottom_And_Right # Mc BALINESE VOWEL SIGN LA LENGA TEDUNG + +# Indic_Positional_Category=Top_And_Bottom_And_Left + +103C ; Top_And_Bottom_And_Left # Mc MYANMAR CONSONANT SIGN MEDIAL RA +1171E ; Top_And_Bottom_And_Left # Mn AHOM CONSONANT SIGN MEDIAL RA + +# Indic_Positional_Category=Overstruck + +1CD4 ; Overstruck # Mn VEDIC SIGN YAJURVEDIC MIDLINE SVARITA +1CE2..1CE8 ; Overstruck # Mn [7] VEDIC SIGN VISARGA SVARITA..VEDIC SIGN VISARGA ANUDATTA WITH TAIL +10A01 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN I +10A06 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN O + +# EOF diff --git a/data/14.0.0-indic-syllabic-category.txt b/data/14.0.0-indic-syllabic-category.txt new file mode 100644 index 0000000..23b8637 --- /dev/null +++ b/data/14.0.0-indic-syllabic-category.txt @@ -0,0 +1,1320 @@ +# IndicSyllabicCategory-14.0.0.txt +# Date: 2021-05-22, 01:01:00 GMT [KW, RP] +# © 2021 
Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Syllabic_Category enumerated property +# +# Scope: This property is aimed at two general problem +# areas involving the analysis and processing of Indic scripts: +# +# 1. Specification of syllabic structure. +# 2. Specification of segmentation rules. +# +# Both of these problem areas may benefit from having defined subtypes +# of Indic script characters which are relevant to how Indic +# syllables (or aksaras) are constructed. Note that rules for +# syllabic structure in Indic scripts may differ significantly +# from how phonological syllables are defined. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Syllabic_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. 
+# +# The scripts assessed as Indic in the structural sense used for the +# Indic_Syllabic_Category are the following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dives Akuru, Dogra, Grantha, Gujarati, +# Gunjala Gondi, Gurmukhi, Hanunoo, Javanese, Kaithi, Kannada, +# Kayah Li, Kharoshthi, Khmer, Khojki, Khudawadi, Lao, Lepcha, Limbu, +# Mahajani, Makasar, Malayalam, Marchen, Masaram Gondi, Meetei Mayek, +# Modi, Multani, Myanmar, Nandinagari, Newa, New Tai Lue, Oriya, +# Phags-pa, Rejang, Saurashtra, Sharada, Siddham, Sinhala, Soyombo, +# Sundanese, Syloti Nagri, Tagalog, Tagbanwa, Tai Le, Tai Tham, +# Tai Viet, Takri, Tamil, Telugu, Thai, Tibetan, Tirhuta, and +# Zanabazar Square. +# +# All characters for all other scripts not in that list +# take the default value for this property, unless they +# are individually listed in this data file. +# + +# ================================================ + +# Property: Indic_Syllabic_Category +# +# All code points not explicitly listed for Indic_Syllabic_Category +# have the value Other. 
+# +# @missing: 0000..10FFFF; Other + +# ================================================ + +# Indic_Syllabic_Category=Bindu + +# Bindu/Anusvara (nasalization or -n) + +# [Not derivable] + +0900..0902 ; Bindu # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +0981 ; Bindu # Mn BENGALI SIGN CANDRABINDU +0982 ; Bindu # Mc BENGALI SIGN ANUSVARA +09FC ; Bindu # Lo BENGALI LETTER VEDIC ANUSVARA +0A01..0A02 ; Bindu # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A70 ; Bindu # Mn GURMUKHI TIPPI +0A81..0A82 ; Bindu # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0B01 ; Bindu # Mn ORIYA SIGN CANDRABINDU +0B02 ; Bindu # Mc ORIYA SIGN ANUSVARA +0B82 ; Bindu # Mn TAMIL SIGN ANUSVARA +0C00 ; Bindu # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C01..0C02 ; Bindu # Mc [2] TELUGU SIGN CANDRABINDU..TELUGU SIGN ANUSVARA +0C04 ; Bindu # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C80 ; Bindu # Lo KANNADA SIGN SPACING CANDRABINDU +0C81 ; Bindu # Mn KANNADA SIGN CANDRABINDU +0C82 ; Bindu # Mc KANNADA SIGN ANUSVARA +0D00..0D01 ; Bindu # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D02 ; Bindu # Mc MALAYALAM SIGN ANUSVARA +0D04 ; Bindu # Lo MALAYALAM LETTER VEDIC ANUSVARA +0D81 ; Bindu # Mn SINHALA SIGN CANDRABINDU +0D82 ; Bindu # Mc SINHALA SIGN ANUSVARAYA +0E4D ; Bindu # Mn THAI CHARACTER NIKHAHIT +0ECD ; Bindu # Mn LAO NIGGAHITA +0F7E ; Bindu # Mn TIBETAN SIGN RJES SU NGA RO +0F82..0F83 ; Bindu # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +1036 ; Bindu # Mn MYANMAR SIGN ANUSVARA +17C6 ; Bindu # Mn KHMER SIGN NIKAHIT +1932 ; Bindu # Mn LIMBU SMALL LETTER ANUSVARA +1A74 ; Bindu # Mn TAI THAM SIGN MAI KANG +1B00..1B02 ; Bindu # Mn [3] BALINESE SIGN ULU RICEM..BALINESE SIGN CECEK +1B80 ; Bindu # Mn SUNDANESE SIGN PANYECEK +1C34..1C35 ; Bindu # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A80B ; Bindu # Mn SYLOTI NAGRI SIGN ANUSVARA +A873 ; Bindu # Lo PHAGS-PA LETTER CANDRABINDU 
+A880 ; Bindu # Mc SAURASHTRA SIGN ANUSVARA +A8C5 ; Bindu # Mn SAURASHTRA SIGN CANDRABINDU +A8F2..A8F3 ; Bindu # Lo [2] DEVANAGARI SIGN SPACING CANDRABINDU..DEVANAGARI SIGN CANDRABINDU VIRAMA +A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK +10A0E ; Bindu # Mn KHAROSHTHI SIGN ANUSVARA +11000 ; Bindu # Mc BRAHMI SIGN CANDRABINDU +11001 ; Bindu # Mn BRAHMI SIGN ANUSVARA +11080..11081 ; Bindu # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +11100..11101 ; Bindu # Mn [2] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN ANUSVARA +11180..11181 ; Bindu # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +111CF ; Bindu # Mn SHARADA SIGN INVERTED CANDRABINDU +11234 ; Bindu # Mn KHOJKI SIGN ANUSVARA +112DF ; Bindu # Mn KHUDAWADI SIGN ANUSVARA +11300..11301 ; Bindu # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11302 ; Bindu # Mc GRANTHA SIGN ANUSVARA +1135E..1135F ; Bindu # Lo [2] GRANTHA LETTER VEDIC ANUSVARA..GRANTHA LETTER VEDIC DOUBLE ANUSVARA +11443..11444 ; Bindu # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +1145F ; Bindu # Lo NEWA LETTER VEDIC ANUSVARA +114BF..114C0 ; Bindu # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Bindu # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +1163D ; Bindu # Mn MODI SIGN ANUSVARA +116AB ; Bindu # Mn TAKRI SIGN ANUSVARA +11837 ; Bindu # Mn DOGRA SIGN ANUSVARA +1193B..1193C ; Bindu # Mn [2] DIVES AKURU SIGN ANUSVARA..DIVES AKURU SIGN CANDRABINDU +119DE ; Bindu # Mc NANDINAGARI SIGN ANUSVARA +11A35..11A38 ; Bindu # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A96 ; Bindu # Mn SOYOMBO SIGN ANUSVARA +11C3C..11C3D ; Bindu # Mn [2] BHAIKSUKI SIGN CANDRABINDU..BHAIKSUKI SIGN ANUSVARA +11CB5..11CB6 ; Bindu # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D40 ; Bindu # Mn MASARAM GONDI SIGN ANUSVARA +11D95 ; Bindu # Mn GUNJALA GONDI SIGN ANUSVARA + +# ================================================ + +# 
Indic_Syllabic_Category=Visarga + +# Visarga (-h) +# Excludes letters for jihvamuliya and upadhmaniya, which are +# related, but structured somewhat differently. + +# [Not derivable] + +0903 ; Visarga # Mc DEVANAGARI SIGN VISARGA +0983 ; Visarga # Mc BENGALI SIGN VISARGA +0A03 ; Visarga # Mc GURMUKHI SIGN VISARGA +0A83 ; Visarga # Mc GUJARATI SIGN VISARGA +0B03 ; Visarga # Mc ORIYA SIGN VISARGA +0C03 ; Visarga # Mc TELUGU SIGN VISARGA +0C83 ; Visarga # Mc KANNADA SIGN VISARGA +0D03 ; Visarga # Mc MALAYALAM SIGN VISARGA +0D83 ; Visarga # Mc SINHALA SIGN VISARGAYA +0F7F ; Visarga # Mc TIBETAN SIGN RNAM BCAD +1038 ; Visarga # Mc MYANMAR SIGN VISARGA +17C7 ; Visarga # Mc KHMER SIGN REAHMUK +1B04 ; Visarga # Mc BALINESE SIGN BISAH +1B82 ; Visarga # Mc SUNDANESE SIGN PANGWISAD +A881 ; Visarga # Mc SAURASHTRA SIGN VISARGA +A983 ; Visarga # Mc JAVANESE SIGN WIGNYAN +AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA +10A0F ; Visarga # Mn KHAROSHTHI SIGN VISARGA +11002 ; Visarga # Mc BRAHMI SIGN VISARGA +11082 ; Visarga # Mc KAITHI SIGN VISARGA +11102 ; Visarga # Mn CHAKMA SIGN VISARGA +11182 ; Visarga # Mc SHARADA SIGN VISARGA +11303 ; Visarga # Mc GRANTHA SIGN VISARGA +11445 ; Visarga # Mc NEWA SIGN VISARGA +114C1 ; Visarga # Mc TIRHUTA SIGN VISARGA +115BE ; Visarga # Mc SIDDHAM SIGN VISARGA +1163E ; Visarga # Mc MODI SIGN VISARGA +116AC ; Visarga # Mc TAKRI SIGN VISARGA +11838 ; Visarga # Mc DOGRA SIGN VISARGA +119DF ; Visarga # Mc NANDINAGARI SIGN VISARGA +11A39 ; Visarga # Mc ZANABAZAR SQUARE SIGN VISARGA +11A97 ; Visarga # Mc SOYOMBO SIGN VISARGA +11C3E ; Visarga # Mc BHAIKSUKI SIGN VISARGA +11D41 ; Visarga # Mn MASARAM GONDI SIGN VISARGA +11D96 ; Visarga # Mc GUNJALA GONDI SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Avagraha + +# Avagraha (elision of initial a- in sandhi) + +# [Not derivable] + +093D ; Avagraha # Lo DEVANAGARI SIGN AVAGRAHA +09BD ; Avagraha # Lo BENGALI SIGN AVAGRAHA +0ABD ; Avagraha # Lo GUJARATI 
SIGN AVAGRAHA +0B3D ; Avagraha # Lo ORIYA SIGN AVAGRAHA +0C3D ; Avagraha # Lo TELUGU SIGN AVAGRAHA +0CBD ; Avagraha # Lo KANNADA SIGN AVAGRAHA +0D3D ; Avagraha # Lo MALAYALAM SIGN AVAGRAHA +0F85 ; Avagraha # Po TIBETAN MARK PALUTA +17DC ; Avagraha # Lo KHMER SIGN AVAKRAHASANYA +1BBA ; Avagraha # Lo SUNDANESE AVAGRAHA +111C1 ; Avagraha # Lo SHARADA SIGN AVAGRAHA +1133D ; Avagraha # Lo GRANTHA SIGN AVAGRAHA +11447 ; Avagraha # Lo NEWA SIGN AVAGRAHA +114C4 ; Avagraha # Lo TIRHUTA SIGN AVAGRAHA +119E1 ; Avagraha # Lo NANDINAGARI SIGN AVAGRAHA +11A9D ; Avagraha # Lo SOYOMBO MARK PLUTA +11C40 ; Avagraha # Lo BHAIKSUKI SIGN AVAGRAHA + +# ================================================ + +# Indic_Syllabic_Category=Nukta + +# Nukta (diacritic for borrowed consonants or other consonant +# modifications). Note that while the resulting sound is typically a +# consonant, the base letter a nukta follows may be an independent +# vowel. For example, is used to transcribe ARABIC LETTER +# AIN. + +# [Not derivable] + +093C ; Nukta # Mn DEVANAGARI SIGN NUKTA +09BC ; Nukta # Mn BENGALI SIGN NUKTA +0A3C ; Nukta # Mn GURMUKHI SIGN NUKTA +0ABC ; Nukta # Mn GUJARATI SIGN NUKTA +0AFD..0AFF ; Nukta # Mn [3] GUJARATI SIGN THREE-DOT NUKTA ABOVE..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0C3C ; Nukta # Mn TELUGU SIGN NUKTA +0CBC ; Nukta # Mn KANNADA SIGN NUKTA +0F39 ; Nukta # Mn TIBETAN MARK TSA -PHRU +1B34 ; Nukta # Mn BALINESE SIGN REREKAN +1BE6 ; Nukta # Mn BATAK SIGN TOMPI +1C37 ; Nukta # Mn LEPCHA SIGN NUKTA +A9B3 ; Nukta # Mn JAVANESE SIGN CECAK TELU +10A38..10A3A ; Nukta # Mn [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW +110BA ; Nukta # Mn KAITHI SIGN NUKTA +11173 ; Nukta # Mn MAHAJANI SIGN NUKTA +111CA ; Nukta # Mn SHARADA SIGN NUKTA +11236 ; Nukta # Mn KHOJKI SIGN NUKTA +112E9 ; Nukta # Mn KHUDAWADI SIGN NUKTA +1133B..1133C ; Nukta # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +11446 ; Nukta # Mn NEWA SIGN NUKTA +114C3 ; Nukta # Mn 
TIRHUTA SIGN NUKTA +115C0 ; Nukta # Mn SIDDHAM SIGN NUKTA +116B7 ; Nukta # Mn TAKRI SIGN NUKTA +1183A ; Nukta # Mn DOGRA SIGN NUKTA +11943 ; Nukta # Mn DIVES AKURU SIGN NUKTA +11D42 ; Nukta # Mn MASARAM GONDI SIGN NUKTA + +# ================================================ + +# Indic_Syllabic_Category=Virama + +# Virama (killing of inherent vowel in consonant sequence +# or consonant stacker) +# Only includes characters that can act both as visible killer viramas +# and consonant stackers. Separate property values exist for characters +# that can only act as pure killers or only as consonant stackers. + +# [Derivation: (ccc=9) - (InSC=Pure_Killer) - (InSC=Invisible_Stacker) +# - (InSC=Number_Joiner) - 2D7F] + +094D ; Virama # Mn DEVANAGARI SIGN VIRAMA +09CD ; Virama # Mn BENGALI SIGN VIRAMA +0A4D ; Virama # Mn GURMUKHI SIGN VIRAMA +0ACD ; Virama # Mn GUJARATI SIGN VIRAMA +0B4D ; Virama # Mn ORIYA SIGN VIRAMA +0BCD ; Virama # Mn TAMIL SIGN VIRAMA +0C4D ; Virama # Mn TELUGU SIGN VIRAMA +0CCD ; Virama # Mn KANNADA SIGN VIRAMA +0D4D ; Virama # Mn MALAYALAM SIGN VIRAMA +0DCA ; Virama # Mn SINHALA SIGN AL-LAKUNA +1B44 ; Virama # Mc BALINESE ADEG ADEG +A806 ; Virama # Mn SYLOTI NAGRI SIGN HASANTA +A8C4 ; Virama # Mn SAURASHTRA SIGN VIRAMA +A9C0 ; Virama # Mc JAVANESE PANGKON +11046 ; Virama # Mn BRAHMI VIRAMA +110B9 ; Virama # Mn KAITHI SIGN VIRAMA +111C0 ; Virama # Mc SHARADA SIGN VIRAMA +11235 ; Virama # Mc KHOJKI SIGN VIRAMA +1134D ; Virama # Mc GRANTHA SIGN VIRAMA +11442 ; Virama # Mn NEWA SIGN VIRAMA +114C2 ; Virama # Mn TIRHUTA SIGN VIRAMA +115BF ; Virama # Mn SIDDHAM SIGN VIRAMA +1163F ; Virama # Mn MODI SIGN VIRAMA +116B6 ; Virama # Mc TAKRI SIGN VIRAMA +11839 ; Virama # Mn DOGRA SIGN VIRAMA +119E0 ; Virama # Mn NANDINAGARI SIGN VIRAMA +11C3F ; Virama # Mn BHAIKSUKI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Pure_Killer + +# Pure killer (killing of inherent vowel in consonant sequence, +# with no consonant 
stacking behavior) + +# [Not derivable] + +0D3B..0D3C ; Pure_Killer # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0E3A ; Pure_Killer # Mn THAI CHARACTER PHINTHU +0E4E ; Pure_Killer # Mn THAI CHARACTER YAMAKKAN +0EBA ; Pure_Killer # Mn LAO SIGN PALI VIRAMA +0F84 ; Pure_Killer # Mn TIBETAN MARK HALANTA +103A ; Pure_Killer # Mn MYANMAR SIGN ASAT +1714 ; Pure_Killer # Mn TAGALOG SIGN VIRAMA +1715 ; Pure_Killer # Mc TAGALOG SIGN PAMUDPOD +1734 ; Pure_Killer # Mc HANUNOO SIGN PAMUDPOD +17D1 ; Pure_Killer # Mn KHMER SIGN VIRIAM +1A7A ; Pure_Killer # Mn TAI THAM SIGN RA HAAM +1BAA ; Pure_Killer # Mc SUNDANESE SIGN PAMAAEH +1BF2..1BF3 ; Pure_Killer # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +A82C ; Pure_Killer # Mn SYLOTI NAGRI SIGN ALTERNATE HASANTA +A953 ; Pure_Killer # Mc REJANG VIRAMA +ABED ; Pure_Killer # Mn MEETEI MAYEK APUN IYEK +11070 ; Pure_Killer # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11134 ; Pure_Killer # Mn CHAKMA MAAYYAA +112EA ; Pure_Killer # Mn KHUDAWADI SIGN VIRAMA +1172B ; Pure_Killer # Mn AHOM SIGN KILLER +1193D ; Pure_Killer # Mc DIVES AKURU SIGN HALANTA +11A34 ; Pure_Killer # Mn ZANABAZAR SQUARE SIGN VIRAMA +11D44 ; Pure_Killer # Mn MASARAM GONDI SIGN HALANTA + +# ================================================ + +# Indic_Syllabic_Category=Invisible_Stacker + +# Invisible stacker (invisible consonant stacker virama). +# +# Note that in some scripts, such as Kharoshthi and Masaram Gondi, an invisible +# stacker may have a second function, changing the shape and/or location of the +# consonant preceding it, even when there is no consonant following the +# invisible stacker. 
+ +# [Not derivable] + +1039 ; Invisible_Stacker # Mn MYANMAR SIGN VIRAMA +17D2 ; Invisible_Stacker # Mn KHMER SIGN COENG +1A60 ; Invisible_Stacker # Mn TAI THAM SIGN SAKOT +1BAB ; Invisible_Stacker # Mn SUNDANESE SIGN VIRAMA +AAF6 ; Invisible_Stacker # Mn MEETEI MAYEK VIRAMA +10A3F ; Invisible_Stacker # Mn KHAROSHTHI VIRAMA +11133 ; Invisible_Stacker # Mn CHAKMA VIRAMA +1193E ; Invisible_Stacker # Mn DIVES AKURU VIRAMA +11A47 ; Invisible_Stacker # Mn ZANABAZAR SQUARE SUBJOINER +11A99 ; Invisible_Stacker # Mn SOYOMBO SUBJOINER +11D45 ; Invisible_Stacker # Mn MASARAM GONDI VIRAMA +11D97 ; Invisible_Stacker # Mn GUNJALA GONDI VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Independent + +# Independent Vowels (contrasted with matras) + +# [Not derivable] + +0904..0914 ; Vowel_Independent # Lo [17] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER AU +0960..0961 ; Vowel_Independent # Lo [2] DEVANAGARI LETTER VOCALIC RR..DEVANAGARI LETTER VOCALIC LL +0972..0977 ; Vowel_Independent # Lo [6] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER UUE +0985..098C ; Vowel_Independent # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L +098F..0990 ; Vowel_Independent # Lo [2] BENGALI LETTER E..BENGALI LETTER AI +0993..0994 ; Vowel_Independent # Lo [2] BENGALI LETTER O..BENGALI LETTER AU +09E0..09E1 ; Vowel_Independent # Lo [2] BENGALI LETTER VOCALIC RR..BENGALI LETTER VOCALIC LL +0A05..0A0A ; Vowel_Independent # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU +0A0F..0A10 ; Vowel_Independent # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI +0A13..0A14 ; Vowel_Independent # Lo [2] GURMUKHI LETTER OO..GURMUKHI LETTER AU +0A85..0A8D ; Vowel_Independent # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E +0A8F..0A91 ; Vowel_Independent # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O +0A93..0A94 ; Vowel_Independent # Lo [2] GUJARATI LETTER O..GUJARATI LETTER AU +0AE0..0AE1 ; Vowel_Independent # Lo [2] GUJARATI LETTER VOCALIC RR..GUJARATI LETTER 
VOCALIC LL +0B05..0B0C ; Vowel_Independent # Lo [8] ORIYA LETTER A..ORIYA LETTER VOCALIC L +0B0F..0B10 ; Vowel_Independent # Lo [2] ORIYA LETTER E..ORIYA LETTER AI +0B13..0B14 ; Vowel_Independent # Lo [2] ORIYA LETTER O..ORIYA LETTER AU +0B60..0B61 ; Vowel_Independent # Lo [2] ORIYA LETTER VOCALIC RR..ORIYA LETTER VOCALIC LL +0B85..0B8A ; Vowel_Independent # Lo [6] TAMIL LETTER A..TAMIL LETTER UU +0B8E..0B90 ; Vowel_Independent # Lo [3] TAMIL LETTER E..TAMIL LETTER AI +0B92..0B94 ; Vowel_Independent # Lo [3] TAMIL LETTER O..TAMIL LETTER AU +0C05..0C0C ; Vowel_Independent # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L +0C0E..0C10 ; Vowel_Independent # Lo [3] TELUGU LETTER E..TELUGU LETTER AI +0C12..0C14 ; Vowel_Independent # Lo [3] TELUGU LETTER O..TELUGU LETTER AU +0C60..0C61 ; Vowel_Independent # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL +0C85..0C8C ; Vowel_Independent # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L +0C8E..0C90 ; Vowel_Independent # Lo [3] KANNADA LETTER E..KANNADA LETTER AI +0C92..0C94 ; Vowel_Independent # Lo [3] KANNADA LETTER O..KANNADA LETTER AU +0CE0..0CE1 ; Vowel_Independent # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL +0D05..0D0C ; Vowel_Independent # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L +0D0E..0D10 ; Vowel_Independent # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI +0D12..0D14 ; Vowel_Independent # Lo [3] MALAYALAM LETTER O..MALAYALAM LETTER AU +0D5F..0D61 ; Vowel_Independent # Lo [3] MALAYALAM LETTER ARCHAIC II..MALAYALAM LETTER VOCALIC LL +0D85..0D96 ; Vowel_Independent # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA +1021..102A ; Vowel_Independent # Lo [10] MYANMAR LETTER A..MYANMAR LETTER AU +1052..1055 ; Vowel_Independent # Lo [4] MYANMAR LETTER VOCALIC R..MYANMAR LETTER VOCALIC LL +1700..1702 ; Vowel_Independent # Lo [3] TAGALOG LETTER A..TAGALOG LETTER U +1720..1722 ; Vowel_Independent # Lo [3] HANUNOO LETTER A..HANUNOO LETTER U +1740..1742 ; Vowel_Independent # Lo 
[3] BUHID LETTER A..BUHID LETTER U +1760..1762 ; Vowel_Independent # Lo [3] TAGBANWA LETTER A..TAGBANWA LETTER U +17A3..17B3 ; Vowel_Independent # Lo [17] KHMER INDEPENDENT VOWEL QAQ..KHMER INDEPENDENT VOWEL QAU +1A4D..1A52 ; Vowel_Independent # Lo [6] TAI THAM LETTER I..TAI THAM LETTER OO +1B05..1B12 ; Vowel_Independent # Lo [14] BALINESE LETTER AKARA..BALINESE LETTER OKARA TEDUNG +1B83..1B89 ; Vowel_Independent # Lo [7] SUNDANESE LETTER A..SUNDANESE LETTER EU +1BE4..1BE5 ; Vowel_Independent # Lo [2] BATAK LETTER I..BATAK LETTER U +A800..A801 ; Vowel_Independent # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I +A803..A805 ; Vowel_Independent # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O +A882..A891 ; Vowel_Independent # Lo [16] SAURASHTRA LETTER A..SAURASHTRA LETTER AU +A8FE ; Vowel_Independent # Lo DEVANAGARI LETTER AY +A984..A988 ; Vowel_Independent # Lo [5] JAVANESE LETTER A..JAVANESE LETTER U +A98C..A98E ; Vowel_Independent # Lo [3] JAVANESE LETTER E..JAVANESE LETTER O +AA00..AA05 ; Vowel_Independent # Lo [6] CHAM LETTER A..CHAM LETTER O +AAE0..AAE1 ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER E..MEETEI MAYEK LETTER O +ABCE..ABCF ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER UN..MEETEI MAYEK LETTER I +ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA +11005..11012 ; Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU +11071..11072 ; Vowel_Independent # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER A..KAITHI LETTER AU +11103..11106 ; Vowel_Independent # Lo [4] CHAKMA LETTER AA..CHAKMA LETTER E +11183..11190 ; Vowel_Independent # Lo [14] SHARADA LETTER A..SHARADA LETTER AU +11200..11207 ; Vowel_Independent # Lo [8] KHOJKI LETTER A..KHOJKI LETTER AU +11280..11283 ; Vowel_Independent # Lo [4] MULTANI LETTER A..MULTANI LETTER E +112B0..112B9 ; Vowel_Independent # Lo [10] KHUDAWADI LETTER A..KHUDAWADI LETTER AU +11305..1130C ; Vowel_Independent # 
Lo [8] GRANTHA LETTER A..GRANTHA LETTER VOCALIC L +1130F..11310 ; Vowel_Independent # Lo [2] GRANTHA LETTER EE..GRANTHA LETTER AI +11313..11314 ; Vowel_Independent # Lo [2] GRANTHA LETTER OO..GRANTHA LETTER AU +11360..11361 ; Vowel_Independent # Lo [2] GRANTHA LETTER VOCALIC RR..GRANTHA LETTER VOCALIC LL +11400..1140D ; Vowel_Independent # Lo [14] NEWA LETTER A..NEWA LETTER AU +11481..1148E ; Vowel_Independent # Lo [14] TIRHUTA LETTER A..TIRHUTA LETTER AU +11580..1158D ; Vowel_Independent # Lo [14] SIDDHAM LETTER A..SIDDHAM LETTER AU +115D8..115DB ; Vowel_Independent # Lo [4] SIDDHAM LETTER THREE-CIRCLE ALTERNATE I..SIDDHAM LETTER ALTERNATE U +11600..1160D ; Vowel_Independent # Lo [14] MODI LETTER A..MODI LETTER AU +11680..11689 ; Vowel_Independent # Lo [10] TAKRI LETTER A..TAKRI LETTER AU +11800..11809 ; Vowel_Independent # Lo [10] DOGRA LETTER A..DOGRA LETTER AU +11900..11906 ; Vowel_Independent # Lo [7] DIVES AKURU LETTER A..DIVES AKURU LETTER E +11909 ; Vowel_Independent # Lo DIVES AKURU LETTER O +119A0..119A7 ; Vowel_Independent # Lo [8] NANDINAGARI LETTER A..NANDINAGARI LETTER VOCALIC RR +119AA..119AD ; Vowel_Independent # Lo [4] NANDINAGARI LETTER E..NANDINAGARI LETTER AU +11A00 ; Vowel_Independent # Lo ZANABAZAR SQUARE LETTER A +11A50 ; Vowel_Independent # Lo SOYOMBO LETTER A +11C00..11C08 ; Vowel_Independent # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L +11C0A..11C0D ; Vowel_Independent # Lo [4] BHAIKSUKI LETTER E..BHAIKSUKI LETTER AU +11D00..11D06 ; Vowel_Independent # Lo [7] MASARAM GONDI LETTER A..MASARAM GONDI LETTER E +11D08..11D09 ; Vowel_Independent # Lo [2] MASARAM GONDI LETTER AI..MASARAM GONDI LETTER O +11D0B ; Vowel_Independent # Lo MASARAM GONDI LETTER AU +11D60..11D65 ; Vowel_Independent # Lo [6] GUNJALA GONDI LETTER A..GUNJALA GONDI LETTER UU +11D67..11D68 ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER EE..GUNJALA GONDI LETTER AI +11D6A..11D6B ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER OO..GUNJALA GONDI LETTER AU + +# 
================================================ + +# Indic_Syllabic_Category=Vowel_Dependent + +# Dependent Vowels (contrasted with independent vowels and/or with +# complex placement). Known as matras in Indic scripts. Also +# includes vowel modifiers that follow dependent (and sometimes +# independent) vowels. + +# [Not derivable] + +093A ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN OE +093B ; Vowel_Dependent # Mc DEVANAGARI VOWEL SIGN OOE +093E..0940 ; Vowel_Dependent # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II +0941..0948 ; Vowel_Dependent # Mn [8] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN AI +0949..094C ; Vowel_Dependent # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094E..094F ; Vowel_Dependent # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA E..DEVANAGARI VOWEL SIGN AW +0955..0957 ; Vowel_Dependent # Mn [3] DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Vowel_Dependent # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BE..09C0 ; Vowel_Dependent # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II +09C1..09C4 ; Vowel_Dependent # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09C7..09C8 ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +09CB..09CC ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +09D7 ; Vowel_Dependent # Mc BENGALI AU LENGTH MARK +09E2..09E3 ; Vowel_Dependent # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3E..0A40 ; Vowel_Dependent # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II +0A41..0A42 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A47..0A48 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0ABE..0AC0 ; Vowel_Dependent # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL SIGN II +0AC1..0AC5 ; Vowel_Dependent # Mn [5] 
GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AC9 ; Vowel_Dependent # Mc GUJARATI VOWEL SIGN CANDRA O +0ACB..0ACC ; Vowel_Dependent # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0AE2..0AE3 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3E ; Vowel_Dependent # Mc ORIYA VOWEL SIGN AA +0B3F ; Vowel_Dependent # Mn ORIYA VOWEL SIGN I +0B40 ; Vowel_Dependent # Mc ORIYA VOWEL SIGN II +0B41..0B44 ; Vowel_Dependent # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B47..0B48 ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI +0B4B..0B4C ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU +0B55..0B56 ; Vowel_Dependent # Mn [2] ORIYA SIGN OVERLINE..ORIYA AI LENGTH MARK +0B57 ; Vowel_Dependent # Mc ORIYA AU LENGTH MARK +0B62..0B63 ; Vowel_Dependent # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BBE..0BBF ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC0 ; Vowel_Dependent # Mn TAMIL VOWEL SIGN II +0BC1..0BC2 ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BC6..0BC8 ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0BCA..0BCC ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0BD7 ; Vowel_Dependent # Mc TAMIL AU LENGTH MARK +0C3E..0C40 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C41..0C44 ; Vowel_Dependent # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C46..0C48 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI +0C4A..0C4C ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C55..0C56 ; Vowel_Dependent # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK +0C62..0C63 ; Vowel_Dependent # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBE ; Vowel_Dependent # Mc KANNADA VOWEL SIGN AA +0CBF ; Vowel_Dependent 
# Mn KANNADA VOWEL SIGN I +0CC0..0CC4 ; Vowel_Dependent # Mc [5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN VOCALIC RR +0CC6 ; Vowel_Dependent # Mn KANNADA VOWEL SIGN E +0CC7..0CC8 ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +0CCC ; Vowel_Dependent # Mn KANNADA VOWEL SIGN AU +0CD5..0CD6 ; Vowel_Dependent # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CE2..0CE3 ; Vowel_Dependent # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D3E..0D40 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D44 ; Vowel_Dependent # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D46..0D48 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0D4A..0D4C ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0D57 ; Vowel_Dependent # Mc MALAYALAM AU LENGTH MARK +0D62..0D63 ; Vowel_Dependent # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DCF..0DD1 ; Vowel_Dependent # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD2..0DD4 ; Vowel_Dependent # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Vowel_Dependent # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0DD8..0DDF ; Vowel_Dependent # Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Vowel_Dependent # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Vowel_Dependent # Lo THAI CHARACTER SARA A +0E31 ; Vowel_Dependent # Mn THAI CHARACTER MAI HAN-AKAT +0E32..0E33 ; Vowel_Dependent # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E34..0E39 ; Vowel_Dependent # Mn [6] THAI CHARACTER SARA I..THAI CHARACTER SARA UU +0E40..0E45 ; Vowel_Dependent # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO +0E47 ; Vowel_Dependent # Mn THAI CHARACTER MAITAIKHU 
+0EB0 ; Vowel_Dependent # Lo LAO VOWEL SIGN A +0EB1 ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KAN +0EB2..0EB3 ; Vowel_Dependent # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0EB4..0EB9 ; Vowel_Dependent # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU +0EBB ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KON +0EC0..0EC4 ; Vowel_Dependent # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +0F71..0F7D ; Vowel_Dependent # Mn [13] TIBETAN VOWEL SIGN AA..TIBETAN VOWEL SIGN OO +0F80..0F81 ; Vowel_Dependent # Mn [2] TIBETAN VOWEL SIGN REVERSED I..TIBETAN VOWEL SIGN REVERSED II +102B..102C ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +102D..1030 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN UU +1031 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN E +1032..1035 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +1056..1057 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1058..1059 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1062 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1071..1074 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1083..1084 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E +1085..1086 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109C ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN AITON A +109D ; Vowel_Dependent # Mn MYANMAR VOWEL SIGN AITON AI +1712..1713 ; Vowel_Dependent # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U +1732..1733 ; Vowel_Dependent # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1752..1753 ; Vowel_Dependent # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U +1772..1773 ; Vowel_Dependent # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U +17B6 ; 
Vowel_Dependent # Mc KHMER VOWEL SIGN AA +17B7..17BD ; Vowel_Dependent # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL SIGN UA +17BE..17C5 ; Vowel_Dependent # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU +17C8 ; Vowel_Dependent # Mc KHMER SIGN YUUKALEAPINTU +1920..1922 ; Vowel_Dependent # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U +1923..1926 ; Vowel_Dependent # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU +1927..1928 ; Vowel_Dependent # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Vowel_Dependent # Mn LIMBU SIGN KEMPHRENG +19B0..19C0 ; Vowel_Dependent # Lo [17] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN IY +1A17..1A18 ; Vowel_Dependent # Mn [2] BUGINESE VOWEL SIGN I..BUGINESE VOWEL SIGN U +1A19..1A1A ; Vowel_Dependent # Mc [2] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN O +1A1B ; Vowel_Dependent # Mn BUGINESE VOWEL SIGN AE +1A61 ; Vowel_Dependent # Mc TAI THAM VOWEL SIGN A +1A62 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN MAI SAT +1A63..1A64 ; Vowel_Dependent # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A65..1A6C ; Vowel_Dependent # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW +1A6D..1A72 ; Vowel_Dependent # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI +1A73 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN OA ABOVE +1B35 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN TEDUNG +1B36..1B3A ; Vowel_Dependent # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA +1B3B ; Vowel_Dependent # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +1B3C ; Vowel_Dependent # Mn BALINESE VOWEL SIGN LA LENGA +1B3D..1B41 ; Vowel_Dependent # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1B42 ; Vowel_Dependent # Mn BALINESE VOWEL SIGN PEPET +1B43 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN PEPET TEDUNG +1BA4..1BA5 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PANGHULU..SUNDANESE VOWEL SIGN PANYUKU +1BA6..1BA7 ; Vowel_Dependent # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL SIGN 
PANOLONG +1BA8..1BA9 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE7 ; Vowel_Dependent # Mc BATAK VOWEL SIGN E +1BE8..1BE9 ; Vowel_Dependent # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BEA..1BEC ; Vowel_Dependent # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BED ; Vowel_Dependent # Mn BATAK VOWEL SIGN KARO O +1BEE ; Vowel_Dependent # Mc BATAK VOWEL SIGN U +1BEF ; Vowel_Dependent # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +1C26..1C2B ; Vowel_Dependent # Mc [6] LEPCHA VOWEL SIGN AA..LEPCHA VOWEL SIGN UU +1C2C ; Vowel_Dependent # Mn LEPCHA VOWEL SIGN E +A802 ; Vowel_Dependent # Mn SYLOTI NAGRI SIGN DVISVARA +A823..A824 ; Vowel_Dependent # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A825..A826 ; Vowel_Dependent # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E +A827 ; Vowel_Dependent # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Vowel_Dependent # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A8FF ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN AY +A947..A94E ; Vowel_Dependent # Mn [8] REJANG VOWEL SIGN I..REJANG VOWEL SIGN EA +A9B4..A9B5 ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9B6..A9B9 ; Vowel_Dependent # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BA..A9BB ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +A9BC ; Vowel_Dependent # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Vowel_Dependent # Mn MYANMAR SIGN SHAN SAW +AA29..AA2E ; Vowel_Dependent # Mn [6] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN OE +AA2F..AA30 ; Vowel_Dependent # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA31..AA32 ; Vowel_Dependent # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE +AAB0 ; Vowel_Dependent # Mn TAI VIET MAI KANG +AAB1 ; Vowel_Dependent # Lo TAI VIET VOWEL AA +AAB2..AAB4 ; Vowel_Dependent # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U +AAB5..AAB6 ; Vowel_Dependent # Lo [2] TAI VIET VOWEL E..TAI 
VIET VOWEL O +AAB7..AAB8 ; Vowel_Dependent # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AAB9..AABD ; Vowel_Dependent # Lo [5] TAI VIET VOWEL UEA..TAI VIET VOWEL AN +AABE ; Vowel_Dependent # Mn TAI VIET VOWEL AM +AAEB ; Vowel_Dependent # Mc MEETEI MAYEK VOWEL SIGN II +AAEC..AAED ; Vowel_Dependent # Mn [2] MEETEI MAYEK VOWEL SIGN UU..MEETEI MAYEK VOWEL SIGN AAI +AAEE..AAEF ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN AU..MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE5 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN ANAP +ABE6..ABE7 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE8 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +10A01..10A03 ; Vowel_Dependent # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R +10A05..10A06 ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O +10A0C..10A0D ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN DOUBLE RING BELOW +11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +11073..11074 ; Vowel_Dependent # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +110B0..110B2 ; Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II +110B3..110B6 ; Vowel_Dependent # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI +110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +110C2 ; Vowel_Dependent # Mn KAITHI VOWEL SIGN VOCALIC R +11127..1112B ; Vowel_Dependent # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU +1112C ; Vowel_Dependent # Mc CHAKMA VOWEL SIGN E +1112D..11132 ; Vowel_Dependent # Mn [6] CHAKMA VOWEL SIGN AI..CHAKMA AU MARK +11145..11146 ; Vowel_Dependent # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +111B3..111B5 ; 
Vowel_Dependent # Mc [3] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN II +111B6..111BE ; Vowel_Dependent # Mn [9] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN O +111BF ; Vowel_Dependent # Mc SHARADA VOWEL SIGN AU +111CB..111CC ; Vowel_Dependent # Mn [2] SHARADA VOWEL MODIFIER MARK..SHARADA EXTRA SHORT VOWEL MARK +111CE ; Vowel_Dependent # Mc SHARADA VOWEL SIGN PRISHTHAMATRA E +1122C..1122E ; Vowel_Dependent # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +1122F..11231 ; Vowel_Dependent # Mn [3] KHOJKI VOWEL SIGN U..KHOJKI VOWEL SIGN AI +11232..11233 ; Vowel_Dependent # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU +112E0..112E2 ; Vowel_Dependent # Mc [3] KHUDAWADI VOWEL SIGN AA..KHUDAWADI VOWEL SIGN II +112E3..112E8 ; Vowel_Dependent # Mn [6] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN AU +1133E..1133F ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11340 ; Vowel_Dependent # Mn GRANTHA VOWEL SIGN II +11341..11344 ; Vowel_Dependent # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +11347..11348 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +1134B..1134C ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +11357 ; Vowel_Dependent # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435..11437 ; Vowel_Dependent # Mc [3] NEWA VOWEL SIGN AA..NEWA VOWEL SIGN II +11438..1143F ; Vowel_Dependent # Mn [8] NEWA VOWEL SIGN U..NEWA VOWEL SIGN AI +11440..11441 ; Vowel_Dependent # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +114B0..114B2 ; Vowel_Dependent # Mc [3] TIRHUTA VOWEL SIGN AA..TIRHUTA VOWEL SIGN II +114B3..114B8 ; Vowel_Dependent # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114B9 ; Vowel_Dependent # Mc TIRHUTA VOWEL SIGN E +114BA ; Vowel_Dependent # Mn TIRHUTA VOWEL SIGN SHORT E +114BB..114BE ; Vowel_Dependent # Mc [4] TIRHUTA VOWEL SIGN AI..TIRHUTA VOWEL SIGN AU +115AF..115B1 ; Vowel_Dependent 
# Mc [3] SIDDHAM VOWEL SIGN AA..SIDDHAM VOWEL SIGN II +115B2..115B5 ; Vowel_Dependent # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115B8..115BB ; Vowel_Dependent # Mc [4] SIDDHAM VOWEL SIGN E..SIDDHAM VOWEL SIGN AU +115DC..115DD ; Vowel_Dependent # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11630..11632 ; Vowel_Dependent # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +11633..1163A ; Vowel_Dependent # Mn [8] MODI VOWEL SIGN U..MODI VOWEL SIGN AI +1163B..1163C ; Vowel_Dependent # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +11640 ; Vowel_Dependent # Mn MODI SIGN ARDHACANDRA +116AD ; Vowel_Dependent # Mn TAKRI VOWEL SIGN AA +116AE..116AF ; Vowel_Dependent # Mc [2] TAKRI VOWEL SIGN I..TAKRI VOWEL SIGN II +116B0..116B5 ; Vowel_Dependent # Mn [6] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN AU +11720..11721 ; Vowel_Dependent # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +11722..11725 ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN I..AHOM VOWEL SIGN UU +11726 ; Vowel_Dependent # Mc AHOM VOWEL SIGN E +11727..1172A ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN AW..AHOM VOWEL SIGN AM +1182C..1182E ; Vowel_Dependent # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II +1182F..11836 ; Vowel_Dependent # Mn [8] DOGRA VOWEL SIGN U..DOGRA VOWEL SIGN AU +11930..11935 ; Vowel_Dependent # Mc [6] DIVES AKURU VOWEL SIGN AA..DIVES AKURU VOWEL SIGN E +11937..11938 ; Vowel_Dependent # Mc [2] DIVES AKURU VOWEL SIGN AI..DIVES AKURU VOWEL SIGN O +119D1..119D3 ; Vowel_Dependent # Mc [3] NANDINAGARI VOWEL SIGN AA..NANDINAGARI VOWEL SIGN II +119D4..119D7 ; Vowel_Dependent # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR +119DA..119DB ; Vowel_Dependent # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI +119DC..119DD ; Vowel_Dependent # Mc [2] NANDINAGARI VOWEL SIGN O..NANDINAGARI VOWEL SIGN AU +119E4 ; Vowel_Dependent # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E +11A01..11A0A ; Vowel_Dependent # Mn [10] ZANABAZAR SQUARE VOWEL SIGN 
I..ZANABAZAR SQUARE VOWEL LENGTH MARK +11A51..11A56 ; Vowel_Dependent # Mn [6] SOYOMBO VOWEL SIGN I..SOYOMBO VOWEL SIGN OE +11A57..11A58 ; Vowel_Dependent # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A59..11A5B ; Vowel_Dependent # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11C2F ; Vowel_Dependent # Mc BHAIKSUKI VOWEL SIGN AA +11C30..11C36 ; Vowel_Dependent # Mn [7] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN VOCALIC L +11C38..11C3B ; Vowel_Dependent # Mn [4] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI VOWEL SIGN AU +11CB0 ; Vowel_Dependent # Mn MARCHEN VOWEL SIGN AA +11CB1 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN I +11CB2..11CB3 ; Vowel_Dependent # Mn [2] MARCHEN VOWEL SIGN U..MARCHEN VOWEL SIGN E +11CB4 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN O +11D31..11D36 ; Vowel_Dependent # Mn [6] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN VOCALIC R +11D3A ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Vowel_Dependent # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN AU +11D43 ; Vowel_Dependent # Mn MASARAM GONDI SIGN CANDRA +11D8A..11D8E ; Vowel_Dependent # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D90..11D91 ; Vowel_Dependent # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI +11D93..11D94 ; Vowel_Dependent # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11EF3..11EF4 ; Vowel_Dependent # Mn [2] MAKASAR VOWEL SIGN I..MAKASAR VOWEL SIGN U +11EF5..11EF6 ; Vowel_Dependent # Mc [2] MAKASAR VOWEL SIGN E..MAKASAR VOWEL SIGN O + +# ================================================ + +# Indic_Syllabic_Category=Vowel + +# (Other) Vowels (reanalyzed as ordinary alphabetic letters or marks) + +# [Not derivable] + +1963..196D ; Vowel # Lo [11] TAI LE LETTER A..TAI LE LETTER AI +A85E..A861 ; Vowel # Lo [4] PHAGS-PA LETTER I..PHAGS-PA LETTER O +A866 ; Vowel # Lo PHAGS-PA LETTER EE +A922..A925 ; Vowel # Lo [4] 
KAYAH LI LETTER A..KAYAH LI LETTER OO +A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O +11150..11154 ; Vowel # Lo [5] MAHAJANI LETTER A..MAHAJANI LETTER O + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Placeholder + +# Consonant Placeholder +# This includes generic placeholders used for +# Indic script layout (NBSP and dotted circle), as well as a few script- +# specific vowel-holder characters which are not technically +# consonants, but serve instead as bases for placement of vowel marks. + +# [Not derivable] + +002D ; Consonant_Placeholder # Pd HYPHEN-MINUS +00A0 ; Consonant_Placeholder # Zs NO-BREAK SPACE +00D7 ; Consonant_Placeholder # Sm MULTIPLICATION SIGN +0980 ; Consonant_Placeholder # Lo BENGALI ANJI +0A72..0A73 ; Consonant_Placeholder # Lo [2] GURMUKHI IRI..GURMUKHI URA +104B ; Consonant_Placeholder # Po MYANMAR SIGN SECTION +104E ; Consonant_Placeholder # Po MYANMAR SYMBOL AFOREMENTIONED +1900 ; Consonant_Placeholder # Lo LIMBU VOWEL-CARRIER LETTER +1CFA ; Consonant_Placeholder # Lo VEDIC SIGN DOUBLE ANUSVARA ANTARGOMUKHA +2010..2014 ; Consonant_Placeholder # Pd [5] HYPHEN..EM DASH +25CC ; Consonant_Placeholder # So DOTTED CIRCLE +AA74..AA76 ; Consonant_Placeholder # Lo [3] MYANMAR LOGOGRAM KHAMTI OAY..MYANMAR LOGOGRAM KHAMTI HM +11A3F ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL HEAD MARK +11A45 ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL DOUBLE-LINED HEAD MARK +11EF2 ; Consonant_Placeholder # Lo MAKASAR ANGKA + +# ================================================ + +# Indic_Syllabic_Category=Consonant + +# Consonant (ordinary abugida consonants, with inherent vowels) + +# [Not derivable] + +0915..0939 ; Consonant # Lo [37] DEVANAGARI LETTER KA..DEVANAGARI LETTER HA +0958..095F ; Consonant # Lo [8] DEVANAGARI LETTER QA..DEVANAGARI LETTER YYA +0978..097F ; Consonant # Lo [8] DEVANAGARI LETTER MARWARI DDA..DEVANAGARI LETTER BBA +0995..09A8 ; Consonant # Lo [20] BENGALI LETTER 
KA..BENGALI LETTER NA +09AA..09B0 ; Consonant # Lo [7] BENGALI LETTER PA..BENGALI LETTER RA +09B2 ; Consonant # Lo BENGALI LETTER LA +09B6..09B9 ; Consonant # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA +09DC..09DD ; Consonant # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA +09DF ; Consonant # Lo BENGALI LETTER YYA +09F0..09F1 ; Consonant # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH LOWER DIAGONAL +0A15..0A28 ; Consonant # Lo [20] GURMUKHI LETTER KA..GURMUKHI LETTER NA +0A2A..0A30 ; Consonant # Lo [7] GURMUKHI LETTER PA..GURMUKHI LETTER RA +0A32..0A33 ; Consonant # Lo [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA +0A35..0A36 ; Consonant # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA +0A38..0A39 ; Consonant # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA +0A59..0A5C ; Consonant # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA +0A5E ; Consonant # Lo GURMUKHI LETTER FA +0A95..0AA8 ; Consonant # Lo [20] GUJARATI LETTER KA..GUJARATI LETTER NA +0AAA..0AB0 ; Consonant # Lo [7] GUJARATI LETTER PA..GUJARATI LETTER RA +0AB2..0AB3 ; Consonant # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA +0AB5..0AB9 ; Consonant # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA +0AF9 ; Consonant # Lo GUJARATI LETTER ZHA +0B15..0B28 ; Consonant # Lo [20] ORIYA LETTER KA..ORIYA LETTER NA +0B2A..0B30 ; Consonant # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA +0B32..0B33 ; Consonant # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA +0B35..0B39 ; Consonant # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA +0B5C..0B5D ; Consonant # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA +0B5F ; Consonant # Lo ORIYA LETTER YYA +0B71 ; Consonant # Lo ORIYA LETTER WA +0B95 ; Consonant # Lo TAMIL LETTER KA +0B99..0B9A ; Consonant # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA +0B9C ; Consonant # Lo TAMIL LETTER JA +0B9E..0B9F ; Consonant # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA +0BA3..0BA4 ; Consonant # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA +0BA8..0BAA ; Consonant # Lo [3] TAMIL LETTER NA..TAMIL LETTER 
PA +0BAE..0BB9 ; Consonant # Lo [12] TAMIL LETTER MA..TAMIL LETTER HA +0C15..0C28 ; Consonant # Lo [20] TELUGU LETTER KA..TELUGU LETTER NA +0C2A..0C39 ; Consonant # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C58..0C5A ; Consonant # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C95..0CA8 ; Consonant # Lo [20] KANNADA LETTER KA..KANNADA LETTER NA +0CAA..0CB3 ; Consonant # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA +0CB5..0CB9 ; Consonant # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA +0CDE ; Consonant # Lo KANNADA LETTER FA +0D15..0D3A ; Consonant # Lo [38] MALAYALAM LETTER KA..MALAYALAM LETTER TTTA +0D9A..0DB1 ; Consonant # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA +0DB3..0DBB ; Consonant # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA +0DBD ; Consonant # Lo SINHALA LETTER DANTAJA LAYANNA +0DC0..0DC6 ; Consonant # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA +0E01..0E2E ; Consonant # Lo [46] THAI CHARACTER KO KAI..THAI CHARACTER HO NOKHUK +0E81..0E82 ; Consonant # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG +0E84 ; Consonant # Lo LAO LETTER KHO TAM +0E86..0E8A ; Consonant # Lo [5] LAO LETTER PALI GHA..LAO LETTER SO TAM +0E8C..0EA3 ; Consonant # Lo [24] LAO LETTER PALI JHA..LAO LETTER LO LING +0EA5 ; Consonant # Lo LAO LETTER LO LOOT +0EA7..0EAE ; Consonant # Lo [8] LAO LETTER WO..LAO LETTER HO TAM +0EDC..0EDF ; Consonant # Lo [4] LAO HO NO..LAO LETTER KHMU NYO +0F40..0F47 ; Consonant # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA +0F49..0F6C ; Consonant # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA +1000..1020 ; Consonant # Lo [33] MYANMAR LETTER KA..MYANMAR LETTER LLA +103F ; Consonant # Lo MYANMAR LETTER GREAT SA +1050..1051 ; Consonant # Lo [2] MYANMAR LETTER SHA..MYANMAR LETTER SSA +105A..105D ; Consonant # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE +1061 ; Consonant # Lo MYANMAR LETTER SGAW KAREN SHA +1065..1066 ; Consonant # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER 
WESTERN PWO KAREN PWA +106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA +1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA +108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA +1703..1711 ; Consonant # Lo [15] TAGALOG LETTER KA..TAGALOG LETTER HA +171F ; Consonant # Lo TAGALOG LETTER ARCHAIC RA +1723..1731 ; Consonant # Lo [15] HANUNOO LETTER KA..HANUNOO LETTER HA +1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA +1763..176C ; Consonant # Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA +176E..1770 ; Consonant # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA +1780..17A2 ; Consonant # Lo [35] KHMER LETTER KA..KHMER LETTER QA +1901..191E ; Consonant # Lo [30] LIMBU LETTER KA..LIMBU LETTER TRA +1950..1962 ; Consonant # Lo [19] TAI LE LETTER KA..TAI LE LETTER NA +1980..19AB ; Consonant # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI LUE LETTER LOW SUA +1A00..1A16 ; Consonant # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA +1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA +1A53..1A54 ; Consonant # Lo [2] TAI THAM LETTER LAE..TAI THAM LETTER GREAT SA +1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA +1B45..1B4C ; Consonant # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA +1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA +1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA +1BBB..1BBD ; Consonant # Lo [3] SUNDANESE LETTER REU..SUNDANESE LETTER BHA +1BC0..1BE3 ; Consonant # Lo [36] BATAK LETTER A..BATAK LETTER MBA +1C00..1C23 ; Consonant # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A +1C4D..1C4F ; Consonant # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA +A807..A80A ; Consonant # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO +A80C..A822 ; Consonant # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO +A840..A85D ; Consonant # Lo [30] PHAGS-PA 
LETTER KA..PHAGS-PA LETTER A +A862..A865 ; Consonant # Lo [4] PHAGS-PA LETTER QA..PHAGS-PA LETTER GGA +A869..A870 ; Consonant # Lo [8] PHAGS-PA LETTER TTA..PHAGS-PA LETTER ASPIRATED FA +A872 ; Consonant # Lo PHAGS-PA SUPERFIXED LETTER RA +A892..A8B3 ; Consonant # Lo [34] SAURASHTRA LETTER KA..SAURASHTRA LETTER LLA +A90A..A921 ; Consonant # Lo [24] KAYAH LI LETTER KA..KAYAH LI LETTER CA +A930..A946 ; Consonant # Lo [23] REJANG LETTER KA..REJANG LETTER A +A989..A98B ; Consonant # Lo [3] JAVANESE LETTER PA CEREK..JAVANESE LETTER NGA LELET RASWADI +A98F..A9B2 ; Consonant # Lo [36] JAVANESE LETTER KA..JAVANESE LETTER HA +A9E0..A9E4 ; Consonant # Lo [5] MYANMAR LETTER SHAN GHA..MYANMAR LETTER SHAN BHA +A9E7..A9EF ; Consonant # Lo [9] MYANMAR LETTER TAI LAING NYA..MYANMAR LETTER TAI LAING NNA +A9FA..A9FE ; Consonant # Lo [5] MYANMAR LETTER TAI LAING LLA..MYANMAR LETTER TAI LAING BHA +AA06..AA28 ; Consonant # Lo [35] CHAM LETTER KA..CHAM LETTER HA +AA60..AA6F ; Consonant # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA +AA71..AA73 ; Consonant # Lo [3] MYANMAR LETTER KHAMTI XA..MYANMAR LETTER KHAMTI RA +AA7A ; Consonant # Lo MYANMAR LETTER AITON RA +AA7E..AA7F ; Consonant # Lo [2] MYANMAR LETTER SHWE PALAUNG CHA..MYANMAR LETTER SHWE PALAUNG SHA +AA80..AAAF ; Consonant # Lo [48] TAI VIET LETTER LOW KO..TAI VIET LETTER HIGH O +AAE2..AAEA ; Consonant # Lo [9] MEETEI MAYEK LETTER CHA..MEETEI MAYEK LETTER SSA +ABC0..ABCD ; Consonant # Lo [14] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER HUK +ABD0 ; Consonant # Lo MEETEI MAYEK LETTER PHAM +ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTER BHAM +10A00 ; Consonant # Lo KHAROSHTHI LETTER A +10A10..10A13 ; Consonant # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA +10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA +10A19..10A35 ; Consonant # Lo [29] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER VHA +11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER OLD 
TAMIL NNNA +11075 ; Consonant # Lo BRAHMI LETTER OLD TAMIL LLA +1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA +11107..11126 ; Consonant # Lo [32] CHAKMA LETTER KAA..CHAKMA LETTER HAA +11144 ; Consonant # Lo CHAKMA LETTER LHAA +11147 ; Consonant # Lo CHAKMA LETTER VAA +11155..11172 ; Consonant # Lo [30] MAHAJANI LETTER KA..MAHAJANI LETTER RRA +11191..111B2 ; Consonant # Lo [34] SHARADA LETTER KA..SHARADA LETTER HA +11208..11211 ; Consonant # Lo [10] KHOJKI LETTER KA..KHOJKI LETTER JJA +11213..1122B ; Consonant # Lo [25] KHOJKI LETTER NYA..KHOJKI LETTER LLA +11284..11286 ; Consonant # Lo [3] MULTANI LETTER KA..MULTANI LETTER GA +11288 ; Consonant # Lo MULTANI LETTER GHA +1128A..1128D ; Consonant # Lo [4] MULTANI LETTER CA..MULTANI LETTER JJA +1128F..1129D ; Consonant # Lo [15] MULTANI LETTER NYA..MULTANI LETTER BA +1129F..112A8 ; Consonant # Lo [10] MULTANI LETTER BHA..MULTANI LETTER RHA +112BA..112DE ; Consonant # Lo [37] KHUDAWADI LETTER KA..KHUDAWADI LETTER HA +11315..11328 ; Consonant # Lo [20] GRANTHA LETTER KA..GRANTHA LETTER NA +1132A..11330 ; Consonant # Lo [7] GRANTHA LETTER PA..GRANTHA LETTER RA +11332..11333 ; Consonant # Lo [2] GRANTHA LETTER LA..GRANTHA LETTER LLA +11335..11339 ; Consonant # Lo [5] GRANTHA LETTER VA..GRANTHA LETTER HA +1140E..11434 ; Consonant # Lo [39] NEWA LETTER KA..NEWA LETTER HA +1148F..114AF ; Consonant # Lo [33] TIRHUTA LETTER KA..TIRHUTA LETTER HA +1158E..115AE ; Consonant # Lo [33] SIDDHAM LETTER KA..SIDDHAM LETTER HA +1160E..1162F ; Consonant # Lo [34] MODI LETTER KA..MODI LETTER LLA +1168A..116AA ; Consonant # Lo [33] TAKRI LETTER KA..TAKRI LETTER RRA +116B8 ; Consonant # Lo TAKRI LETTER ARCHAIC KHA +11700..1171A ; Consonant # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA +11740..11746 ; Consonant # Lo [7] AHOM LETTER CA..AHOM LETTER LLA +1180A..1182B ; Consonant # Lo [34] DOGRA LETTER KA..DOGRA LETTER RRA +1190C..11913 ; Consonant # Lo [8] DIVES AKURU LETTER KA..DIVES AKURU LETTER JA +11915..11916 ; 
Consonant # Lo [2] DIVES AKURU LETTER NYA..DIVES AKURU LETTER TTA +11918..1192F ; Consonant # Lo [24] DIVES AKURU LETTER DDA..DIVES AKURU LETTER ZA +119AE..119D0 ; Consonant # Lo [35] NANDINAGARI LETTER KA..NANDINAGARI LETTER RRA +11A0B..11A32 ; Consonant # Lo [40] ZANABAZAR SQUARE LETTER KA..ZANABAZAR SQUARE LETTER KSSA +11A5C..11A83 ; Consonant # Lo [40] SOYOMBO LETTER KA..SOYOMBO LETTER KSSA +11C0E..11C2E ; Consonant # Lo [33] BHAIKSUKI LETTER KA..BHAIKSUKI LETTER HA +11C72..11C8F ; Consonant # Lo [30] MARCHEN LETTER KA..MARCHEN LETTER A +11D0C..11D30 ; Consonant # Lo [37] MASARAM GONDI LETTER KA..MASARAM GONDI LETTER TRA +11D6C..11D89 ; Consonant # Lo [30] GUNJALA GONDI LETTER YA..GUNJALA GONDI LETTER SA +11EE0..11EF1 ; Consonant # Lo [18] MAKASAR LETTER KA..MAKASAR LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Dead + +# Dead Consonant (special consonant with killed vowel) + +# [Not derivable] + +09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0C5D ; Consonant_Dead # Lo TELUGU LETTER NAKAARA POLLU +0CDD ; Consonant_Dead # Lo KANNADA LETTER NAKAARA POLLU +0D54..0D56 ; Consonant_Dead # Lo [3] MALAYALAM LETTER CHILLU M..MALAYALAM LETTER CHILLU LLL +0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K +1CF2..1CF3 ; Consonant_Dead # Lo [2] VEDIC SIGN ARDHAVISARGA..VEDIC SIGN ROTATED ARDHAVISARGA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_With_Stacker + +# Consonants that may make stacked ligatures with the next consonant +# without the use of a virama + +# [Not derivable] + +0CF1..0CF2 ; Consonant_With_Stacker # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA +1CF5..1CF6 ; Consonant_With_Stacker # Lo [2] VEDIC SIGN JIHVAMULIYA..VEDIC SIGN UPADHMANIYA +11003..11004 ; Consonant_With_Stacker # Lo [2] BRAHMI SIGN JIHVAMULIYA..BRAHMI SIGN UPADHMANIYA +11460..11461 ; Consonant_With_Stacker # Lo [2] NEWA SIGN 
JIHVAMULIYA..NEWA SIGN UPADHMANIYA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Prefixed + +# Cluster-initial consonants + +# [Not derivable] + +111C2..111C3 ; Consonant_Prefixed # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA +1193F ; Consonant_Prefixed # Lo DIVES AKURU PREFIXED NASAL SIGN +11A3A ; Consonant_Prefixed # Lo ZANABAZAR SQUARE CLUSTER-INITIAL LETTER RA +11A84..11A89 ; Consonant_Prefixed # Lo [6] SOYOMBO SIGN JIHVAMULIYA..SOYOMBO CLUSTER-INITIAL LETTER SA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Preceding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when preceding the main +# consonant. + +# [Not derivable] + +0D4E ; Consonant_Preceding_Repha # Lo MALAYALAM LETTER DOT REPH +11941 ; Consonant_Preceding_Repha # Lo DIVES AKURU INITIAL RA +11D46 ; Consonant_Preceding_Repha # Lo MASARAM GONDI REPHA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Initial_Postfixed + +# Consonants that succeed the main consonant in character sequences, but are +# pronounced before it. + +# [Not derivable] + +1A5A ; Consonant_Initial_Postfixed # Mn TAI THAM CONSONANT SIGN LOW PA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Succeeding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when succeeding the main +# consonant. + +# [Not derivable] + +17CC ; Consonant_Succeeding_Repha # Mn KHMER SIGN ROBAT + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Subjoined + +# Subjoined Consonant (C2 form subtending a base consonant in Tibetan, etc.) 
+ +# [Not derivable] + +0F8D..0F97 ; Consonant_Subjoined # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Consonant_Subjoined # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +1929..192B ; Consonant_Subjoined # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1A57 ; Consonant_Subjoined # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A5B..1A5E ; Consonant_Subjoined # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1BA1 ; Consonant_Subjoined # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA2..1BA3 ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BAC..1BAD ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C24..1C25 ; Consonant_Subjoined # Mc [2] LEPCHA SUBJOINED LETTER YA..LEPCHA SUBJOINED LETTER RA +A867..A868 ; Consonant_Subjoined # Lo [2] PHAGS-PA SUBJOINED LETTER WA..PHAGS-PA SUBJOINED LETTER YA +A871 ; Consonant_Subjoined # Lo PHAGS-PA SUBJOINED LETTER RA +11C92..11CA7 ; Consonant_Subjoined # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CA9 ; Consonant_Subjoined # Mc MARCHEN SUBJOINED LETTER YA +11CAA..11CAF ; Consonant_Subjoined # Mn [6] MARCHEN SUBJOINED LETTER RA..MARCHEN SUBJOINED LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Medial + +# Medial Consonant (medial liquid, occurring in clusters) + +# [Not derivable] + +0A75 ; Consonant_Medial # Mn GURMUKHI SIGN YAKASH +0EBC ; Consonant_Medial # Mn LAO SEMIVOWEL SIGN LO +0EBD ; Consonant_Medial # Lo LAO SEMIVOWEL SIGN NYO +103B..103C ; Consonant_Medial # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA +103D..103E ; Consonant_Medial # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +105E..1060 ; Consonant_Medial # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT 
SIGN MON MEDIAL LA +1082 ; Consonant_Medial # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +1A55 ; Consonant_Medial # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A56 ; Consonant_Medial # Mn TAI THAM CONSONANT SIGN MEDIAL LA +A8B4 ; Consonant_Medial # Mc SAURASHTRA CONSONANT SIGN HAARU +A9BD ; Consonant_Medial # Mn JAVANESE CONSONANT SIGN KERET +A9BE..A9BF ; Consonant_Medial # Mc [2] JAVANESE CONSONANT SIGN PENGKAL..JAVANESE CONSONANT SIGN CAKRA +AA33..AA34 ; Consonant_Medial # Mc [2] CHAM CONSONANT SIGN YA..CHAM CONSONANT SIGN RA +AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +1171D..1171F ; Consonant_Medial # Mn [3] AHOM CONSONANT SIGN MEDIAL LA..AHOM CONSONANT SIGN MEDIAL LIGATING RA +11940 ; Consonant_Medial # Mc DIVES AKURU MEDIAL YA +11942 ; Consonant_Medial # Mc DIVES AKURU MEDIAL RA +11A3B..11A3E ; Consonant_Medial # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11D47 ; Consonant_Medial # Mn MASARAM GONDI RA-KARA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Final + +# Final Consonant (special final forms which do not take vowels) + +# [Not derivable] + +1930..1931 ; Consonant_Final # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Consonant_Final # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +1939 ; Consonant_Final # Mn LIMBU SIGN MUKPHRENG +19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B +1A58..1A59 ; Consonant_Final # Mn [2] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN FINAL NGA +1B03 ; Consonant_Final # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Final # Mn SUNDANESE SIGN PANGLAYAR +1BBE..1BBF ; Consonant_Final # Lo [2] SUNDANESE LETTER FINAL K..SUNDANESE LETTER FINAL M +1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H +1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +A94F..A951 ; 
Consonant_Final # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A952 ; Consonant_Final # Mc REJANG CONSONANT SIGN H +A982 ; Consonant_Final # Mn JAVANESE SIGN LAYAR +AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG +AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG +AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS +AA4C ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL M +AA4D ; Consonant_Final # Mc CHAM CONSONANT SIGN FINAL H +ABDB..ABE2 ; Consonant_Final # Lo [8] MEETEI MAYEK LETTER KOK LONSUM..MEETEI MAYEK LETTER I LONSUM +11A8A..11A95 ; Consonant_Final # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Head_Letter + +# Head Letter (Tibetan) + +# [Not derivable] + +0F88..0F8C ; Consonant_Head_Letter # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN + +# ================================================ + +# Indic_Syllabic_Category=Modifying_Letter + +# Reanalyzed letters not participating in the abugida structure, but +# serving to modify the sound of an adjacent vowel or consonant. +# Note that this is not the same as General_Category=Modifier_Letter. 
+ +# [Not derivable] + +0B83 ; Modifying_Letter # Lo TAMIL SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Tone_Letter + +# Tone Letter (spacing lexical tone mark with status as a letter) + +# [Not derivable] + +1970..1974 ; Tone_Letter # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6 +AAC0 ; Tone_Letter # Lo TAI VIET TONE MAI NUENG +AAC2 ; Tone_Letter # Lo TAI VIET TONE MAI SONG + +# ================================================ + +# Indic_Syllabic_Category=Tone_Mark + +# Tone Mark (nonspacing or spacing lexical tone mark) + +# [Not derivable] + +0E48..0E4B ; Tone_Mark # Mn [4] THAI CHARACTER MAI EK..THAI CHARACTER MAI CHATTAWA +0EC8..0ECB ; Tone_Mark # Mn [4] LAO TONE MAI EK..LAO TONE MAI CATAWA +1037 ; Tone_Mark # Mn MYANMAR SIGN DOT BELOW +1063..1064 ; Tone_Mark # Mc [2] MYANMAR TONE MARK SGAW KAREN HATHI..MYANMAR TONE MARK SGAW KAREN KE PHO +1069..106D ; Tone_Mark # Mc [5] MYANMAR SIGN WESTERN PWO KAREN TONE-1..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1087..108C ; Tone_Mark # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108D ; Tone_Mark # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +108F ; Tone_Mark # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109B ; Tone_Mark # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 +19C8..19C9 ; Tone_Mark # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A75..1A79 ; Tone_Mark # Mn [5] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN TONE-5 +A92B..A92D ; Tone_Mark # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +AA7B ; Tone_Mark # Mc MYANMAR SIGN PAO KAREN TONE +AA7C ; Tone_Mark # Mn MYANMAR SIGN TAI LAING TONE-2 +AA7D ; Tone_Mark # Mc MYANMAR SIGN TAI LAING TONE-5 +AABF ; Tone_Mark # Mn TAI VIET TONE MAI EK +AAC1 ; Tone_Mark # Mn TAI VIET TONE MAI THO +ABEC ; Tone_Mark # Mc MEETEI MAYEK LUM IYEK + +# ================================================ + +# Indic_Syllabic_Category=Gemination_Mark + +# Gemination Mark (doubling of the 
preceding or following consonant) + +# [Not derivable] + +0A71 ; Gemination_Mark # Mn GURMUKHI ADDAK +11237 ; Gemination_Mark # Mn KHOJKI SIGN SHADDA +11A98 ; Gemination_Mark # Mn SOYOMBO GEMINATION MARK + +# ================================================ + +# Indic_Syllabic_Category=Cantillation_Mark + +# Cantillation Mark (recitation marks, such as svara markers for the Samaveda) + +# [Not derivable] + +0951..0952 ; Cantillation_Mark # Mn [2] DEVANAGARI STRESS SIGN UDATTA..DEVANAGARI STRESS SIGN ANUDATTA +0A51 ; Cantillation_Mark # Mn GURMUKHI SIGN UDAAT +0AFA..0AFC ; Cantillation_Mark # Mn [3] GUJARATI SIGN SUKUN..GUJARATI SIGN MADDAH +1CD0..1CD2 ; Cantillation_Mark # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CD4..1CE0 ; Cantillation_Mark # Mn [13] VEDIC SIGN YAJURVEDIC MIDLINE SVARITA..VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CE1 ; Cantillation_Mark # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF4 ; Cantillation_Mark # Mn VEDIC TONE CANDRA ABOVE +1CF7 ; Cantillation_Mark # Mc VEDIC SIGN ATIKRAMA +1CF8..1CF9 ; Cantillation_Mark # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE +20F0 ; Cantillation_Mark # Mn COMBINING ASTERISK ABOVE +A8E0..A8F1 ; Cantillation_Mark # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +1123E ; Cantillation_Mark # Mn KHOJKI SIGN SUKUN +11366..1136C ; Cantillation_Mark # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Cantillation_Mark # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA + +# ================================================ + +# Indic_Syllabic_Category=Register_Shifter + +# Register Shifter (shifts register for consonants, akin to a tone mark) + +# [Not derivable] + +17C9..17CA ; Register_Shifter # Mn [2] KHMER SIGN MUUSIKATOAN..KHMER SIGN TRIISAP + +# ================================================ + +# Indic_Syllabic_Category=Syllable_Modifier + +# Syllable Modifier (miscellaneous combining characters that 
modify +# something in the orthographic syllable they succeed) + +# [Not derivable] + +00B2..00B3 ; Syllable_Modifier # No [2] SUPERSCRIPT TWO..SUPERSCRIPT THREE +09FE ; Syllable_Modifier # Mn BENGALI SANDHI MARK +0F35 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0FC6 ; Syllable_Modifier # Mn TIBETAN SYMBOL PADMA GDAN +17CB ; Syllable_Modifier # Mn KHMER SIGN BANTOC +17CE..17D0 ; Syllable_Modifier # Mn [3] KHMER SIGN KAKABAT..KHMER SIGN SAMYOK SANNYA +17D3 ; Syllable_Modifier # Mn KHMER SIGN BATHAMASAT +17DD ; Syllable_Modifier # Mn KHMER SIGN ATTHACAN +193B ; Syllable_Modifier # Mn LIMBU SIGN SA-I +1A7B..1A7C ; Syllable_Modifier # Mn [2] TAI THAM SIGN MAI SAM..TAI THAM SIGN KHUEN-LUE KARAN +1A7F ; Syllable_Modifier # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1C36 ; Syllable_Modifier # Mn LEPCHA SIGN RAN +1DFB ; Syllable_Modifier # Mn COMBINING DELETION MARK +2074 ; Syllable_Modifier # No SUPERSCRIPT FOUR +2082..2084 ; Syllable_Modifier # No [3] SUBSCRIPT TWO..SUBSCRIPT FOUR +111C9 ; Syllable_Modifier # Mn SHARADA SANDHI MARK +1145E ; Syllable_Modifier # Mn NEWA SANDHI MARK +11A33 ; Syllable_Modifier # Mn ZANABAZAR SQUARE FINAL CONSONANT MARK + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Killer + +# Consonant Killer (signifies that the previous consonant or consonants are +# not pronounced) + +# [Not derivable] + +0E4C ; Consonant_Killer # Mn THAI CHARACTER THANTHAKHAT +17CD ; Consonant_Killer # Mn KHMER SIGN TOANDAKHIAT + +# ================================================ + +# Indic_Syllabic_Category=Non_Joiner + +# Non_Joiner (Zero Width Non-Joiner) + +# [Not derivable] + +200C ; Non_Joiner # Cf ZERO WIDTH NON-JOINER + +# ================================================ + +# Indic_Syllabic_Category=Joiner + +# Joiner (Zero Width Joiner) + +# [Not derivable] + +200D ; Joiner # Cf ZERO WIDTH JOINER + +# 
================================================ + +# Indic_Syllabic_Category=Number_Joiner + +# Number_Joiner (forms ligatures between numbers for multiplication) + +# [Not derivable] + +1107F ; Number_Joiner # Mn BRAHMI NUMBER JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number + +# Number (can be used as vowel-holders like consonant placeholders) +# Note: A number may even hold subjoined consonants which may in turn +# have been formed using a virama or a stacker, e.g. the sequence +# where THAI THAM LETTER LOW TA is subjoined to +# TAI THAM THAM DIGIT THREE using an invisible stacker. + +# [Not derivable] + +0030..0039 ; Number # Nd [10] DIGIT ZERO..DIGIT NINE +0966..096F ; Number # Nd [10] DEVANAGARI DIGIT ZERO..DEVANAGARI DIGIT NINE +09E6..09EF ; Number # Nd [10] BENGALI DIGIT ZERO..BENGALI DIGIT NINE +0A66..0A6F ; Number # Nd [10] GURMUKHI DIGIT ZERO..GURMUKHI DIGIT NINE +0AE6..0AEF ; Number # Nd [10] GUJARATI DIGIT ZERO..GUJARATI DIGIT NINE +0B66..0B6F ; Number # Nd [10] ORIYA DIGIT ZERO..ORIYA DIGIT NINE +0BE6..0BEF ; Number # Nd [10] TAMIL DIGIT ZERO..TAMIL DIGIT NINE +0C66..0C6F ; Number # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE +0CE6..0CEF ; Number # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE +0D66..0D6F ; Number # Nd [10] MALAYALAM DIGIT ZERO..MALAYALAM DIGIT NINE +0DE6..0DEF ; Number # Nd [10] SINHALA LITH DIGIT ZERO..SINHALA LITH DIGIT NINE +0E50..0E59 ; Number # Nd [10] THAI DIGIT ZERO..THAI DIGIT NINE +0ED0..0ED9 ; Number # Nd [10] LAO DIGIT ZERO..LAO DIGIT NINE +0F20..0F29 ; Number # Nd [10] TIBETAN DIGIT ZERO..TIBETAN DIGIT NINE +0F2A..0F33 ; Number # No [10] TIBETAN DIGIT HALF ONE..TIBETAN DIGIT HALF ZERO +1040..1049 ; Number # Nd [10] MYANMAR DIGIT ZERO..MYANMAR DIGIT NINE +1090..1099 ; Number # Nd [10] MYANMAR SHAN DIGIT ZERO..MYANMAR SHAN DIGIT NINE +17E0..17E9 ; Number # Nd [10] KHMER DIGIT ZERO..KHMER DIGIT NINE +1946..194F ; Number # Nd [10] LIMBU DIGIT ZERO..LIMBU DIGIT NINE 
+19D0..19D9 ; Number # Nd [10] NEW TAI LUE DIGIT ZERO..NEW TAI LUE DIGIT NINE +19DA ; Number # No NEW TAI LUE THAM DIGIT ONE +1A80..1A89 ; Number # Nd [10] TAI THAM HORA DIGIT ZERO..TAI THAM HORA DIGIT NINE +1A90..1A99 ; Number # Nd [10] TAI THAM THAM DIGIT ZERO..TAI THAM THAM DIGIT NINE +1B50..1B59 ; Number # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE +1BB0..1BB9 ; Number # Nd [10] SUNDANESE DIGIT ZERO..SUNDANESE DIGIT NINE +1C40..1C49 ; Number # Nd [10] LEPCHA DIGIT ZERO..LEPCHA DIGIT NINE +A8D0..A8D9 ; Number # Nd [10] SAURASHTRA DIGIT ZERO..SAURASHTRA DIGIT NINE +A900..A909 ; Number # Nd [10] KAYAH LI DIGIT ZERO..KAYAH LI DIGIT NINE +A9D0..A9D9 ; Number # Nd [10] JAVANESE DIGIT ZERO..JAVANESE DIGIT NINE +A9F0..A9F9 ; Number # Nd [10] MYANMAR TAI LAING DIGIT ZERO..MYANMAR TAI LAING DIGIT NINE +AA50..AA59 ; Number # Nd [10] CHAM DIGIT ZERO..CHAM DIGIT NINE +ABF0..ABF9 ; Number # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE +10A40..10A48 ; Number # No [9] KHAROSHTHI DIGIT ONE..KHAROSHTHI FRACTION ONE HALF +11066..1106F ; Number # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11136..1113F ; Number # Nd [10] CHAKMA DIGIT ZERO..CHAKMA DIGIT NINE +111D0..111D9 ; Number # Nd [10] SHARADA DIGIT ZERO..SHARADA DIGIT NINE +111E1..111F4 ; Number # No [20] SINHALA ARCHAIC DIGIT ONE..SINHALA ARCHAIC NUMBER ONE THOUSAND +112F0..112F9 ; Number # Nd [10] KHUDAWADI DIGIT ZERO..KHUDAWADI DIGIT NINE +11450..11459 ; Number # Nd [10] NEWA DIGIT ZERO..NEWA DIGIT NINE +114D0..114D9 ; Number # Nd [10] TIRHUTA DIGIT ZERO..TIRHUTA DIGIT NINE +11650..11659 ; Number # Nd [10] MODI DIGIT ZERO..MODI DIGIT NINE +116C0..116C9 ; Number # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE +11730..11739 ; Number # Nd [10] AHOM DIGIT ZERO..AHOM DIGIT NINE +1173A..1173B ; Number # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY +11950..11959 ; Number # Nd [10] DIVES AKURU DIGIT ZERO..DIVES AKURU DIGIT NINE +11C50..11C59 ; Number # Nd [10] BHAIKSUKI DIGIT ZERO..BHAIKSUKI DIGIT NINE +11C5A..11C6C 
; Number # No [19] BHAIKSUKI NUMBER ONE..BHAIKSUKI HUNDREDS UNIT MARK +11D50..11D59 ; Number # Nd [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE +11DA0..11DA9 ; Number # Nd [10] GUNJALA GONDI DIGIT ZERO..GUNJALA GONDI DIGIT NINE + +# ================================================ + +# Indic_Syllabic_Category=Brahmi_Joining_Number + +# Brahmi Joining Number (similar to Number in that in can be used as +# vowel-holders like Consonant_Placeholder, but may also be joined by +# a Number_Joiner of the same script, e.g. in Brahmi) + +# [Not derivable] + +11052..11065 ; Brahmi_Joining_Number # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND + +# EOF diff --git a/data/15.0.0-indic-positional-category.txt b/data/15.0.0-indic-positional-category.txt new file mode 100644 index 0000000..8b51a61 --- /dev/null +++ b/data/15.0.0-indic-positional-category.txt @@ -0,0 +1,808 @@ +# IndicPositionalCategory-15.0.0.txt +# Date: 2022-05-26, 02:18:00 GMT [KW, RP] +# © 2022 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use, see https://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at https://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Positional_Category enumerated property +# +# Scope: This property is aimed at the problem of +# the specification of syllabic structure for Indic scripts. +# Because dependent vowels (matras), visible viramas, and other +# characters are placed in notional slots around the consonant (or +# consonant cluster) core of an Indic syllable, there may be +# cooccurrence constraints or other interactions. Also, it may be +# desirable, in cases where more than one such character may occur in +# sequence, as for example, in a top slot and a bottom slot, to +# specify preferred orders for spelling. 
As such, this property +# is designed primarily to supplement the Indic_Syllabic_Category +# property. +# +# In addition to combining marks associated with Indic scripts, the +# Indic_Positional_Category has non-trivial values for special signs +# associated with Indic_Syllabic_Category=Consonant_Prefixed +# or Indic_Syllabic_Category=Consonant_Preceding_Repha. Those signs +# have General_Category=Lo, rather than being combining marks. +# They occur in initial position in syllabic structure. However, when +# rendered, they appear as marks positioned with respect to another +# base letter (usually above it). Hence, having an explicit value for +# Indic_Positional_Category for those signs can be helpful. +# +# Note that this property is *not* intended as +# a prescriptive property regarding display or font design, +# for a number of reasons. Good font design requires information +# that is outside the context of a character encoding standard, +# and is best handled in other venues. For Indic dependent +# vowels and similar characters, in particular: +# +# 1. Matra placement may vary somewhat based on typeface design. +# 2. Matra placement, even within a single script, may vary +# somewhat according to historic period or local conventions. +# 3. Matra placement may be changed by explicit orthographic reform +# decisions. +# 4. Matras may ligate in various ways with a consonant (or even +# other elements of a syllable) instead of occurring in a +# discrete location. +# 5. Matra display may be contextually determined. This is +# notable, for example, in the Tamil script, where the shape +# and placement of -u and -uu vowels depends strongly on +# which consonant they adjoin. 
+# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Positional_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. +# +# The scripts assessed as containing dependent vowels or similar characters +# in the structural sense used for the Indic_Positional_Category are the +# following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dives Akuru, Dogra, Grantha, Gujarati, +# Gunjala Gondi, Gurmukhi, Hanunoo, Javanese, Kaithi, Kannada, Kawi, +# Kayah Li, Kharoshthi, Khmer, Khojki, Khudawadi, Lao, Lepcha, Limbu, +# Makasar, Malayalam, Marchen, Masaram Gondi, Meetei Mayek, Modi, +# Myanmar, Nandinagari, Newa, New Tai Lue, Oriya, Rejang, Saurashtra, +# Sharada, Siddham, Sinhala, Soyombo, Sundanese, Syloti Nagri, +# Tagalog, Tagbanwa, Tai Tham, Tai Viet, Takri, Tamil, Telugu, Thai, +# Tibetan, Tirhuta, and Zanabazar Square. +# +# All characters for all other scripts not in that list +# take the default value for this property. +# +# See IndicSyllabicCategory.txt for a slightly more extended +# list of Indic scripts, including those which do not have +# positional characters. Currently, those additional +# Indic scripts without positional characters are +# Multani, Phags-pa, and Tai Le. +# +# Notes: +# +# 1. The following characters are all assigned the positional category Right, +# but may have different positions in some cases: +# * U+0BC1 TAMIL VOWEL SIGN U and U+0BC2 TAMIL VOWEL SIGN UU have +# contextually variable placement in Tamil. +# * U+0D41 MALAYALAM VOWEL SIGN U and U+0D42 MALAYALAM VOWEL SIGN UU form +# complex ligatures with consonants in older Malayalam orthography. 
+# * U+11341 GRANTHA VOWEL SIGN U and U+11342 GRANTHA VOWEL SIGN UU have +# contextually variable placement in Grantha. +# * U+11440 NEWA VOWEL SIGN O and U+11441 NEWA VOWEL SIGN AU have contextually +# variable placement in Newa. +# +# 2. The following characters are all assigned the positional category Top, +# but may have different positions in some cases: +# * U+1143E NEWA VOWEL SIGN E and U+1143F NEWA VOWEL SIGN AI have contextually +# variable placement in Newa. +# +# 3. The following characters are all assigned the positional category Bottom, +# but may have different positions in some cases: +# * U+102F MYANMAR VOWEL SIGN U and U+1030 MYANMAR VOWEL SIGN UU have +# contextually variable placement in Myanmar. +# * U+1A69 TAI THAM VOWEL SIGN U and U+1A6A TAI THAM VOWEL SIGN UU have +# contextually variable placement in Tai Tham. +# +# 4. The following character is assigned the positional category Left, but +# may have different positions in different styles: +# * U+119D2 NANDINAGARI VOWEL SIGN I has stylistically variable placement +# in Nandinagari. + + +# ================================================ + +# Property: Indic_Positional_Category +# +# All code points not explicitly listed for Indic_Positional_Category +# have the value NA (not applicable). 
+# +# @missing: 0000..10FFFF; NA + +# ------------------------------------------------ + +# Indic_Positional_Category=Right + +0903 ; Right # Mc DEVANAGARI SIGN VISARGA +093B ; Right # Mc DEVANAGARI VOWEL SIGN OOE +093E ; Right # Mc DEVANAGARI VOWEL SIGN AA +0940 ; Right # Mc DEVANAGARI VOWEL SIGN II +0949..094C ; Right # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094F ; Right # Mc DEVANAGARI VOWEL SIGN AW +0982..0983 ; Right # Mc [2] BENGALI SIGN ANUSVARA..BENGALI SIGN VISARGA +09BE ; Right # Mc BENGALI VOWEL SIGN AA +09C0 ; Right # Mc BENGALI VOWEL SIGN II +09D7 ; Right # Mc BENGALI AU LENGTH MARK +0A03 ; Right # Mc GURMUKHI SIGN VISARGA +0A3E ; Right # Mc GURMUKHI VOWEL SIGN AA +0A40 ; Right # Mc GURMUKHI VOWEL SIGN II +0A83 ; Right # Mc GUJARATI SIGN VISARGA +0ABE ; Right # Mc GUJARATI VOWEL SIGN AA +0AC0 ; Right # Mc GUJARATI VOWEL SIGN II +0ACB..0ACC ; Right # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0B02..0B03 ; Right # Mc [2] ORIYA SIGN ANUSVARA..ORIYA SIGN VISARGA +0B3E ; Right # Mc ORIYA VOWEL SIGN AA +0B40 ; Right # Mc ORIYA VOWEL SIGN II +0BBE..0BBF ; Right # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC1..0BC2 ; Right # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BD7 ; Right # Mc TAMIL AU LENGTH MARK +0C01..0C03 ; Right # Mc [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN VISARGA +0C41..0C44 ; Right # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C82..0C83 ; Right # Mc [2] KANNADA SIGN ANUSVARA..KANNADA SIGN VISARGA +0CBE ; Right # Mc KANNADA VOWEL SIGN AA +0CC1..0CC4 ; Right # Mc [4] KANNADA VOWEL SIGN U..KANNADA VOWEL SIGN VOCALIC RR +0CD5..0CD6 ; Right # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CF3 ; Right # Mc KANNADA SIGN COMBINING ANUSVARA ABOVE RIGHT +0D02..0D03 ; Right # Mc [2] MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA +0D3E..0D40 ; Right # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D42 ; Right # Mn [2] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN UU 
+0D57 ; Right # Mc MALAYALAM AU LENGTH MARK +0D82..0D83 ; Right # Mc [2] SINHALA SIGN ANUSVARAYA..SINHALA SIGN VISARGAYA +0DCF..0DD1 ; Right # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD8 ; Right # Mc SINHALA VOWEL SIGN GAETTA-PILLA +0DDF ; Right # Mc SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Right # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Right # Lo THAI CHARACTER SARA A +0E32..0E33 ; Right # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E45 ; Right # Lo THAI CHARACTER LAKKHANGYAO +0EB0 ; Right # Lo LAO VOWEL SIGN A +0EB2..0EB3 ; Right # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0F3E ; Right # Mc TIBETAN SIGN YAR TSHES +0F7F ; Right # Mc TIBETAN SIGN RNAM BCAD +102B..102C ; Right # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +1038 ; Right # Mc MYANMAR SIGN VISARGA +103B ; Right # Mc MYANMAR CONSONANT SIGN MEDIAL YA +1056..1057 ; Right # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1062..1064 ; Right # Mc [3] MYANMAR VOWEL SIGN SGAW KAREN EU..MYANMAR TONE MARK SGAW KAREN KE PHO +1067..106D ; Right # Mc [7] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1083 ; Right # Mc MYANMAR VOWEL SIGN SHAN AA +1087..108C ; Right # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108F ; Right # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109C ; Right # Mc [3] MYANMAR SIGN KHAMTI TONE-1..MYANMAR VOWEL SIGN AITON A +1715 ; Right # Mc TAGALOG SIGN PAMUDPOD +1734 ; Right # Mc HANUNOO SIGN PAMUDPOD +17B6 ; Right # Mc KHMER VOWEL SIGN AA +17C7..17C8 ; Right # Mc [2] KHMER SIGN REAHMUK..KHMER SIGN YUUKALEAPINTU +1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI +1929..192B ; Right # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1930..1931 ; Right # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Right # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER 
LA +19B0..19B4 ; Right # Lo [5] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN UU +19B8..19B9 ; Right # Lo [2] NEW TAI LUE VOWEL SIGN OA..NEW TAI LUE VOWEL SIGN UE +19BB..19C0 ; Right # Lo [6] NEW TAI LUE VOWEL SIGN AAY..NEW TAI LUE VOWEL SIGN IY +19C8..19C9 ; Right # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A1A ; Right # Mc BUGINESE VOWEL SIGN O +1A57 ; Right # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A61 ; Right # Mc TAI THAM VOWEL SIGN A +1A63..1A64 ; Right # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A6D ; Right # Mc TAI THAM VOWEL SIGN OY +1B04 ; Right # Mc BALINESE SIGN BISAH +1B35 ; Right # Mc BALINESE VOWEL SIGN TEDUNG +1B44 ; Right # Mc BALINESE ADEG ADEG +1B82 ; Right # Mc SUNDANESE SIGN PANGWISAD +1BA1 ; Right # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA7 ; Right # Mc SUNDANESE VOWEL SIGN PANOLONG +1BAA ; Right # Mc SUNDANESE SIGN PAMAAEH +1BE7 ; Right # Mc BATAK VOWEL SIGN E +1BEA..1BEC ; Right # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BEE ; Right # Mc BATAK VOWEL SIGN U +1BF2..1BF3 ; Right # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +1C24..1C26 ; Right # Mc [3] LEPCHA SUBJOINED LETTER YA..LEPCHA VOWEL SIGN AA +1C2A..1C2B ; Right # Mc [2] LEPCHA VOWEL SIGN U..LEPCHA VOWEL SIGN UU +1CE1 ; Right # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF7 ; Right # Mc VEDIC SIGN ATIKRAMA +A823..A824 ; Right # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A827 ; Right # Mc SYLOTI NAGRI VOWEL SIGN OO +A880..A881 ; Right # Mc [2] SAURASHTRA SIGN ANUSVARA..SAURASHTRA SIGN VISARGA +A8B4..A8C3 ; Right # Mc [16] SAURASHTRA CONSONANT SIGN HAARU..SAURASHTRA VOWEL SIGN AU +A952..A953 ; Right # Mc [2] REJANG CONSONANT SIGN H..REJANG VIRAMA +A983 ; Right # Mc JAVANESE SIGN WIGNYAN +A9B4..A9B5 ; Right # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +AA33 ; Right # Mc CHAM CONSONANT SIGN YA +AA4D ; Right # Mc CHAM CONSONANT SIGN FINAL H +AA7B ; Right # Mc MYANMAR SIGN PAO KAREN TONE +AA7D 
; Right # Mc MYANMAR SIGN TAI LAING TONE-5 +AAB1 ; Right # Lo TAI VIET VOWEL AA +AABA ; Right # Lo TAI VIET VOWEL UA +AABD ; Right # Lo TAI VIET VOWEL AN +AAEF ; Right # Mc MEETEI MAYEK VOWEL SIGN AAU +AAF5 ; Right # Mc MEETEI MAYEK VOWEL SIGN VISARGA +ABE3..ABE4 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE6..ABE7 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE9..ABEA ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +ABEC ; Right # Mc MEETEI MAYEK LUM IYEK +11000 ; Right # Mc BRAHMI SIGN CANDRABINDU +11002 ; Right # Mc BRAHMI SIGN VISARGA +11082 ; Right # Mc KAITHI SIGN VISARGA +110B0 ; Right # Mc KAITHI VOWEL SIGN AA +110B2 ; Right # Mc KAITHI VOWEL SIGN II +110B7..110B8 ; Right # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11145..11146 ; Right # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +11182 ; Right # Mc SHARADA SIGN VISARGA +111B3 ; Right # Mc SHARADA VOWEL SIGN AA +111B5 ; Right # Mc SHARADA VOWEL SIGN II +111C0 ; Right # Mc SHARADA SIGN VIRAMA +1122C..1122E ; Right # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +11235 ; Right # Mc KHOJKI SIGN VIRAMA +112E0 ; Right # Mc KHUDAWADI VOWEL SIGN AA +112E2 ; Right # Mc KHUDAWADI VOWEL SIGN II +11302..11303 ; Right # Mc [2] GRANTHA SIGN ANUSVARA..GRANTHA SIGN VISARGA +1133E..1133F ; Right # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11341..11344 ; Right # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +1134D ; Right # Mc GRANTHA SIGN VIRAMA +11357 ; Right # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Right # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435 ; Right # Mc NEWA VOWEL SIGN AA +11437 ; Right # Mc NEWA VOWEL SIGN II +11440..11441 ; Right # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +11445 ; Right # Mc NEWA SIGN VISARGA +114B0 ; Right # Mc TIRHUTA VOWEL SIGN AA +114B2 ; Right # Mc TIRHUTA VOWEL SIGN II +114BD ; Right # Mc TIRHUTA VOWEL SIGN 
SHORT O +114C1 ; Right # Mc TIRHUTA SIGN VISARGA +115AF ; Right # Mc SIDDHAM VOWEL SIGN AA +115B1 ; Right # Mc SIDDHAM VOWEL SIGN II +115BE ; Right # Mc SIDDHAM SIGN VISARGA +11630..11632 ; Right # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +1163B..1163C ; Right # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +1163E ; Right # Mc MODI SIGN VISARGA +116AC ; Right # Mc TAKRI SIGN VISARGA +116AF ; Right # Mc TAKRI VOWEL SIGN II +116B6 ; Right # Mc TAKRI SIGN VIRAMA +11720..11721 ; Right # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +1182C ; Right # Mc DOGRA VOWEL SIGN AA +1182E ; Right # Mc DOGRA VOWEL SIGN II +11838 ; Right # Mc DOGRA SIGN VISARGA +11930..11934 ; Right # Mc [5] DIVES AKURU VOWEL SIGN AA..DIVES AKURU VOWEL SIGN UU +1193D ; Right # Mc DIVES AKURU SIGN HALANTA +11940 ; Right # Mc DIVES AKURU MEDIAL YA +119D1 ; Right # Mc NANDINAGARI VOWEL SIGN AA +119D3 ; Right # Mc NANDINAGARI VOWEL SIGN II +119DC..119DF ; Right # Mc [4] NANDINAGARI VOWEL SIGN O..NANDINAGARI SIGN VISARGA +11A39 ; Right # Mc ZANABAZAR SQUARE SIGN VISARGA +11A57..11A58 ; Right # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A97 ; Right # Mc SOYOMBO SIGN VISARGA +11C2F ; Right # Mc BHAIKSUKI VOWEL SIGN AA +11C3E ; Right # Mc BHAIKSUKI SIGN VISARGA +11CA9 ; Right # Mc MARCHEN SUBJOINED LETTER YA +11CB4 ; Right # Mc MARCHEN VOWEL SIGN O +11D46 ; Right # Lo MASARAM GONDI REPHA +11D8A..11D8E ; Right # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D93..11D94 ; Right # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11D96 ; Right # Mc GUNJALA GONDI SIGN VISARGA +11EF6 ; Right # Mc MAKASAR VOWEL SIGN O +11F03 ; Right # Mc KAWI SIGN VISARGA +11F34..11F35 ; Right # Mc [2] KAWI VOWEL SIGN AA..KAWI VOWEL SIGN ALTERNATE AA +11F41 ; Right # Mc KAWI SIGN KILLER + +# Indic_Positional_Category=Left + +093F ; Left # Mc DEVANAGARI VOWEL SIGN I +094E ; Left # Mc DEVANAGARI VOWEL SIGN PRISHTHAMATRA E +09BF ; Left # Mc BENGALI VOWEL SIGN I +09C7..09C8 ; Left # 
Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +0A3F ; Left # Mc GURMUKHI VOWEL SIGN I +0ABF ; Left # Mc GUJARATI VOWEL SIGN I +0B47 ; Left # Mc ORIYA VOWEL SIGN E +0BC6..0BC8 ; Left # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0D46..0D48 ; Left # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0DD9 ; Left # Mc SINHALA VOWEL SIGN KOMBUVA +0DDB ; Left # Mc SINHALA VOWEL SIGN KOMBU DEKA +0F3F ; Left # Mc TIBETAN SIGN MAR TSHES +1031 ; Left # Mc MYANMAR VOWEL SIGN E +1084 ; Left # Mc MYANMAR VOWEL SIGN SHAN E +17C1..17C3 ; Left # Mc [3] KHMER VOWEL SIGN E..KHMER VOWEL SIGN AI +1A19 ; Left # Mc BUGINESE VOWEL SIGN E +1A55 ; Left # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A6E..1A72 ; Left # Mc [5] TAI THAM VOWEL SIGN E..TAI THAM VOWEL SIGN THAM AI +1B3E..1B3F ; Left # Mc [2] BALINESE VOWEL SIGN TALING..BALINESE VOWEL SIGN TALING REPA +1BA6 ; Left # Mc SUNDANESE VOWEL SIGN PANAELAENG +1C27..1C28 ; Left # Mc [2] LEPCHA VOWEL SIGN I..LEPCHA VOWEL SIGN O +1C34..1C35 ; Left # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A9BA..A9BB ; Left # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +AA2F..AA30 ; Left # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA34 ; Left # Mc CHAM CONSONANT SIGN RA +AAEB ; Left # Mc MEETEI MAYEK VOWEL SIGN II +AAEE ; Left # Mc MEETEI MAYEK VOWEL SIGN AU +110B1 ; Left # Mc KAITHI VOWEL SIGN I +1112C ; Left # Mc CHAKMA VOWEL SIGN E +111B4 ; Left # Mc SHARADA VOWEL SIGN I +111CE ; Left # Mc SHARADA VOWEL SIGN PRISHTHAMATRA E +112E1 ; Left # Mc KHUDAWADI VOWEL SIGN I +11347..11348 ; Left # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +11436 ; Left # Mc NEWA VOWEL SIGN I +114B1 ; Left # Mc TIRHUTA VOWEL SIGN I +114B9 ; Left # Mc TIRHUTA VOWEL SIGN E +115B0 ; Left # Mc SIDDHAM VOWEL SIGN I +115B8 ; Left # Mc SIDDHAM VOWEL SIGN E +116AE ; Left # Mc TAKRI VOWEL SIGN I +11726 ; Left # Mc AHOM VOWEL SIGN E +1182D ; Left # Mc DOGRA VOWEL SIGN I +11935 ; Left # Mc DIVES AKURU VOWEL SIGN E +11937 ; 
Left # Mc DIVES AKURU VOWEL SIGN AI +119D2 ; Left # Mc NANDINAGARI VOWEL SIGN I +119E4 ; Left # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E +11CB1 ; Left # Mc MARCHEN VOWEL SIGN I +11EF5 ; Left # Mc MAKASAR VOWEL SIGN E +11F3E..11F3F ; Left # Mc [2] KAWI VOWEL SIGN E..KAWI VOWEL SIGN AI + +# Indic_Positional_Category=Visual_Order_Left + +# These are dependent vowels that occur to the left of the consonant +# letter in a syllable, but which occur in scripts using the visual order +# model, instead of the logical order model. Because of the different +# model, these left-side vowels occur first in the backing store (before +# the consonant letter) and are not reordered during text rendering. +# +# [Derivation: Logical_Order_Exception=Yes] + +0E40..0E44 ; Visual_Order_Left # Lo [5] THAI CHARACTER SARA E..THAI CHARACTER SARA AI MAIMALAI +0EC0..0EC4 ; Visual_Order_Left # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +19B5..19B7 ; Visual_Order_Left # Lo [3] NEW TAI LUE VOWEL SIGN E..NEW TAI LUE VOWEL SIGN O +19BA ; Visual_Order_Left # Lo NEW TAI LUE VOWEL SIGN AY +AAB5..AAB6 ; Visual_Order_Left # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB9 ; Visual_Order_Left # Lo TAI VIET VOWEL UEA +AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL AY + +# Indic_Positional_Category=Left_And_Right + +09CB..09CC ; Left_And_Right # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +0B4B ; Left_And_Right # Mc ORIYA VOWEL SIGN O +0BCA..0BCC ; Left_And_Right # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0D4A..0D4C ; Left_And_Right # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0DDC ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA +0DDE ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA +17C0 ; Left_And_Right # Mc KHMER VOWEL SIGN IE +17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU +1B40..1B41 ; Left_And_Right # Mc [2] BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG 
+1134B..1134C ; Left_And_Right # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +114BC ; Left_And_Right # Mc TIRHUTA VOWEL SIGN O +114BE ; Left_And_Right # Mc TIRHUTA VOWEL SIGN AU +115BA ; Left_And_Right # Mc SIDDHAM VOWEL SIGN O +11938 ; Left_And_Right # Mc DIVES AKURU VOWEL SIGN O + +# Indic_Positional_Category=Top + +0900..0902 ; Top # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +093A ; Top # Mn DEVANAGARI VOWEL SIGN OE +0945..0948 ; Top # Mn [4] DEVANAGARI VOWEL SIGN CANDRA E..DEVANAGARI VOWEL SIGN AI +0951 ; Top # Mn DEVANAGARI STRESS SIGN UDATTA +0955 ; Top # Mn DEVANAGARI VOWEL SIGN CANDRA LONG E +0981 ; Top # Mn BENGALI SIGN CANDRABINDU +09FE ; Top # Mn BENGALI SANDHI MARK +0A01..0A02 ; Top # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A47..0A48 ; Top # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Top # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0A70..0A71 ; Top # Mn [2] GURMUKHI TIPPI..GURMUKHI ADDAK +0A81..0A82 ; Top # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0AC5 ; Top # Mn GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Top # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AFA..0AFF ; Top # Mn [6] GUJARATI SIGN SUKUN..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B01 ; Top # Mn ORIYA SIGN CANDRABINDU +0B3F ; Top # Mn ORIYA VOWEL SIGN I +0B55..0B56 ; Top # Mn [2] ORIYA SIGN OVERLINE..ORIYA AI LENGTH MARK +0B82 ; Top # Mn TAMIL SIGN ANUSVARA +0BC0 ; Top # Mn TAMIL VOWEL SIGN II +0BCD ; Top # Mn TAMIL SIGN VIRAMA +0C00 ; Top # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C04 ; Top # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C3E..0C40 ; Top # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C46..0C47 ; Top # Mn [2] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN EE +0C4A..0C4D ; Top # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA +0C55 ; Top # Mn TELUGU LENGTH MARK +0C81 ; Top # Mn KANNADA SIGN CANDRABINDU +0CBF ; Top # Mn KANNADA VOWEL SIGN I +0CC6 ; Top # Mn KANNADA VOWEL 
SIGN E +0CCC..0CCD ; Top # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA +0D00..0D01 ; Top # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D3B..0D3C ; Top # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0D4D ; Top # Mn MALAYALAM SIGN VIRAMA +0D4E ; Top # Lo MALAYALAM LETTER DOT REPH +0D81 ; Top # Mn SINHALA SIGN CANDRABINDU +0DCA ; Top # Mn SINHALA SIGN AL-LAKUNA +0DD2..0DD3 ; Top # Mn [2] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN DIGA IS-PILLA +0E31 ; Top # Mn THAI CHARACTER MAI HAN-AKAT +0E34..0E37 ; Top # Mn [4] THAI CHARACTER SARA I..THAI CHARACTER SARA UEE +0E47..0E4E ; Top # Mn [8] THAI CHARACTER MAITAIKHU..THAI CHARACTER YAMAKKAN +0EB1 ; Top # Mn LAO VOWEL SIGN MAI KAN +0EB4..0EB7 ; Top # Mn [4] LAO VOWEL SIGN I..LAO VOWEL SIGN YY +0EBB ; Top # Mn LAO VOWEL SIGN MAI KON +0EC8..0ECE ; Top # Mn [7] LAO TONE MAI EK..LAO YAMAKKAN +0F39 ; Top # Mn TIBETAN MARK TSA -PHRU +0F72 ; Top # Mn TIBETAN VOWEL SIGN I +0F7A..0F7E ; Top # Mn [5] TIBETAN VOWEL SIGN E..TIBETAN SIGN RJES SU NGA RO +0F80 ; Top # Mn TIBETAN VOWEL SIGN REVERSED I +0F82..0F83 ; Top # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +0F86..0F87 ; Top # Mn [2] TIBETAN SIGN LCI RTAGS..TIBETAN SIGN YANG RTAGS +102D..102E ; Top # Mn [2] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN II +1032..1036 ; Top # Mn [5] MYANMAR VOWEL SIGN AI..MYANMAR SIGN ANUSVARA +103A ; Top # Mn MYANMAR SIGN ASAT +1071..1074 ; Top # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1085..1086 ; Top # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109D ; Top # Mn MYANMAR VOWEL SIGN AITON AI +1712 ; Top # Mn TAGALOG VOWEL SIGN I +1732 ; Top # Mn HANUNOO VOWEL SIGN I +1752 ; Top # Mn BUHID VOWEL SIGN I +1772 ; Top # Mn TAGBANWA VOWEL SIGN I +17B7..17BA ; Top # Mn [4] KHMER VOWEL SIGN I..KHMER VOWEL SIGN YY +17C6 ; Top # Mn KHMER SIGN NIKAHIT +17C9..17D1 ; Top # Mn [9] KHMER SIGN MUUSIKATOAN..KHMER SIGN 
VIRIAM +17D3 ; Top # Mn KHMER SIGN BATHAMASAT +17DD ; Top # Mn KHMER SIGN ATTHACAN +1920..1921 ; Top # Mn [2] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN I +1927..1928 ; Top # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Top # Mn LIMBU SIGN KEMPHRENG +1A17 ; Top # Mn BUGINESE VOWEL SIGN I +1A1B ; Top # Mn BUGINESE VOWEL SIGN AE +1A58..1A5A ; Top # Mn [3] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN LOW PA +1A62 ; Top # Mn TAI THAM VOWEL SIGN MAI SAT +1A65..1A68 ; Top # Mn [4] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN UUE +1A6B ; Top # Mn TAI THAM VOWEL SIGN O +1A73..1A7C ; Top # Mn [10] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN KHUEN-LUE KARAN +1B00..1B03 ; Top # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG +1B34 ; Top # Mn BALINESE SIGN REREKAN +1B36..1B37 ; Top # Mn [2] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN ULU SARI +1B42 ; Top # Mn BALINESE VOWEL SIGN PEPET +1B6B ; Top # Mn BALINESE MUSICAL SYMBOL COMBINING TEGEH +1B6D..1B73 ; Top # Mn [7] BALINESE MUSICAL SYMBOL COMBINING KEMPUL..BALINESE MUSICAL SYMBOL COMBINING GONG +1B80..1B81 ; Top # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR +1BA4 ; Top # Mn SUNDANESE VOWEL SIGN PANGHULU +1BA8..1BA9 ; Top # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE6 ; Top # Mn BATAK SIGN TOMPI +1BE8..1BE9 ; Top # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BED ; Top # Mn BATAK VOWEL SIGN KARO O +1BEF..1BF1 ; Top # Mn [3] BATAK VOWEL SIGN U FOR SIMALUNGUN SA..BATAK CONSONANT SIGN H +1C2D..1C33 ; Top # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +1C36 ; Top # Mn LEPCHA SIGN RAN +1CD0..1CD2 ; Top # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CDA..1CDB ; Top # Mn [2] VEDIC TONE DOUBLE SVARITA..VEDIC TONE TRIPLE SVARITA +1CE0 ; Top # Mn VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CF4 ; Top # Mn VEDIC TONE CANDRA ABOVE +1DFB ; Top # Mn COMBINING DELETION MARK +20F0 ; Top # Mn COMBINING ASTERISK ABOVE +A802 ; Top # Mn SYLOTI NAGRI SIGN 
DVISVARA +A806 ; Top # Mn SYLOTI NAGRI SIGN HASANTA +A80B ; Top # Mn SYLOTI NAGRI SIGN ANUSVARA +A826 ; Top # Mn SYLOTI NAGRI VOWEL SIGN E +A8C5 ; Top # Mn SAURASHTRA SIGN CANDRABINDU +A8E0..A8F1 ; Top # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +A8FF ; Top # Mn DEVANAGARI VOWEL SIGN AY +A926..A92A ; Top # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O +A94A ; Top # Mn REJANG VOWEL SIGN AI +A94F..A951 ; Top # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A980..A982 ; Top # Mn [3] JAVANESE SIGN PANYANGGA..JAVANESE SIGN LAYAR +A9B3 ; Top # Mn JAVANESE SIGN CECAK TELU +A9B6..A9B7 ; Top # Mn [2] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN WULU MELIK +A9BC ; Top # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Top # Mn MYANMAR SIGN SHAN SAW +AA29..AA2C ; Top # Mn [4] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN EI +AA2E ; Top # Mn CHAM VOWEL SIGN OE +AA31 ; Top # Mn CHAM VOWEL SIGN AU +AA43 ; Top # Mn CHAM CONSONANT SIGN FINAL NG +AA4C ; Top # Mn CHAM CONSONANT SIGN FINAL M +AA7C ; Top # Mn MYANMAR SIGN TAI LAING TONE-2 +AAB0 ; Top # Mn TAI VIET MAI KANG +AAB2..AAB3 ; Top # Mn [2] TAI VIET VOWEL I..TAI VIET VOWEL UE +AAB7..AAB8 ; Top # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AABE..AABF ; Top # Mn [2] TAI VIET VOWEL AM..TAI VIET TONE MAI EK +AAC1 ; Top # Mn TAI VIET TONE MAI THO +AAED ; Top # Mn MEETEI MAYEK VOWEL SIGN AAI +ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP +10A05 ; Top # Mn KHAROSHTHI VOWEL SIGN E +10A0F ; Top # Mn KHAROSHTHI SIGN VISARGA +10A38 ; Top # Mn KHAROSHTHI SIGN BAR ABOVE +11001 ; Top # Mn BRAHMI SIGN ANUSVARA +11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II +11042..11046 ; Top # Mn [5] BRAHMI VOWEL SIGN E..BRAHMI VIRAMA +11070 ; Top # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11073..11074 ; Top # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +11080..11081 ; Top # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI 
VOWEL SIGN AI +11100..11102 ; Top # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA +11127..11129 ; Top # Mn [3] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN II +1112D ; Top # Mn CHAKMA VOWEL SIGN AI +11130 ; Top # Mn CHAKMA VOWEL SIGN OI +11134 ; Top # Mn CHAKMA MAAYYAA +11180..11181 ; Top # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +111BC..111BE ; Top # Mn [3] SHARADA VOWEL SIGN E..SHARADA VOWEL SIGN O +111C2..111C3 ; Top # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA +111CB ; Top # Mn SHARADA VOWEL MODIFIER MARK +111CF ; Top # Mn SHARADA SIGN INVERTED CANDRABINDU +11230..11231 ; Top # Mn [2] KHOJKI VOWEL SIGN E..KHOJKI VOWEL SIGN AI +11234 ; Top # Mn KHOJKI SIGN ANUSVARA +11236..11237 ; Top # Mn [2] KHOJKI SIGN NUKTA..KHOJKI SIGN SHADDA +1123E ; Top # Mn KHOJKI SIGN SUKUN +112DF ; Top # Mn KHUDAWADI SIGN ANUSVARA +112E5..112E8 ; Top # Mn [4] KHUDAWADI VOWEL SIGN E..KHUDAWADI VOWEL SIGN AU +11300..11301 ; Top # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11340 ; Top # Mn GRANTHA VOWEL SIGN II +11366..1136C ; Top # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Top # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA +1143E..1143F ; Top # Mn [2] NEWA VOWEL SIGN E..NEWA VOWEL SIGN AI +11443..11444 ; Top # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +1145E ; Top # Mn NEWA SANDHI MARK +114BA ; Top # Mn TIRHUTA VOWEL SIGN SHORT E +114BF..114C0 ; Top # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Top # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +11639..1163A ; Top # Mn [2] MODI VOWEL SIGN E..MODI VOWEL SIGN AI +1163D ; Top # Mn MODI SIGN ANUSVARA +11640 ; Top # Mn MODI SIGN ARDHACANDRA +116AB ; Top # Mn TAKRI SIGN ANUSVARA +116AD ; Top # Mn TAKRI VOWEL SIGN AA +116B2..116B5 ; Top # Mn [4] TAKRI VOWEL SIGN E..TAKRI VOWEL SIGN AU +1171F ; Top # Mn AHOM CONSONANT SIGN MEDIAL LIGATING RA +11722..11723 ; Top # Mn [2] AHOM VOWEL SIGN 
I..AHOM VOWEL SIGN II +11727 ; Top # Mn AHOM VOWEL SIGN AW +11729..1172B ; Top # Mn [3] AHOM VOWEL SIGN AI..AHOM SIGN KILLER +11833..11837 ; Top # Mn [5] DOGRA VOWEL SIGN E..DOGRA SIGN ANUSVARA +1193B..1193C ; Top # Mn [2] DIVES AKURU SIGN ANUSVARA..DIVES AKURU SIGN CANDRABINDU +1193F ; Top # Lo DIVES AKURU PREFIXED NASAL SIGN +11941 ; Top # Lo DIVES AKURU INITIAL RA +119DA..119DB ; Top # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI +11A01 ; Top # Mn ZANABAZAR SQUARE VOWEL SIGN I +11A04..11A09 ; Top # Mn [6] ZANABAZAR SQUARE VOWEL SIGN E..ZANABAZAR SQUARE VOWEL SIGN REVERSED I +11A35..11A38 ; Top # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A3A ; Top # Lo ZANABAZAR SQUARE CLUSTER-INITIAL LETTER RA +11A51 ; Top # Mn SOYOMBO VOWEL SIGN I +11A54..11A56 ; Top # Mn [3] SOYOMBO VOWEL SIGN E..SOYOMBO VOWEL SIGN OE +11A84..11A89 ; Top # Lo [6] SOYOMBO SIGN JIHVAMULIYA..SOYOMBO CLUSTER-INITIAL LETTER SA +11A96 ; Top # Mn SOYOMBO SIGN ANUSVARA +11A98 ; Top # Mn SOYOMBO GEMINATION MARK +11C30..11C31 ; Top # Mn [2] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN II +11C38..11C3D ; Top # Mn [6] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI SIGN ANUSVARA +11CB3 ; Top # Mn MARCHEN VOWEL SIGN E +11CB5..11CB6 ; Top # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D31..11D35 ; Top # Mn [5] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN UU +11D3A ; Top # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Top # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F..11D41 ; Top # Mn [3] MASARAM GONDI VOWEL SIGN AU..MASARAM GONDI SIGN VISARGA +11D43 ; Top # Mn MASARAM GONDI SIGN CANDRA +11D90..11D91 ; Top # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI +11D95 ; Top # Mn GUNJALA GONDI SIGN ANUSVARA +11EF3 ; Top # Mn MAKASAR VOWEL SIGN I +11F00..11F01 ; Top # Mn [2] KAWI SIGN CANDRABINDU..KAWI SIGN ANUSVARA +11F02 ; Top # Lo KAWI SIGN REPHA +11F36..11F37 ; Top # Mn [2] KAWI VOWEL SIGN I..KAWI VOWEL SIGN II 
+11F40 ; Top # Mn KAWI VOWEL SIGN EU + +# Indic_Positional_Category=Bottom + +093C ; Bottom # Mn DEVANAGARI SIGN NUKTA +0941..0944 ; Bottom # Mn [4] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN VOCALIC RR +094D ; Bottom # Mn DEVANAGARI SIGN VIRAMA +0952 ; Bottom # Mn DEVANAGARI STRESS SIGN ANUDATTA +0956..0957 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN UE..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BC ; Bottom # Mn BENGALI SIGN NUKTA +09C1..09C4 ; Bottom # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09CD ; Bottom # Mn BENGALI SIGN VIRAMA +09E2..09E3 ; Bottom # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3C ; Bottom # Mn GURMUKHI SIGN NUKTA +0A41..0A42 ; Bottom # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A4D ; Bottom # Mn GURMUKHI SIGN VIRAMA +0A51 ; Bottom # Mn GURMUKHI SIGN UDAAT +0A75 ; Bottom # Mn GURMUKHI SIGN YAKASH +0ABC ; Bottom # Mn GUJARATI SIGN NUKTA +0AC1..0AC4 ; Bottom # Mn [4] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN VOCALIC RR +0ACD ; Bottom # Mn GUJARATI SIGN VIRAMA +0AE2..0AE3 ; Bottom # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3C ; Bottom # Mn ORIYA SIGN NUKTA +0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B4D ; Bottom # Mn ORIYA SIGN VIRAMA +0B62..0B63 ; Bottom # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0C3C ; Bottom # Mn TELUGU SIGN NUKTA +0C56 ; Bottom # Mn TELUGU AI LENGTH MARK +0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBC ; Bottom # Mn KANNADA SIGN NUKTA +0CE2..0CE3 ; Bottom # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D43..0D44 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC R..MALAYALAM VOWEL SIGN VOCALIC RR +0D62..0D63 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DD4 ; Bottom # Mn SINHALA VOWEL SIGN KETTI 
PAA-PILLA +0DD6 ; Bottom # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0E38..0E3A ; Bottom # Mn [3] THAI CHARACTER SARA U..THAI CHARACTER PHINTHU +0EB8..0EBA ; Bottom # Mn [3] LAO VOWEL SIGN U..LAO SIGN PALI VIRAMA +0EBC ; Bottom # Mn LAO SEMIVOWEL SIGN LO +0F18..0F19 ; Bottom # Mn [2] TIBETAN ASTROLOGICAL SIGN -KHYUD PA..TIBETAN ASTROLOGICAL SIGN SDONG TSHUGS +0F35 ; Bottom # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Bottom # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0F71 ; Bottom # Mn TIBETAN VOWEL SIGN AA +0F74..0F75 ; Bottom # Mn [2] TIBETAN VOWEL SIGN U..TIBETAN VOWEL SIGN UU +0F84 ; Bottom # Mn TIBETAN MARK HALANTA +0F8D..0F97 ; Bottom # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Bottom # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +0FC6 ; Bottom # Mn TIBETAN SYMBOL PADMA GDAN +102F..1030 ; Bottom # Mn [2] MYANMAR VOWEL SIGN U..MYANMAR VOWEL SIGN UU +1037 ; Bottom # Mn MYANMAR SIGN DOT BELOW +103D..103E ; Bottom # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +1058..1059 ; Bottom # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +105E..1060 ; Bottom # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Bottom # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +108D ; Bottom # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +1713..1714 ; Bottom # Mn [2] TAGALOG VOWEL SIGN U..TAGALOG SIGN VIRAMA +1733 ; Bottom # Mn HANUNOO VOWEL SIGN U +1753 ; Bottom # Mn BUHID VOWEL SIGN U +1773 ; Bottom # Mn TAGBANWA VOWEL SIGN U +17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA +1922 ; Bottom # Mn LIMBU VOWEL SIGN U +1932 ; Bottom # Mn LIMBU SMALL LETTER ANUSVARA +1939 ; Bottom # Mn LIMBU SIGN MUKPHRENG +193B ; Bottom # Mn LIMBU SIGN SA-I +1A18 ; Bottom # Mn BUGINESE VOWEL SIGN U +1A56 ; Bottom # Mn TAI THAM CONSONANT SIGN MEDIAL LA +1A5B..1A5E ; Bottom # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM 
CONSONANT SIGN SA +1A69..1A6A ; Bottom # Mn [2] TAI THAM VOWEL SIGN U..TAI THAM VOWEL SIGN UU +1A6C ; Bottom # Mn TAI THAM VOWEL SIGN OA BELOW +1A7F ; Bottom # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1B38..1B3A ; Bottom # Mn [3] BALINESE VOWEL SIGN SUKU..BALINESE VOWEL SIGN RA REPA +1B6C ; Bottom # Mn BALINESE MUSICAL SYMBOL COMBINING ENDEP +1BA2..1BA3 ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BA5 ; Bottom # Mn SUNDANESE VOWEL SIGN PANYUKU +1BAC..1BAD ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C2C ; Bottom # Mn LEPCHA VOWEL SIGN E +1C37 ; Bottom # Mn LEPCHA SIGN NUKTA +1CD5..1CD9 ; Bottom # Mn [5] VEDIC TONE YAJURVEDIC AGGRAVATED INDEPENDENT SVARITA..VEDIC TONE YAJURVEDIC KATHAKA INDEPENDENT SVARITA SCHROEDER +1CDC..1CDF ; Bottom # Mn [4] VEDIC TONE KATHAKA ANUDATTA..VEDIC TONE THREE DOTS BELOW +1CED ; Bottom # Mn VEDIC SIGN TIRYAK +A825 ; Bottom # Mn SYLOTI NAGRI VOWEL SIGN U +A82C ; Bottom # Mn SYLOTI NAGRI SIGN ALTERNATE HASANTA +A8C4 ; Bottom # Mn SAURASHTRA SIGN VIRAMA +A92B..A92D ; Bottom # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +A947..A949 ; Bottom # Mn [3] REJANG VOWEL SIGN I..REJANG VOWEL SIGN E +A94B..A94E ; Bottom # Mn [4] REJANG VOWEL SIGN O..REJANG VOWEL SIGN EA +A9B8..A9B9 ; Bottom # Mn [2] JAVANESE VOWEL SIGN SUKU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BD ; Bottom # Mn JAVANESE CONSONANT SIGN KERET +AA2D ; Bottom # Mn CHAM VOWEL SIGN U +AA32 ; Bottom # Mn CHAM VOWEL SIGN UE +AA35..AA36 ; Bottom # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +AAB4 ; Bottom # Mn TAI VIET VOWEL U +AAEC ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UU +ABE8 ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK +10A02..10A03 ; Bottom # Mn [2] KHAROSHTHI VOWEL SIGN U..KHAROSHTHI VOWEL SIGN VOCALIC R +10A0C..10A0E ; Bottom # Mn [3] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN ANUSVARA +10A39..10A3A ; Bottom # Mn [2] KHAROSHTHI 
SIGN CAUDA..KHAROSHTHI SIGN DOT BELOW +1103C..11041 ; Bottom # Mn [6] BRAHMI VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL +110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU +110B9..110BA ; Bottom # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +110C2 ; Bottom # Mn KAITHI VOWEL SIGN VOCALIC R +1112A..1112B ; Bottom # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU +11131..11132 ; Bottom # Mn [2] CHAKMA O MARK..CHAKMA AU MARK +11173 ; Bottom # Mn MAHAJANI SIGN NUKTA +111B6..111BB ; Bottom # Mn [6] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN VOCALIC LL +111C9..111CA ; Bottom # Mn [2] SHARADA SANDHI MARK..SHARADA SIGN NUKTA +111CC ; Bottom # Mn SHARADA EXTRA SHORT VOWEL MARK +1122F ; Bottom # Mn KHOJKI VOWEL SIGN U +11241 ; Bottom # Mn KHOJKI VOWEL SIGN VOCALIC R +112E3..112E4 ; Bottom # Mn [2] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN UU +112E9..112EA ; Bottom # Mn [2] KHUDAWADI SIGN NUKTA..KHUDAWADI SIGN VIRAMA +1133B..1133C ; Bottom # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +11438..1143D ; Bottom # Mn [6] NEWA VOWEL SIGN U..NEWA VOWEL SIGN VOCALIC LL +11442 ; Bottom # Mn NEWA SIGN VIRAMA +11446 ; Bottom # Mn NEWA SIGN NUKTA +114B3..114B8 ; Bottom # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114C2..114C3 ; Bottom # Mn [2] TIRHUTA SIGN VIRAMA..TIRHUTA SIGN NUKTA +115B2..115B5 ; Bottom # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115BF..115C0 ; Bottom # Mn [2] SIDDHAM SIGN VIRAMA..SIDDHAM SIGN NUKTA +115DC..115DD ; Bottom # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11633..11638 ; Bottom # Mn [6] MODI VOWEL SIGN U..MODI VOWEL SIGN VOCALIC LL +1163F ; Bottom # Mn MODI SIGN VIRAMA +116B0..116B1 ; Bottom # Mn [2] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN UU +116B7 ; Bottom # Mn TAKRI SIGN NUKTA +1171D ; Bottom # Mn AHOM CONSONANT SIGN MEDIAL LA +11724..11725 ; Bottom # Mn [2] AHOM VOWEL SIGN U..AHOM VOWEL SIGN UU +11728 ; Bottom # Mn AHOM VOWEL SIGN O +1182F..11832 ; Bottom # Mn [4] 
DOGRA VOWEL SIGN U..DOGRA VOWEL SIGN VOCALIC RR +11839..1183A ; Bottom # Mn [2] DOGRA SIGN VIRAMA..DOGRA SIGN NUKTA +11943 ; Bottom # Mn DIVES AKURU SIGN NUKTA +119D4..119D7 ; Bottom # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR +119E0 ; Bottom # Mn NANDINAGARI SIGN VIRAMA +11A02..11A03 ; Bottom # Mn [2] ZANABAZAR SQUARE VOWEL SIGN UE..ZANABAZAR SQUARE VOWEL SIGN U +11A0A ; Bottom # Mn ZANABAZAR SQUARE VOWEL LENGTH MARK +11A33..11A34 ; Bottom # Mn [2] ZANABAZAR SQUARE FINAL CONSONANT MARK..ZANABAZAR SQUARE SIGN VIRAMA +11A3B..11A3E ; Bottom # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11A52..11A53 ; Bottom # Mn [2] SOYOMBO VOWEL SIGN UE..SOYOMBO VOWEL SIGN U +11A59..11A5B ; Bottom # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11A8A..11A95 ; Bottom # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A +11C32..11C36 ; Bottom # Mn [5] BHAIKSUKI VOWEL SIGN U..BHAIKSUKI VOWEL SIGN VOCALIC L +11C3F ; Bottom # Mn BHAIKSUKI SIGN VIRAMA +11C92..11CA7 ; Bottom # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CAA..11CB0 ; Bottom # Mn [7] MARCHEN SUBJOINED LETTER RA..MARCHEN VOWEL SIGN AA +11CB2 ; Bottom # Mn MARCHEN VOWEL SIGN U +11D36 ; Bottom # Mn MASARAM GONDI VOWEL SIGN VOCALIC R +11D42 ; Bottom # Mn MASARAM GONDI SIGN NUKTA +11D44 ; Bottom # Mn MASARAM GONDI SIGN HALANTA +11D47 ; Bottom # Mn MASARAM GONDI RA-KARA +11EF4 ; Bottom # Mn MAKASAR VOWEL SIGN U +11F38..11F3A ; Bottom # Mn [3] KAWI VOWEL SIGN U..KAWI VOWEL SIGN VOCALIC R + +# Indic_Positional_Category=Top_And_Bottom + +0C48 ; Top_And_Bottom # Mn TELUGU VOWEL SIGN AI +0F73 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN II +0F76..0F79 ; Top_And_Bottom # Mn [4] TIBETAN VOWEL SIGN VOCALIC R..TIBETAN VOWEL SIGN VOCALIC LL +0F81 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN REVERSED II +1B3C ; Top_And_Bottom # Mn BALINESE VOWEL SIGN LA LENGA +1112E..1112F ; Top_And_Bottom # Mn [2] CHAKMA VOWEL SIGN 
O..CHAKMA VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Right + +0AC9 ; Top_And_Right # Mc GUJARATI VOWEL SIGN CANDRA O +0B57 ; Top_And_Right # Mc ORIYA AU LENGTH MARK +0CC0 ; Top_And_Right # Mc KANNADA VOWEL SIGN II +0CC7..0CC8 ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +1925..1926 ; Top_And_Right # Mc [2] LIMBU VOWEL SIGN OO..LIMBU VOWEL SIGN AU +1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG +111BF ; Top_And_Right # Mc SHARADA VOWEL SIGN AU +11232..11233 ; Top_And_Right # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Left + +0B48 ; Top_And_Left # Mc ORIYA VOWEL SIGN AI +0DDA ; Top_And_Left # Mc SINHALA VOWEL SIGN DIGA KOMBUVA +17BE ; Top_And_Left # Mc KHMER VOWEL SIGN OE +1C29 ; Top_And_Left # Mc LEPCHA VOWEL SIGN OO +114BB ; Top_And_Left # Mc TIRHUTA VOWEL SIGN AI +115B9 ; Top_And_Left # Mc SIDDHAM VOWEL SIGN AI + +# Indic_Positional_Category=Top_And_Left_And_Right + +0B4C ; Top_And_Left_And_Right # Mc ORIYA VOWEL SIGN AU +0DDD ; Top_And_Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA +17BF ; Top_And_Left_And_Right # Mc KHMER VOWEL SIGN YA +115BB ; Top_And_Left_And_Right # Mc SIDDHAM VOWEL SIGN AU + +# Indic_Positional_Category=Bottom_And_Right + +1B3B ; Bottom_And_Right # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +A9BE ; Bottom_And_Right # Mc JAVANESE CONSONANT SIGN PENGKAL +A9C0 ; Bottom_And_Right # Mc JAVANESE PANGKON +11942 ; Bottom_And_Right # Mc DIVES AKURU MEDIAL RA + +# Indic_Positional_Category=Bottom_And_Left + +A9BF ; Bottom_And_Left # Mc JAVANESE CONSONANT SIGN CAKRA + +# Indic_Positional_Category=Top_And_Bottom_And_Right + +1B3D ; Top_And_Bottom_And_Right # Mc BALINESE VOWEL SIGN LA LENGA TEDUNG + +# Indic_Positional_Category=Top_And_Bottom_And_Left + +103C ; Top_And_Bottom_And_Left # Mc MYANMAR CONSONANT SIGN MEDIAL RA +1171E ; Top_And_Bottom_And_Left # Mn AHOM 
CONSONANT SIGN MEDIAL RA + +# Indic_Positional_Category=Overstruck + +1CD4 ; Overstruck # Mn VEDIC SIGN YAJURVEDIC MIDLINE SVARITA +1CE2..1CE8 ; Overstruck # Mn [7] VEDIC SIGN VISARGA SVARITA..VEDIC SIGN VISARGA ANUDATTA WITH TAIL +10A01 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN I +10A06 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN O + +# EOF diff --git a/data/15.0.0-indic-syllabic-category.txt b/data/15.0.0-indic-syllabic-category.txt new file mode 100644 index 0000000..7843c17 --- /dev/null +++ b/data/15.0.0-indic-syllabic-category.txt @@ -0,0 +1,1347 @@ +# IndicSyllabicCategory-15.0.0.txt +# Date: 2022-05-26, 02:18:00 GMT [KW, RP] +# © 2022 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use, see https://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at https://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Syllabic_Category enumerated property +# +# Scope: This property is aimed at two general problem +# areas involving the analysis and processing of Indic scripts: +# +# 1. Specification of syllabic structure. +# 2. Specification of segmentation rules. +# +# Both of these problem areas may benefit from having defined subtypes +# of Indic script characters which are relevant to how Indic +# syllables (or aksaras) are constructed. Note that rules for +# syllabic structure in Indic scripts may differ significantly +# from how phonological syllables are defined. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Syllabic_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. 
+# +# The scripts assessed as Indic in the structural sense used for the +# Indic_Syllabic_Category are the following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dives Akuru, Dogra, Grantha, Gujarati, +# Gunjala Gondi, Gurmukhi, Hanunoo, Javanese, Kaithi, Kannada, Kawi, +# Kayah Li, Kharoshthi, Khmer, Khojki, Khudawadi, Lao, Lepcha, Limbu, +# Mahajani, Makasar, Malayalam, Marchen, Masaram Gondi, Meetei Mayek, +# Modi, Multani, Myanmar, Nandinagari, Newa, New Tai Lue, Oriya, +# Phags-pa, Rejang, Saurashtra, Sharada, Siddham, Sinhala, Soyombo, +# Sundanese, Syloti Nagri, Tagalog, Tagbanwa, Tai Le, Tai Tham, +# Tai Viet, Takri, Tamil, Telugu, Thai, Tibetan, Tirhuta, and +# Zanabazar Square. +# +# All characters for all other scripts not in that list +# take the default value for this property, unless they +# are individually listed in this data file. +# + +# ================================================ + +# Property: Indic_Syllabic_Category +# +# All code points not explicitly listed for Indic_Syllabic_Category +# have the value Other. 
+# +# @missing: 0000..10FFFF; Other + +# ================================================ + +# Indic_Syllabic_Category=Bindu + +# Bindu/Anusvara (nasalization or -n) + +# [Not derivable] + +0900..0902 ; Bindu # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +0981 ; Bindu # Mn BENGALI SIGN CANDRABINDU +0982 ; Bindu # Mc BENGALI SIGN ANUSVARA +09FC ; Bindu # Lo BENGALI LETTER VEDIC ANUSVARA +0A01..0A02 ; Bindu # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A70 ; Bindu # Mn GURMUKHI TIPPI +0A81..0A82 ; Bindu # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0B01 ; Bindu # Mn ORIYA SIGN CANDRABINDU +0B02 ; Bindu # Mc ORIYA SIGN ANUSVARA +0B82 ; Bindu # Mn TAMIL SIGN ANUSVARA +0C00 ; Bindu # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C01..0C02 ; Bindu # Mc [2] TELUGU SIGN CANDRABINDU..TELUGU SIGN ANUSVARA +0C04 ; Bindu # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C80 ; Bindu # Lo KANNADA SIGN SPACING CANDRABINDU +0C81 ; Bindu # Mn KANNADA SIGN CANDRABINDU +0C82 ; Bindu # Mc KANNADA SIGN ANUSVARA +0CF3 ; Bindu # Mc KANNADA SIGN COMBINING ANUSVARA ABOVE RIGHT +0D00..0D01 ; Bindu # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D02 ; Bindu # Mc MALAYALAM SIGN ANUSVARA +0D04 ; Bindu # Lo MALAYALAM LETTER VEDIC ANUSVARA +0D81 ; Bindu # Mn SINHALA SIGN CANDRABINDU +0D82 ; Bindu # Mc SINHALA SIGN ANUSVARAYA +0E4D ; Bindu # Mn THAI CHARACTER NIKHAHIT +0ECD ; Bindu # Mn LAO NIGGAHITA +0F7E ; Bindu # Mn TIBETAN SIGN RJES SU NGA RO +0F82..0F83 ; Bindu # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +1036 ; Bindu # Mn MYANMAR SIGN ANUSVARA +17C6 ; Bindu # Mn KHMER SIGN NIKAHIT +1932 ; Bindu # Mn LIMBU SMALL LETTER ANUSVARA +1A74 ; Bindu # Mn TAI THAM SIGN MAI KANG +1B00..1B02 ; Bindu # Mn [3] BALINESE SIGN ULU RICEM..BALINESE SIGN CECEK +1B80 ; Bindu # Mn SUNDANESE SIGN PANYECEK +1C34..1C35 ; Bindu # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A80B ; Bindu # Mn SYLOTI NAGRI 
SIGN ANUSVARA +A873 ; Bindu # Lo PHAGS-PA LETTER CANDRABINDU +A880 ; Bindu # Mc SAURASHTRA SIGN ANUSVARA +A8C5 ; Bindu # Mn SAURASHTRA SIGN CANDRABINDU +A8F2..A8F3 ; Bindu # Lo [2] DEVANAGARI SIGN SPACING CANDRABINDU..DEVANAGARI SIGN CANDRABINDU VIRAMA +A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK +10A0E ; Bindu # Mn KHAROSHTHI SIGN ANUSVARA +11000 ; Bindu # Mc BRAHMI SIGN CANDRABINDU +11001 ; Bindu # Mn BRAHMI SIGN ANUSVARA +11080..11081 ; Bindu # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +11100..11101 ; Bindu # Mn [2] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN ANUSVARA +11180..11181 ; Bindu # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +111CF ; Bindu # Mn SHARADA SIGN INVERTED CANDRABINDU +11234 ; Bindu # Mn KHOJKI SIGN ANUSVARA +112DF ; Bindu # Mn KHUDAWADI SIGN ANUSVARA +11300..11301 ; Bindu # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11302 ; Bindu # Mc GRANTHA SIGN ANUSVARA +1135E..1135F ; Bindu # Lo [2] GRANTHA LETTER VEDIC ANUSVARA..GRANTHA LETTER VEDIC DOUBLE ANUSVARA +11443..11444 ; Bindu # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +1145F ; Bindu # Lo NEWA LETTER VEDIC ANUSVARA +114BF..114C0 ; Bindu # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Bindu # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +1163D ; Bindu # Mn MODI SIGN ANUSVARA +116AB ; Bindu # Mn TAKRI SIGN ANUSVARA +11837 ; Bindu # Mn DOGRA SIGN ANUSVARA +1193B..1193C ; Bindu # Mn [2] DIVES AKURU SIGN ANUSVARA..DIVES AKURU SIGN CANDRABINDU +119DE ; Bindu # Mc NANDINAGARI SIGN ANUSVARA +11A35..11A38 ; Bindu # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A96 ; Bindu # Mn SOYOMBO SIGN ANUSVARA +11C3C..11C3D ; Bindu # Mn [2] BHAIKSUKI SIGN CANDRABINDU..BHAIKSUKI SIGN ANUSVARA +11CB5..11CB6 ; Bindu # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D40 ; Bindu # Mn MASARAM GONDI SIGN ANUSVARA +11D95 ; Bindu # Mn GUNJALA GONDI SIGN ANUSVARA 
+11F00..11F01 ; Bindu # Mn [2] KAWI SIGN CANDRABINDU..KAWI SIGN ANUSVARA + +# ================================================ + +# Indic_Syllabic_Category=Visarga + +# Visarga (-h) +# Excludes letters for jihvamuliya and upadhmaniya, which are +# related, but structured somewhat differently. + +# [Not derivable] + +0903 ; Visarga # Mc DEVANAGARI SIGN VISARGA +0983 ; Visarga # Mc BENGALI SIGN VISARGA +0A03 ; Visarga # Mc GURMUKHI SIGN VISARGA +0A83 ; Visarga # Mc GUJARATI SIGN VISARGA +0B03 ; Visarga # Mc ORIYA SIGN VISARGA +0C03 ; Visarga # Mc TELUGU SIGN VISARGA +0C83 ; Visarga # Mc KANNADA SIGN VISARGA +0D03 ; Visarga # Mc MALAYALAM SIGN VISARGA +0D83 ; Visarga # Mc SINHALA SIGN VISARGAYA +0F7F ; Visarga # Mc TIBETAN SIGN RNAM BCAD +1038 ; Visarga # Mc MYANMAR SIGN VISARGA +17C7 ; Visarga # Mc KHMER SIGN REAHMUK +1B04 ; Visarga # Mc BALINESE SIGN BISAH +1B82 ; Visarga # Mc SUNDANESE SIGN PANGWISAD +A881 ; Visarga # Mc SAURASHTRA SIGN VISARGA +A983 ; Visarga # Mc JAVANESE SIGN WIGNYAN +AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA +10A0F ; Visarga # Mn KHAROSHTHI SIGN VISARGA +11002 ; Visarga # Mc BRAHMI SIGN VISARGA +11082 ; Visarga # Mc KAITHI SIGN VISARGA +11102 ; Visarga # Mn CHAKMA SIGN VISARGA +11182 ; Visarga # Mc SHARADA SIGN VISARGA +11303 ; Visarga # Mc GRANTHA SIGN VISARGA +11445 ; Visarga # Mc NEWA SIGN VISARGA +114C1 ; Visarga # Mc TIRHUTA SIGN VISARGA +115BE ; Visarga # Mc SIDDHAM SIGN VISARGA +1163E ; Visarga # Mc MODI SIGN VISARGA +116AC ; Visarga # Mc TAKRI SIGN VISARGA +11838 ; Visarga # Mc DOGRA SIGN VISARGA +119DF ; Visarga # Mc NANDINAGARI SIGN VISARGA +11A39 ; Visarga # Mc ZANABAZAR SQUARE SIGN VISARGA +11A97 ; Visarga # Mc SOYOMBO SIGN VISARGA +11C3E ; Visarga # Mc BHAIKSUKI SIGN VISARGA +11D41 ; Visarga # Mn MASARAM GONDI SIGN VISARGA +11D96 ; Visarga # Mc GUNJALA GONDI SIGN VISARGA +11F03 ; Visarga # Mc KAWI SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Avagraha + +# Avagraha 
(elision of initial a- in sandhi) + +# [Not derivable] + +093D ; Avagraha # Lo DEVANAGARI SIGN AVAGRAHA +09BD ; Avagraha # Lo BENGALI SIGN AVAGRAHA +0ABD ; Avagraha # Lo GUJARATI SIGN AVAGRAHA +0B3D ; Avagraha # Lo ORIYA SIGN AVAGRAHA +0C3D ; Avagraha # Lo TELUGU SIGN AVAGRAHA +0CBD ; Avagraha # Lo KANNADA SIGN AVAGRAHA +0D3D ; Avagraha # Lo MALAYALAM SIGN AVAGRAHA +0F85 ; Avagraha # Po TIBETAN MARK PALUTA +17DC ; Avagraha # Lo KHMER SIGN AVAKRAHASANYA +1BBA ; Avagraha # Lo SUNDANESE AVAGRAHA +111C1 ; Avagraha # Lo SHARADA SIGN AVAGRAHA +1133D ; Avagraha # Lo GRANTHA SIGN AVAGRAHA +11447 ; Avagraha # Lo NEWA SIGN AVAGRAHA +114C4 ; Avagraha # Lo TIRHUTA SIGN AVAGRAHA +119E1 ; Avagraha # Lo NANDINAGARI SIGN AVAGRAHA +11A9D ; Avagraha # Lo SOYOMBO MARK PLUTA +11C40 ; Avagraha # Lo BHAIKSUKI SIGN AVAGRAHA + +# ================================================ + +# Indic_Syllabic_Category=Nukta + +# Nukta (diacritic for borrowed consonants or other consonant +# modifications). Note that while the resulting sound is typically a +# consonant, the base letter a nukta follows may be an independent +# vowel. For example, is used to transcribe ARABIC LETTER +# AIN. 
+ +# [Not derivable] + +093C ; Nukta # Mn DEVANAGARI SIGN NUKTA +09BC ; Nukta # Mn BENGALI SIGN NUKTA +0A3C ; Nukta # Mn GURMUKHI SIGN NUKTA +0ABC ; Nukta # Mn GUJARATI SIGN NUKTA +0AFD..0AFF ; Nukta # Mn [3] GUJARATI SIGN THREE-DOT NUKTA ABOVE..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0C3C ; Nukta # Mn TELUGU SIGN NUKTA +0CBC ; Nukta # Mn KANNADA SIGN NUKTA +0F39 ; Nukta # Mn TIBETAN MARK TSA -PHRU +1B34 ; Nukta # Mn BALINESE SIGN REREKAN +1BE6 ; Nukta # Mn BATAK SIGN TOMPI +1C37 ; Nukta # Mn LEPCHA SIGN NUKTA +A9B3 ; Nukta # Mn JAVANESE SIGN CECAK TELU +10A38..10A3A ; Nukta # Mn [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW +110BA ; Nukta # Mn KAITHI SIGN NUKTA +11173 ; Nukta # Mn MAHAJANI SIGN NUKTA +111CA ; Nukta # Mn SHARADA SIGN NUKTA +11236 ; Nukta # Mn KHOJKI SIGN NUKTA +112E9 ; Nukta # Mn KHUDAWADI SIGN NUKTA +1133B..1133C ; Nukta # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +11446 ; Nukta # Mn NEWA SIGN NUKTA +114C3 ; Nukta # Mn TIRHUTA SIGN NUKTA +115C0 ; Nukta # Mn SIDDHAM SIGN NUKTA +116B7 ; Nukta # Mn TAKRI SIGN NUKTA +1183A ; Nukta # Mn DOGRA SIGN NUKTA +11943 ; Nukta # Mn DIVES AKURU SIGN NUKTA +11D42 ; Nukta # Mn MASARAM GONDI SIGN NUKTA + +# ================================================ + +# Indic_Syllabic_Category=Virama + +# Virama (killing of inherent vowel in consonant sequence +# or consonant stacker) +# Only includes characters that can act both as visible killer viramas +# and consonant stackers. Separate property values exist for characters +# that can only act as pure killers or only as consonant stackers. 
+ +# [Derivation: (ccc=9) - (InSC=Pure_Killer) - (InSC=Invisible_Stacker) +# - (InSC=Number_Joiner) - 2D7F] + +094D ; Virama # Mn DEVANAGARI SIGN VIRAMA +09CD ; Virama # Mn BENGALI SIGN VIRAMA +0A4D ; Virama # Mn GURMUKHI SIGN VIRAMA +0ACD ; Virama # Mn GUJARATI SIGN VIRAMA +0B4D ; Virama # Mn ORIYA SIGN VIRAMA +0BCD ; Virama # Mn TAMIL SIGN VIRAMA +0C4D ; Virama # Mn TELUGU SIGN VIRAMA +0CCD ; Virama # Mn KANNADA SIGN VIRAMA +0D4D ; Virama # Mn MALAYALAM SIGN VIRAMA +0DCA ; Virama # Mn SINHALA SIGN AL-LAKUNA +1B44 ; Virama # Mc BALINESE ADEG ADEG +A806 ; Virama # Mn SYLOTI NAGRI SIGN HASANTA +A8C4 ; Virama # Mn SAURASHTRA SIGN VIRAMA +A9C0 ; Virama # Mc JAVANESE PANGKON +11046 ; Virama # Mn BRAHMI VIRAMA +110B9 ; Virama # Mn KAITHI SIGN VIRAMA +111C0 ; Virama # Mc SHARADA SIGN VIRAMA +11235 ; Virama # Mc KHOJKI SIGN VIRAMA +1134D ; Virama # Mc GRANTHA SIGN VIRAMA +11442 ; Virama # Mn NEWA SIGN VIRAMA +114C2 ; Virama # Mn TIRHUTA SIGN VIRAMA +115BF ; Virama # Mn SIDDHAM SIGN VIRAMA +1163F ; Virama # Mn MODI SIGN VIRAMA +116B6 ; Virama # Mc TAKRI SIGN VIRAMA +11839 ; Virama # Mn DOGRA SIGN VIRAMA +119E0 ; Virama # Mn NANDINAGARI SIGN VIRAMA +11C3F ; Virama # Mn BHAIKSUKI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Pure_Killer + +# Pure killer (killing of inherent vowel in consonant sequence, +# with no consonant stacking behavior) + +# [Not derivable] + +0D3B..0D3C ; Pure_Killer # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0E3A ; Pure_Killer # Mn THAI CHARACTER PHINTHU +0E4E ; Pure_Killer # Mn THAI CHARACTER YAMAKKAN +0EBA ; Pure_Killer # Mn LAO SIGN PALI VIRAMA +0F84 ; Pure_Killer # Mn TIBETAN MARK HALANTA +103A ; Pure_Killer # Mn MYANMAR SIGN ASAT +1714 ; Pure_Killer # Mn TAGALOG SIGN VIRAMA +1715 ; Pure_Killer # Mc TAGALOG SIGN PAMUDPOD +1734 ; Pure_Killer # Mc HANUNOO SIGN PAMUDPOD +17D1 ; Pure_Killer # Mn KHMER SIGN VIRIAM +1A7A ; Pure_Killer # Mn TAI THAM SIGN RA HAAM +1BAA ; 
Pure_Killer # Mc SUNDANESE SIGN PAMAAEH +1BF2..1BF3 ; Pure_Killer # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +A82C ; Pure_Killer # Mn SYLOTI NAGRI SIGN ALTERNATE HASANTA +A953 ; Pure_Killer # Mc REJANG VIRAMA +ABED ; Pure_Killer # Mn MEETEI MAYEK APUN IYEK +11070 ; Pure_Killer # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11134 ; Pure_Killer # Mn CHAKMA MAAYYAA +112EA ; Pure_Killer # Mn KHUDAWADI SIGN VIRAMA +1172B ; Pure_Killer # Mn AHOM SIGN KILLER +1193D ; Pure_Killer # Mc DIVES AKURU SIGN HALANTA +11A34 ; Pure_Killer # Mn ZANABAZAR SQUARE SIGN VIRAMA +11D44 ; Pure_Killer # Mn MASARAM GONDI SIGN HALANTA +11F41 ; Pure_Killer # Mc KAWI SIGN KILLER + +# ================================================ + +# Indic_Syllabic_Category=Invisible_Stacker + +# Invisible stacker (invisible consonant stacker virama). +# +# Note that in some scripts, such as Kharoshthi and Masaram Gondi, an invisible +# stacker may have a second function, changing the shape and/or location of the +# consonant preceding it, even when there is no consonant following the +# invisible stacker. 
+ +# [Not derivable] + +1039 ; Invisible_Stacker # Mn MYANMAR SIGN VIRAMA +17D2 ; Invisible_Stacker # Mn KHMER SIGN COENG +1A60 ; Invisible_Stacker # Mn TAI THAM SIGN SAKOT +1BAB ; Invisible_Stacker # Mn SUNDANESE SIGN VIRAMA +AAF6 ; Invisible_Stacker # Mn MEETEI MAYEK VIRAMA +10A3F ; Invisible_Stacker # Mn KHAROSHTHI VIRAMA +11133 ; Invisible_Stacker # Mn CHAKMA VIRAMA +1193E ; Invisible_Stacker # Mn DIVES AKURU VIRAMA +11A47 ; Invisible_Stacker # Mn ZANABAZAR SQUARE SUBJOINER +11A99 ; Invisible_Stacker # Mn SOYOMBO SUBJOINER +11D45 ; Invisible_Stacker # Mn MASARAM GONDI VIRAMA +11D97 ; Invisible_Stacker # Mn GUNJALA GONDI VIRAMA +11F42 ; Invisible_Stacker # Mn KAWI CONJOINER + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Independent + +# Independent Vowels (contrasted with matras) + +# [Not derivable] + +0904..0914 ; Vowel_Independent # Lo [17] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER AU +0960..0961 ; Vowel_Independent # Lo [2] DEVANAGARI LETTER VOCALIC RR..DEVANAGARI LETTER VOCALIC LL +0972..0977 ; Vowel_Independent # Lo [6] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER UUE +0985..098C ; Vowel_Independent # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L +098F..0990 ; Vowel_Independent # Lo [2] BENGALI LETTER E..BENGALI LETTER AI +0993..0994 ; Vowel_Independent # Lo [2] BENGALI LETTER O..BENGALI LETTER AU +09E0..09E1 ; Vowel_Independent # Lo [2] BENGALI LETTER VOCALIC RR..BENGALI LETTER VOCALIC LL +0A05..0A0A ; Vowel_Independent # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU +0A0F..0A10 ; Vowel_Independent # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI +0A13..0A14 ; Vowel_Independent # Lo [2] GURMUKHI LETTER OO..GURMUKHI LETTER AU +0A85..0A8D ; Vowel_Independent # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E +0A8F..0A91 ; Vowel_Independent # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O +0A93..0A94 ; Vowel_Independent # Lo [2] GUJARATI LETTER O..GUJARATI LETTER AU +0AE0..0AE1 ; Vowel_Independent # Lo [2] 
GUJARATI LETTER VOCALIC RR..GUJARATI LETTER VOCALIC LL +0B05..0B0C ; Vowel_Independent # Lo [8] ORIYA LETTER A..ORIYA LETTER VOCALIC L +0B0F..0B10 ; Vowel_Independent # Lo [2] ORIYA LETTER E..ORIYA LETTER AI +0B13..0B14 ; Vowel_Independent # Lo [2] ORIYA LETTER O..ORIYA LETTER AU +0B60..0B61 ; Vowel_Independent # Lo [2] ORIYA LETTER VOCALIC RR..ORIYA LETTER VOCALIC LL +0B85..0B8A ; Vowel_Independent # Lo [6] TAMIL LETTER A..TAMIL LETTER UU +0B8E..0B90 ; Vowel_Independent # Lo [3] TAMIL LETTER E..TAMIL LETTER AI +0B92..0B94 ; Vowel_Independent # Lo [3] TAMIL LETTER O..TAMIL LETTER AU +0C05..0C0C ; Vowel_Independent # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L +0C0E..0C10 ; Vowel_Independent # Lo [3] TELUGU LETTER E..TELUGU LETTER AI +0C12..0C14 ; Vowel_Independent # Lo [3] TELUGU LETTER O..TELUGU LETTER AU +0C60..0C61 ; Vowel_Independent # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL +0C85..0C8C ; Vowel_Independent # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L +0C8E..0C90 ; Vowel_Independent # Lo [3] KANNADA LETTER E..KANNADA LETTER AI +0C92..0C94 ; Vowel_Independent # Lo [3] KANNADA LETTER O..KANNADA LETTER AU +0CE0..0CE1 ; Vowel_Independent # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL +0D05..0D0C ; Vowel_Independent # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L +0D0E..0D10 ; Vowel_Independent # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI +0D12..0D14 ; Vowel_Independent # Lo [3] MALAYALAM LETTER O..MALAYALAM LETTER AU +0D5F..0D61 ; Vowel_Independent # Lo [3] MALAYALAM LETTER ARCHAIC II..MALAYALAM LETTER VOCALIC LL +0D85..0D96 ; Vowel_Independent # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA +1021..102A ; Vowel_Independent # Lo [10] MYANMAR LETTER A..MYANMAR LETTER AU +1052..1055 ; Vowel_Independent # Lo [4] MYANMAR LETTER VOCALIC R..MYANMAR LETTER VOCALIC LL +1700..1702 ; Vowel_Independent # Lo [3] TAGALOG LETTER A..TAGALOG LETTER U +1720..1722 ; Vowel_Independent # Lo [3] HANUNOO LETTER A..HANUNOO 
LETTER U +1740..1742 ; Vowel_Independent # Lo [3] BUHID LETTER A..BUHID LETTER U +1760..1762 ; Vowel_Independent # Lo [3] TAGBANWA LETTER A..TAGBANWA LETTER U +17A3..17B3 ; Vowel_Independent # Lo [17] KHMER INDEPENDENT VOWEL QAQ..KHMER INDEPENDENT VOWEL QAU +1A4D..1A52 ; Vowel_Independent # Lo [6] TAI THAM LETTER I..TAI THAM LETTER OO +1B05..1B12 ; Vowel_Independent # Lo [14] BALINESE LETTER AKARA..BALINESE LETTER OKARA TEDUNG +1B83..1B89 ; Vowel_Independent # Lo [7] SUNDANESE LETTER A..SUNDANESE LETTER EU +1BE4..1BE5 ; Vowel_Independent # Lo [2] BATAK LETTER I..BATAK LETTER U +A800..A801 ; Vowel_Independent # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I +A803..A805 ; Vowel_Independent # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O +A882..A891 ; Vowel_Independent # Lo [16] SAURASHTRA LETTER A..SAURASHTRA LETTER AU +A8FE ; Vowel_Independent # Lo DEVANAGARI LETTER AY +A984..A988 ; Vowel_Independent # Lo [5] JAVANESE LETTER A..JAVANESE LETTER U +A98C..A98E ; Vowel_Independent # Lo [3] JAVANESE LETTER E..JAVANESE LETTER O +AA00..AA05 ; Vowel_Independent # Lo [6] CHAM LETTER A..CHAM LETTER O +AAE0..AAE1 ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER E..MEETEI MAYEK LETTER O +ABCE..ABCF ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER UN..MEETEI MAYEK LETTER I +ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA +11005..11012 ; Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU +11071..11072 ; Vowel_Independent # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER A..KAITHI LETTER AU +11103..11106 ; Vowel_Independent # Lo [4] CHAKMA LETTER AA..CHAKMA LETTER E +11183..11190 ; Vowel_Independent # Lo [14] SHARADA LETTER A..SHARADA LETTER AU +11200..11207 ; Vowel_Independent # Lo [8] KHOJKI LETTER A..KHOJKI LETTER AU +11240 ; Vowel_Independent # Lo KHOJKI LETTER SHORT I +11280..11283 ; Vowel_Independent # Lo [4] MULTANI LETTER A..MULTANI LETTER E +112B0..112B9 ; 
Vowel_Independent # Lo [10] KHUDAWADI LETTER A..KHUDAWADI LETTER AU +11305..1130C ; Vowel_Independent # Lo [8] GRANTHA LETTER A..GRANTHA LETTER VOCALIC L +1130F..11310 ; Vowel_Independent # Lo [2] GRANTHA LETTER EE..GRANTHA LETTER AI +11313..11314 ; Vowel_Independent # Lo [2] GRANTHA LETTER OO..GRANTHA LETTER AU +11360..11361 ; Vowel_Independent # Lo [2] GRANTHA LETTER VOCALIC RR..GRANTHA LETTER VOCALIC LL +11400..1140D ; Vowel_Independent # Lo [14] NEWA LETTER A..NEWA LETTER AU +11481..1148E ; Vowel_Independent # Lo [14] TIRHUTA LETTER A..TIRHUTA LETTER AU +11580..1158D ; Vowel_Independent # Lo [14] SIDDHAM LETTER A..SIDDHAM LETTER AU +115D8..115DB ; Vowel_Independent # Lo [4] SIDDHAM LETTER THREE-CIRCLE ALTERNATE I..SIDDHAM LETTER ALTERNATE U +11600..1160D ; Vowel_Independent # Lo [14] MODI LETTER A..MODI LETTER AU +11680..11689 ; Vowel_Independent # Lo [10] TAKRI LETTER A..TAKRI LETTER AU +11800..11809 ; Vowel_Independent # Lo [10] DOGRA LETTER A..DOGRA LETTER AU +11900..11906 ; Vowel_Independent # Lo [7] DIVES AKURU LETTER A..DIVES AKURU LETTER E +11909 ; Vowel_Independent # Lo DIVES AKURU LETTER O +119A0..119A7 ; Vowel_Independent # Lo [8] NANDINAGARI LETTER A..NANDINAGARI LETTER VOCALIC RR +119AA..119AD ; Vowel_Independent # Lo [4] NANDINAGARI LETTER E..NANDINAGARI LETTER AU +11A00 ; Vowel_Independent # Lo ZANABAZAR SQUARE LETTER A +11A50 ; Vowel_Independent # Lo SOYOMBO LETTER A +11C00..11C08 ; Vowel_Independent # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L +11C0A..11C0D ; Vowel_Independent # Lo [4] BHAIKSUKI LETTER E..BHAIKSUKI LETTER AU +11D00..11D06 ; Vowel_Independent # Lo [7] MASARAM GONDI LETTER A..MASARAM GONDI LETTER E +11D08..11D09 ; Vowel_Independent # Lo [2] MASARAM GONDI LETTER AI..MASARAM GONDI LETTER O +11D0B ; Vowel_Independent # Lo MASARAM GONDI LETTER AU +11D60..11D65 ; Vowel_Independent # Lo [6] GUNJALA GONDI LETTER A..GUNJALA GONDI LETTER UU +11D67..11D68 ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER EE..GUNJALA GONDI LETTER 
AI +11D6A..11D6B ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER OO..GUNJALA GONDI LETTER AU +11F04..11F10 ; Vowel_Independent # Lo [13] KAWI LETTER A..KAWI LETTER O + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Dependent + +# Dependent Vowels (contrasted with independent vowels and/or with +# complex placement). Known as matras in Indic scripts. Also +# includes vowel modifiers that follow dependent (and sometimes +# independent) vowels. + +# [Not derivable] + +093A ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN OE +093B ; Vowel_Dependent # Mc DEVANAGARI VOWEL SIGN OOE +093E..0940 ; Vowel_Dependent # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II +0941..0948 ; Vowel_Dependent # Mn [8] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN AI +0949..094C ; Vowel_Dependent # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094E..094F ; Vowel_Dependent # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA E..DEVANAGARI VOWEL SIGN AW +0955..0957 ; Vowel_Dependent # Mn [3] DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Vowel_Dependent # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BE..09C0 ; Vowel_Dependent # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II +09C1..09C4 ; Vowel_Dependent # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09C7..09C8 ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +09CB..09CC ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +09D7 ; Vowel_Dependent # Mc BENGALI AU LENGTH MARK +09E2..09E3 ; Vowel_Dependent # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3E..0A40 ; Vowel_Dependent # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II +0A41..0A42 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A47..0A48 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Vowel_Dependent # Mn [2] 
GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0ABE..0AC0 ; Vowel_Dependent # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL SIGN II +0AC1..0AC5 ; Vowel_Dependent # Mn [5] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AC9 ; Vowel_Dependent # Mc GUJARATI VOWEL SIGN CANDRA O +0ACB..0ACC ; Vowel_Dependent # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0AE2..0AE3 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3E ; Vowel_Dependent # Mc ORIYA VOWEL SIGN AA +0B3F ; Vowel_Dependent # Mn ORIYA VOWEL SIGN I +0B40 ; Vowel_Dependent # Mc ORIYA VOWEL SIGN II +0B41..0B44 ; Vowel_Dependent # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B47..0B48 ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI +0B4B..0B4C ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU +0B55..0B56 ; Vowel_Dependent # Mn [2] ORIYA SIGN OVERLINE..ORIYA AI LENGTH MARK +0B57 ; Vowel_Dependent # Mc ORIYA AU LENGTH MARK +0B62..0B63 ; Vowel_Dependent # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BBE..0BBF ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC0 ; Vowel_Dependent # Mn TAMIL VOWEL SIGN II +0BC1..0BC2 ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BC6..0BC8 ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0BCA..0BCC ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0BD7 ; Vowel_Dependent # Mc TAMIL AU LENGTH MARK +0C3E..0C40 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C41..0C44 ; Vowel_Dependent # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C46..0C48 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI +0C4A..0C4C ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C55..0C56 ; Vowel_Dependent # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK 
+0C62..0C63 ; Vowel_Dependent # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBE ; Vowel_Dependent # Mc KANNADA VOWEL SIGN AA +0CBF ; Vowel_Dependent # Mn KANNADA VOWEL SIGN I +0CC0..0CC4 ; Vowel_Dependent # Mc [5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN VOCALIC RR +0CC6 ; Vowel_Dependent # Mn KANNADA VOWEL SIGN E +0CC7..0CC8 ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +0CCC ; Vowel_Dependent # Mn KANNADA VOWEL SIGN AU +0CD5..0CD6 ; Vowel_Dependent # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CE2..0CE3 ; Vowel_Dependent # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D3E..0D40 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D44 ; Vowel_Dependent # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D46..0D48 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0D4A..0D4C ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0D57 ; Vowel_Dependent # Mc MALAYALAM AU LENGTH MARK +0D62..0D63 ; Vowel_Dependent # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DCF..0DD1 ; Vowel_Dependent # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD2..0DD4 ; Vowel_Dependent # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Vowel_Dependent # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0DD8..0DDF ; Vowel_Dependent # Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Vowel_Dependent # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Vowel_Dependent # Lo THAI CHARACTER SARA A +0E31 ; Vowel_Dependent # Mn THAI CHARACTER MAI HAN-AKAT +0E32..0E33 ; Vowel_Dependent # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E34..0E39 ; Vowel_Dependent # Mn [6] THAI CHARACTER SARA 
I..THAI CHARACTER SARA UU +0E40..0E45 ; Vowel_Dependent # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO +0E47 ; Vowel_Dependent # Mn THAI CHARACTER MAITAIKHU +0EB0 ; Vowel_Dependent # Lo LAO VOWEL SIGN A +0EB1 ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KAN +0EB2..0EB3 ; Vowel_Dependent # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0EB4..0EB9 ; Vowel_Dependent # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU +0EBB ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KON +0EC0..0EC4 ; Vowel_Dependent # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +0F71..0F7D ; Vowel_Dependent # Mn [13] TIBETAN VOWEL SIGN AA..TIBETAN VOWEL SIGN OO +0F80..0F81 ; Vowel_Dependent # Mn [2] TIBETAN VOWEL SIGN REVERSED I..TIBETAN VOWEL SIGN REVERSED II +102B..102C ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +102D..1030 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN UU +1031 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN E +1032..1035 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +1056..1057 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1058..1059 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1062 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1071..1074 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1083..1084 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E +1085..1086 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109C ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN AITON A +109D ; Vowel_Dependent # Mn MYANMAR VOWEL SIGN AITON AI +1712..1713 ; Vowel_Dependent # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U +1732..1733 ; Vowel_Dependent # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U 
+1752..1753 ; Vowel_Dependent # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U +1772..1773 ; Vowel_Dependent # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U +17B6 ; Vowel_Dependent # Mc KHMER VOWEL SIGN AA +17B7..17BD ; Vowel_Dependent # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL SIGN UA +17BE..17C5 ; Vowel_Dependent # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU +17C8 ; Vowel_Dependent # Mc KHMER SIGN YUUKALEAPINTU +1920..1922 ; Vowel_Dependent # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U +1923..1926 ; Vowel_Dependent # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU +1927..1928 ; Vowel_Dependent # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Vowel_Dependent # Mn LIMBU SIGN KEMPHRENG +19B0..19C0 ; Vowel_Dependent # Lo [17] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN IY +1A17..1A18 ; Vowel_Dependent # Mn [2] BUGINESE VOWEL SIGN I..BUGINESE VOWEL SIGN U +1A19..1A1A ; Vowel_Dependent # Mc [2] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN O +1A1B ; Vowel_Dependent # Mn BUGINESE VOWEL SIGN AE +1A61 ; Vowel_Dependent # Mc TAI THAM VOWEL SIGN A +1A62 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN MAI SAT +1A63..1A64 ; Vowel_Dependent # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A65..1A6C ; Vowel_Dependent # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW +1A6D..1A72 ; Vowel_Dependent # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI +1A73 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN OA ABOVE +1B35 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN TEDUNG +1B36..1B3A ; Vowel_Dependent # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA +1B3B ; Vowel_Dependent # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +1B3C ; Vowel_Dependent # Mn BALINESE VOWEL SIGN LA LENGA +1B3D..1B41 ; Vowel_Dependent # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1B42 ; Vowel_Dependent # Mn BALINESE VOWEL SIGN PEPET +1B43 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN PEPET TEDUNG +1BA4..1BA5 ; 
Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PANGHULU..SUNDANESE VOWEL SIGN PANYUKU +1BA6..1BA7 ; Vowel_Dependent # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL SIGN PANOLONG +1BA8..1BA9 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE7 ; Vowel_Dependent # Mc BATAK VOWEL SIGN E +1BE8..1BE9 ; Vowel_Dependent # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BEA..1BEC ; Vowel_Dependent # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BED ; Vowel_Dependent # Mn BATAK VOWEL SIGN KARO O +1BEE ; Vowel_Dependent # Mc BATAK VOWEL SIGN U +1BEF ; Vowel_Dependent # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +1C26..1C2B ; Vowel_Dependent # Mc [6] LEPCHA VOWEL SIGN AA..LEPCHA VOWEL SIGN UU +1C2C ; Vowel_Dependent # Mn LEPCHA VOWEL SIGN E +A802 ; Vowel_Dependent # Mn SYLOTI NAGRI SIGN DVISVARA +A823..A824 ; Vowel_Dependent # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A825..A826 ; Vowel_Dependent # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E +A827 ; Vowel_Dependent # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Vowel_Dependent # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A8FF ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN AY +A947..A94E ; Vowel_Dependent # Mn [8] REJANG VOWEL SIGN I..REJANG VOWEL SIGN EA +A9B4..A9B5 ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9B6..A9B9 ; Vowel_Dependent # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BA..A9BB ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +A9BC ; Vowel_Dependent # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Vowel_Dependent # Mn MYANMAR SIGN SHAN SAW +AA29..AA2E ; Vowel_Dependent # Mn [6] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN OE +AA2F..AA30 ; Vowel_Dependent # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA31..AA32 ; Vowel_Dependent # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE +AAB0 ; Vowel_Dependent # Mn TAI VIET MAI KANG 
+AAB1 ; Vowel_Dependent # Lo TAI VIET VOWEL AA +AAB2..AAB4 ; Vowel_Dependent # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U +AAB5..AAB6 ; Vowel_Dependent # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB7..AAB8 ; Vowel_Dependent # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AAB9..AABD ; Vowel_Dependent # Lo [5] TAI VIET VOWEL UEA..TAI VIET VOWEL AN +AABE ; Vowel_Dependent # Mn TAI VIET VOWEL AM +AAEB ; Vowel_Dependent # Mc MEETEI MAYEK VOWEL SIGN II +AAEC..AAED ; Vowel_Dependent # Mn [2] MEETEI MAYEK VOWEL SIGN UU..MEETEI MAYEK VOWEL SIGN AAI +AAEE..AAEF ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN AU..MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE5 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN ANAP +ABE6..ABE7 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE8 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +10A01..10A03 ; Vowel_Dependent # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R +10A05..10A06 ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O +10A0C..10A0D ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN DOUBLE RING BELOW +11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +11073..11074 ; Vowel_Dependent # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +110B0..110B2 ; Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II +110B3..110B6 ; Vowel_Dependent # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI +110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +110C2 ; Vowel_Dependent # Mn KAITHI VOWEL SIGN VOCALIC R +11127..1112B ; Vowel_Dependent # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU +1112C ; Vowel_Dependent # Mc CHAKMA VOWEL SIGN E 
+1112D..11132 ; Vowel_Dependent # Mn [6] CHAKMA VOWEL SIGN AI..CHAKMA AU MARK +11145..11146 ; Vowel_Dependent # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +111B3..111B5 ; Vowel_Dependent # Mc [3] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN II +111B6..111BE ; Vowel_Dependent # Mn [9] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN O +111BF ; Vowel_Dependent # Mc SHARADA VOWEL SIGN AU +111CB..111CC ; Vowel_Dependent # Mn [2] SHARADA VOWEL MODIFIER MARK..SHARADA EXTRA SHORT VOWEL MARK +111CE ; Vowel_Dependent # Mc SHARADA VOWEL SIGN PRISHTHAMATRA E +1122C..1122E ; Vowel_Dependent # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +1122F..11231 ; Vowel_Dependent # Mn [3] KHOJKI VOWEL SIGN U..KHOJKI VOWEL SIGN AI +11232..11233 ; Vowel_Dependent # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU +11241 ; Vowel_Dependent # Mn KHOJKI VOWEL SIGN VOCALIC R +112E0..112E2 ; Vowel_Dependent # Mc [3] KHUDAWADI VOWEL SIGN AA..KHUDAWADI VOWEL SIGN II +112E3..112E8 ; Vowel_Dependent # Mn [6] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN AU +1133E..1133F ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11340 ; Vowel_Dependent # Mn GRANTHA VOWEL SIGN II +11341..11344 ; Vowel_Dependent # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +11347..11348 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +1134B..1134C ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +11357 ; Vowel_Dependent # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435..11437 ; Vowel_Dependent # Mc [3] NEWA VOWEL SIGN AA..NEWA VOWEL SIGN II +11438..1143F ; Vowel_Dependent # Mn [8] NEWA VOWEL SIGN U..NEWA VOWEL SIGN AI +11440..11441 ; Vowel_Dependent # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +114B0..114B2 ; Vowel_Dependent # Mc [3] TIRHUTA VOWEL SIGN AA..TIRHUTA VOWEL SIGN II +114B3..114B8 ; Vowel_Dependent # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN 
VOCALIC LL +114B9 ; Vowel_Dependent # Mc TIRHUTA VOWEL SIGN E +114BA ; Vowel_Dependent # Mn TIRHUTA VOWEL SIGN SHORT E +114BB..114BE ; Vowel_Dependent # Mc [4] TIRHUTA VOWEL SIGN AI..TIRHUTA VOWEL SIGN AU +115AF..115B1 ; Vowel_Dependent # Mc [3] SIDDHAM VOWEL SIGN AA..SIDDHAM VOWEL SIGN II +115B2..115B5 ; Vowel_Dependent # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115B8..115BB ; Vowel_Dependent # Mc [4] SIDDHAM VOWEL SIGN E..SIDDHAM VOWEL SIGN AU +115DC..115DD ; Vowel_Dependent # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11630..11632 ; Vowel_Dependent # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +11633..1163A ; Vowel_Dependent # Mn [8] MODI VOWEL SIGN U..MODI VOWEL SIGN AI +1163B..1163C ; Vowel_Dependent # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +11640 ; Vowel_Dependent # Mn MODI SIGN ARDHACANDRA +116AD ; Vowel_Dependent # Mn TAKRI VOWEL SIGN AA +116AE..116AF ; Vowel_Dependent # Mc [2] TAKRI VOWEL SIGN I..TAKRI VOWEL SIGN II +116B0..116B5 ; Vowel_Dependent # Mn [6] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN AU +11720..11721 ; Vowel_Dependent # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +11722..11725 ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN I..AHOM VOWEL SIGN UU +11726 ; Vowel_Dependent # Mc AHOM VOWEL SIGN E +11727..1172A ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN AW..AHOM VOWEL SIGN AM +1182C..1182E ; Vowel_Dependent # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II +1182F..11836 ; Vowel_Dependent # Mn [8] DOGRA VOWEL SIGN U..DOGRA VOWEL SIGN AU +11930..11935 ; Vowel_Dependent # Mc [6] DIVES AKURU VOWEL SIGN AA..DIVES AKURU VOWEL SIGN E +11937..11938 ; Vowel_Dependent # Mc [2] DIVES AKURU VOWEL SIGN AI..DIVES AKURU VOWEL SIGN O +119D1..119D3 ; Vowel_Dependent # Mc [3] NANDINAGARI VOWEL SIGN AA..NANDINAGARI VOWEL SIGN II +119D4..119D7 ; Vowel_Dependent # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR +119DA..119DB ; Vowel_Dependent # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI 
+119DC..119DD ; Vowel_Dependent # Mc [2] NANDINAGARI VOWEL SIGN O..NANDINAGARI VOWEL SIGN AU +119E4 ; Vowel_Dependent # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E +11A01..11A0A ; Vowel_Dependent # Mn [10] ZANABAZAR SQUARE VOWEL SIGN I..ZANABAZAR SQUARE VOWEL LENGTH MARK +11A51..11A56 ; Vowel_Dependent # Mn [6] SOYOMBO VOWEL SIGN I..SOYOMBO VOWEL SIGN OE +11A57..11A58 ; Vowel_Dependent # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A59..11A5B ; Vowel_Dependent # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11C2F ; Vowel_Dependent # Mc BHAIKSUKI VOWEL SIGN AA +11C30..11C36 ; Vowel_Dependent # Mn [7] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN VOCALIC L +11C38..11C3B ; Vowel_Dependent # Mn [4] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI VOWEL SIGN AU +11CB0 ; Vowel_Dependent # Mn MARCHEN VOWEL SIGN AA +11CB1 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN I +11CB2..11CB3 ; Vowel_Dependent # Mn [2] MARCHEN VOWEL SIGN U..MARCHEN VOWEL SIGN E +11CB4 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN O +11D31..11D36 ; Vowel_Dependent # Mn [6] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN VOCALIC R +11D3A ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Vowel_Dependent # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN AU +11D43 ; Vowel_Dependent # Mn MASARAM GONDI SIGN CANDRA +11D8A..11D8E ; Vowel_Dependent # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D90..11D91 ; Vowel_Dependent # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI +11D93..11D94 ; Vowel_Dependent # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11EF3..11EF4 ; Vowel_Dependent # Mn [2] MAKASAR VOWEL SIGN I..MAKASAR VOWEL SIGN U +11EF5..11EF6 ; Vowel_Dependent # Mc [2] MAKASAR VOWEL SIGN E..MAKASAR VOWEL SIGN O +11F34..11F35 ; Vowel_Dependent # Mc [2] KAWI VOWEL SIGN AA..KAWI VOWEL SIGN ALTERNATE AA +11F36..11F3A ; Vowel_Dependent # Mn [5] KAWI VOWEL SIGN 
I..KAWI VOWEL SIGN VOCALIC R +11F3E..11F3F ; Vowel_Dependent # Mc [2] KAWI VOWEL SIGN E..KAWI VOWEL SIGN AI +11F40 ; Vowel_Dependent # Mn KAWI VOWEL SIGN EU + +# ================================================ + +# Indic_Syllabic_Category=Vowel + +# (Other) Vowels (reanalyzed as ordinary alphabetic letters or marks) + +# [Not derivable] + +1963..196D ; Vowel # Lo [11] TAI LE LETTER A..TAI LE LETTER AI +A85E..A861 ; Vowel # Lo [4] PHAGS-PA LETTER I..PHAGS-PA LETTER O +A866 ; Vowel # Lo PHAGS-PA LETTER EE +A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO +A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O +11150..11154 ; Vowel # Lo [5] MAHAJANI LETTER A..MAHAJANI LETTER O + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Placeholder + +# Consonant Placeholder +# This includes generic placeholders used for +# Indic script layout (NBSP and dotted circle), as well as a few script- +# specific vowel-holder characters which are not technically +# consonants, but serve instead as bases for placement of vowel marks. 
+ +# [Not derivable] + +002D ; Consonant_Placeholder # Pd HYPHEN-MINUS +00A0 ; Consonant_Placeholder # Zs NO-BREAK SPACE +00D7 ; Consonant_Placeholder # Sm MULTIPLICATION SIGN +0980 ; Consonant_Placeholder # Lo BENGALI ANJI +0A72..0A73 ; Consonant_Placeholder # Lo [2] GURMUKHI IRI..GURMUKHI URA +104B ; Consonant_Placeholder # Po MYANMAR SIGN SECTION +104E ; Consonant_Placeholder # Po MYANMAR SYMBOL AFOREMENTIONED +1900 ; Consonant_Placeholder # Lo LIMBU VOWEL-CARRIER LETTER +1CFA ; Consonant_Placeholder # Lo VEDIC SIGN DOUBLE ANUSVARA ANTARGOMUKHA +2010..2014 ; Consonant_Placeholder # Pd [5] HYPHEN..EM DASH +25CC ; Consonant_Placeholder # So DOTTED CIRCLE +AA74..AA76 ; Consonant_Placeholder # Lo [3] MYANMAR LOGOGRAM KHAMTI OAY..MYANMAR LOGOGRAM KHAMTI HM +11A3F ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL HEAD MARK +11A45 ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL DOUBLE-LINED HEAD MARK +11EF2 ; Consonant_Placeholder # Lo MAKASAR ANGKA + +# ================================================ + +# Indic_Syllabic_Category=Consonant + +# Consonant (ordinary abugida consonants, with inherent vowels) + +# [Not derivable] + +0915..0939 ; Consonant # Lo [37] DEVANAGARI LETTER KA..DEVANAGARI LETTER HA +0958..095F ; Consonant # Lo [8] DEVANAGARI LETTER QA..DEVANAGARI LETTER YYA +0978..097F ; Consonant # Lo [8] DEVANAGARI LETTER MARWARI DDA..DEVANAGARI LETTER BBA +0995..09A8 ; Consonant # Lo [20] BENGALI LETTER KA..BENGALI LETTER NA +09AA..09B0 ; Consonant # Lo [7] BENGALI LETTER PA..BENGALI LETTER RA +09B2 ; Consonant # Lo BENGALI LETTER LA +09B6..09B9 ; Consonant # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA +09DC..09DD ; Consonant # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA +09DF ; Consonant # Lo BENGALI LETTER YYA +09F0..09F1 ; Consonant # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH LOWER DIAGONAL +0A15..0A28 ; Consonant # Lo [20] GURMUKHI LETTER KA..GURMUKHI LETTER NA +0A2A..0A30 ; Consonant # Lo [7] GURMUKHI LETTER 
PA..GURMUKHI LETTER RA +0A32..0A33 ; Consonant # Lo [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA +0A35..0A36 ; Consonant # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA +0A38..0A39 ; Consonant # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA +0A59..0A5C ; Consonant # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA +0A5E ; Consonant # Lo GURMUKHI LETTER FA +0A95..0AA8 ; Consonant # Lo [20] GUJARATI LETTER KA..GUJARATI LETTER NA +0AAA..0AB0 ; Consonant # Lo [7] GUJARATI LETTER PA..GUJARATI LETTER RA +0AB2..0AB3 ; Consonant # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA +0AB5..0AB9 ; Consonant # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA +0AF9 ; Consonant # Lo GUJARATI LETTER ZHA +0B15..0B28 ; Consonant # Lo [20] ORIYA LETTER KA..ORIYA LETTER NA +0B2A..0B30 ; Consonant # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA +0B32..0B33 ; Consonant # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA +0B35..0B39 ; Consonant # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA +0B5C..0B5D ; Consonant # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA +0B5F ; Consonant # Lo ORIYA LETTER YYA +0B71 ; Consonant # Lo ORIYA LETTER WA +0B95 ; Consonant # Lo TAMIL LETTER KA +0B99..0B9A ; Consonant # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA +0B9C ; Consonant # Lo TAMIL LETTER JA +0B9E..0B9F ; Consonant # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA +0BA3..0BA4 ; Consonant # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA +0BA8..0BAA ; Consonant # Lo [3] TAMIL LETTER NA..TAMIL LETTER PA +0BAE..0BB9 ; Consonant # Lo [12] TAMIL LETTER MA..TAMIL LETTER HA +0C15..0C28 ; Consonant # Lo [20] TELUGU LETTER KA..TELUGU LETTER NA +0C2A..0C39 ; Consonant # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C58..0C5A ; Consonant # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C95..0CA8 ; Consonant # Lo [20] KANNADA LETTER KA..KANNADA LETTER NA +0CAA..0CB3 ; Consonant # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA +0CB5..0CB9 ; Consonant # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA +0CDE ; Consonant # Lo KANNADA LETTER FA +0D15..0D3A ; 
Consonant # Lo [38] MALAYALAM LETTER KA..MALAYALAM LETTER TTTA +0D9A..0DB1 ; Consonant # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA +0DB3..0DBB ; Consonant # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA +0DBD ; Consonant # Lo SINHALA LETTER DANTAJA LAYANNA +0DC0..0DC6 ; Consonant # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA +0E01..0E2E ; Consonant # Lo [46] THAI CHARACTER KO KAI..THAI CHARACTER HO NOKHUK +0E81..0E82 ; Consonant # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG +0E84 ; Consonant # Lo LAO LETTER KHO TAM +0E86..0E8A ; Consonant # Lo [5] LAO LETTER PALI GHA..LAO LETTER SO TAM +0E8C..0EA3 ; Consonant # Lo [24] LAO LETTER PALI JHA..LAO LETTER LO LING +0EA5 ; Consonant # Lo LAO LETTER LO LOOT +0EA7..0EAE ; Consonant # Lo [8] LAO LETTER WO..LAO LETTER HO TAM +0EDC..0EDF ; Consonant # Lo [4] LAO HO NO..LAO LETTER KHMU NYO +0F40..0F47 ; Consonant # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA +0F49..0F6C ; Consonant # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA +1000..1020 ; Consonant # Lo [33] MYANMAR LETTER KA..MYANMAR LETTER LLA +103F ; Consonant # Lo MYANMAR LETTER GREAT SA +1050..1051 ; Consonant # Lo [2] MYANMAR LETTER SHA..MYANMAR LETTER SSA +105A..105D ; Consonant # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE +1061 ; Consonant # Lo MYANMAR LETTER SGAW KAREN SHA +1065..1066 ; Consonant # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER WESTERN PWO KAREN PWA +106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA +1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA +108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA +1703..1711 ; Consonant # Lo [15] TAGALOG LETTER KA..TAGALOG LETTER HA +171F ; Consonant # Lo TAGALOG LETTER ARCHAIC RA +1723..1731 ; Consonant # Lo [15] HANUNOO LETTER KA..HANUNOO LETTER HA +1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA +1763..176C ; Consonant # 
Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA +176E..1770 ; Consonant # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA +1780..17A2 ; Consonant # Lo [35] KHMER LETTER KA..KHMER LETTER QA +1901..191E ; Consonant # Lo [30] LIMBU LETTER KA..LIMBU LETTER TRA +1950..1962 ; Consonant # Lo [19] TAI LE LETTER KA..TAI LE LETTER NA +1980..19AB ; Consonant # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI LUE LETTER LOW SUA +1A00..1A16 ; Consonant # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA +1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA +1A53..1A54 ; Consonant # Lo [2] TAI THAM LETTER LAE..TAI THAM LETTER GREAT SA +1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA +1B45..1B4C ; Consonant # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA +1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA +1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA +1BBB..1BBD ; Consonant # Lo [3] SUNDANESE LETTER REU..SUNDANESE LETTER BHA +1BC0..1BE3 ; Consonant # Lo [36] BATAK LETTER A..BATAK LETTER MBA +1C00..1C23 ; Consonant # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A +1C4D..1C4F ; Consonant # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA +A807..A80A ; Consonant # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO +A80C..A822 ; Consonant # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO +A840..A85D ; Consonant # Lo [30] PHAGS-PA LETTER KA..PHAGS-PA LETTER A +A862..A865 ; Consonant # Lo [4] PHAGS-PA LETTER QA..PHAGS-PA LETTER GGA +A869..A870 ; Consonant # Lo [8] PHAGS-PA LETTER TTA..PHAGS-PA LETTER ASPIRATED FA +A872 ; Consonant # Lo PHAGS-PA SUPERFIXED LETTER RA +A892..A8B3 ; Consonant # Lo [34] SAURASHTRA LETTER KA..SAURASHTRA LETTER LLA +A90A..A921 ; Consonant # Lo [24] KAYAH LI LETTER KA..KAYAH LI LETTER CA +A930..A946 ; Consonant # Lo [23] REJANG LETTER KA..REJANG LETTER A +A989..A98B ; Consonant # Lo [3] JAVANESE LETTER PA CEREK..JAVANESE LETTER NGA LELET RASWADI 
+A98F..A9B2 ; Consonant # Lo [36] JAVANESE LETTER KA..JAVANESE LETTER HA +A9E0..A9E4 ; Consonant # Lo [5] MYANMAR LETTER SHAN GHA..MYANMAR LETTER SHAN BHA +A9E7..A9EF ; Consonant # Lo [9] MYANMAR LETTER TAI LAING NYA..MYANMAR LETTER TAI LAING NNA +A9FA..A9FE ; Consonant # Lo [5] MYANMAR LETTER TAI LAING LLA..MYANMAR LETTER TAI LAING BHA +AA06..AA28 ; Consonant # Lo [35] CHAM LETTER KA..CHAM LETTER HA +AA60..AA6F ; Consonant # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA +AA71..AA73 ; Consonant # Lo [3] MYANMAR LETTER KHAMTI XA..MYANMAR LETTER KHAMTI RA +AA7A ; Consonant # Lo MYANMAR LETTER AITON RA +AA7E..AA7F ; Consonant # Lo [2] MYANMAR LETTER SHWE PALAUNG CHA..MYANMAR LETTER SHWE PALAUNG SHA +AA80..AAAF ; Consonant # Lo [48] TAI VIET LETTER LOW KO..TAI VIET LETTER HIGH O +AAE2..AAEA ; Consonant # Lo [9] MEETEI MAYEK LETTER CHA..MEETEI MAYEK LETTER SSA +ABC0..ABCD ; Consonant # Lo [14] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER HUK +ABD0 ; Consonant # Lo MEETEI MAYEK LETTER PHAM +ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTER BHAM +10A00 ; Consonant # Lo KHAROSHTHI LETTER A +10A10..10A13 ; Consonant # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA +10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA +10A19..10A35 ; Consonant # Lo [29] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER VHA +11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER OLD TAMIL NNNA +11075 ; Consonant # Lo BRAHMI LETTER OLD TAMIL LLA +1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA +11107..11126 ; Consonant # Lo [32] CHAKMA LETTER KAA..CHAKMA LETTER HAA +11144 ; Consonant # Lo CHAKMA LETTER LHAA +11147 ; Consonant # Lo CHAKMA LETTER VAA +11155..11172 ; Consonant # Lo [30] MAHAJANI LETTER KA..MAHAJANI LETTER RRA +11191..111B2 ; Consonant # Lo [34] SHARADA LETTER KA..SHARADA LETTER HA +11208..11211 ; Consonant # Lo [10] KHOJKI LETTER KA..KHOJKI LETTER JJA +11213..1122B ; Consonant # Lo [25] 
KHOJKI LETTER NYA..KHOJKI LETTER LLA +1123F ; Consonant # Lo KHOJKI LETTER QA +11284..11286 ; Consonant # Lo [3] MULTANI LETTER KA..MULTANI LETTER GA +11288 ; Consonant # Lo MULTANI LETTER GHA +1128A..1128D ; Consonant # Lo [4] MULTANI LETTER CA..MULTANI LETTER JJA +1128F..1129D ; Consonant # Lo [15] MULTANI LETTER NYA..MULTANI LETTER BA +1129F..112A8 ; Consonant # Lo [10] MULTANI LETTER BHA..MULTANI LETTER RHA +112BA..112DE ; Consonant # Lo [37] KHUDAWADI LETTER KA..KHUDAWADI LETTER HA +11315..11328 ; Consonant # Lo [20] GRANTHA LETTER KA..GRANTHA LETTER NA +1132A..11330 ; Consonant # Lo [7] GRANTHA LETTER PA..GRANTHA LETTER RA +11332..11333 ; Consonant # Lo [2] GRANTHA LETTER LA..GRANTHA LETTER LLA +11335..11339 ; Consonant # Lo [5] GRANTHA LETTER VA..GRANTHA LETTER HA +1140E..11434 ; Consonant # Lo [39] NEWA LETTER KA..NEWA LETTER HA +1148F..114AF ; Consonant # Lo [33] TIRHUTA LETTER KA..TIRHUTA LETTER HA +1158E..115AE ; Consonant # Lo [33] SIDDHAM LETTER KA..SIDDHAM LETTER HA +1160E..1162F ; Consonant # Lo [34] MODI LETTER KA..MODI LETTER LLA +1168A..116AA ; Consonant # Lo [33] TAKRI LETTER KA..TAKRI LETTER RRA +116B8 ; Consonant # Lo TAKRI LETTER ARCHAIC KHA +11700..1171A ; Consonant # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA +11740..11746 ; Consonant # Lo [7] AHOM LETTER CA..AHOM LETTER LLA +1180A..1182B ; Consonant # Lo [34] DOGRA LETTER KA..DOGRA LETTER RRA +1190C..11913 ; Consonant # Lo [8] DIVES AKURU LETTER KA..DIVES AKURU LETTER JA +11915..11916 ; Consonant # Lo [2] DIVES AKURU LETTER NYA..DIVES AKURU LETTER TTA +11918..1192F ; Consonant # Lo [24] DIVES AKURU LETTER DDA..DIVES AKURU LETTER ZA +119AE..119D0 ; Consonant # Lo [35] NANDINAGARI LETTER KA..NANDINAGARI LETTER RRA +11A0B..11A32 ; Consonant # Lo [40] ZANABAZAR SQUARE LETTER KA..ZANABAZAR SQUARE LETTER KSSA +11A5C..11A83 ; Consonant # Lo [40] SOYOMBO LETTER KA..SOYOMBO LETTER KSSA +11C0E..11C2E ; Consonant # Lo [33] BHAIKSUKI LETTER KA..BHAIKSUKI LETTER HA +11C72..11C8F ; Consonant # Lo 
[30] MARCHEN LETTER KA..MARCHEN LETTER A +11D0C..11D30 ; Consonant # Lo [37] MASARAM GONDI LETTER KA..MASARAM GONDI LETTER TRA +11D6C..11D89 ; Consonant # Lo [30] GUNJALA GONDI LETTER YA..GUNJALA GONDI LETTER SA +11EE0..11EF1 ; Consonant # Lo [18] MAKASAR LETTER KA..MAKASAR LETTER A +11F12..11F33 ; Consonant # Lo [34] KAWI LETTER KA..KAWI LETTER JNYA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Dead + +# Dead Consonant (special consonant with killed vowel) + +# [Not derivable] + +09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0C5D ; Consonant_Dead # Lo TELUGU LETTER NAKAARA POLLU +0CDD ; Consonant_Dead # Lo KANNADA LETTER NAKAARA POLLU +0D54..0D56 ; Consonant_Dead # Lo [3] MALAYALAM LETTER CHILLU M..MALAYALAM LETTER CHILLU LLL +0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K +1CF2..1CF3 ; Consonant_Dead # Lo [2] VEDIC SIGN ARDHAVISARGA..VEDIC SIGN ROTATED ARDHAVISARGA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_With_Stacker + +# Consonants that may make stacked ligatures with the next consonant +# without the use of a virama + +# [Not derivable] + +0CF1..0CF2 ; Consonant_With_Stacker # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA +1CF5..1CF6 ; Consonant_With_Stacker # Lo [2] VEDIC SIGN JIHVAMULIYA..VEDIC SIGN UPADHMANIYA +11003..11004 ; Consonant_With_Stacker # Lo [2] BRAHMI SIGN JIHVAMULIYA..BRAHMI SIGN UPADHMANIYA +11460..11461 ; Consonant_With_Stacker # Lo [2] NEWA SIGN JIHVAMULIYA..NEWA SIGN UPADHMANIYA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Prefixed + +# Cluster-initial consonants + +# [Not derivable] + +111C2..111C3 ; Consonant_Prefixed # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA +1193F ; Consonant_Prefixed # Lo DIVES AKURU PREFIXED NASAL SIGN +11A3A ; Consonant_Prefixed # Lo ZANABAZAR SQUARE CLUSTER-INITIAL LETTER RA +11A84..11A89 ; 
Consonant_Prefixed # Lo [6] SOYOMBO SIGN JIHVAMULIYA..SOYOMBO CLUSTER-INITIAL LETTER SA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Preceding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when preceding the main +# consonant. + +# [Not derivable] + +0D4E ; Consonant_Preceding_Repha # Lo MALAYALAM LETTER DOT REPH +11941 ; Consonant_Preceding_Repha # Lo DIVES AKURU INITIAL RA +11D46 ; Consonant_Preceding_Repha # Lo MASARAM GONDI REPHA +11F02 ; Consonant_Preceding_Repha # Lo KAWI SIGN REPHA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Initial_Postfixed + +# Consonants that succeed the main consonant in character sequences, but are +# pronounced before it. + +# [Not derivable] + +1A5A ; Consonant_Initial_Postfixed # Mn TAI THAM CONSONANT SIGN LOW PA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Succeeding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when succeeding the main +# consonant. + +# [Not derivable] + +17CC ; Consonant_Succeeding_Repha # Mn KHMER SIGN ROBAT + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Subjoined + +# Subjoined Consonant (C2 form subtending a base consonant in Tibetan, etc.) 
+ +# [Not derivable] + +0F8D..0F97 ; Consonant_Subjoined # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Consonant_Subjoined # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +1929..192B ; Consonant_Subjoined # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1A57 ; Consonant_Subjoined # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A5B..1A5E ; Consonant_Subjoined # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1BA1 ; Consonant_Subjoined # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA2..1BA3 ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BAC..1BAD ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C24..1C25 ; Consonant_Subjoined # Mc [2] LEPCHA SUBJOINED LETTER YA..LEPCHA SUBJOINED LETTER RA +A867..A868 ; Consonant_Subjoined # Lo [2] PHAGS-PA SUBJOINED LETTER WA..PHAGS-PA SUBJOINED LETTER YA +A871 ; Consonant_Subjoined # Lo PHAGS-PA SUBJOINED LETTER RA +11C92..11CA7 ; Consonant_Subjoined # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CA9 ; Consonant_Subjoined # Mc MARCHEN SUBJOINED LETTER YA +11CAA..11CAF ; Consonant_Subjoined # Mn [6] MARCHEN SUBJOINED LETTER RA..MARCHEN SUBJOINED LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Medial + +# Medial Consonant (medial liquid, occurring in clusters) + +# [Not derivable] + +0A75 ; Consonant_Medial # Mn GURMUKHI SIGN YAKASH +0EBC ; Consonant_Medial # Mn LAO SEMIVOWEL SIGN LO +0EBD ; Consonant_Medial # Lo LAO SEMIVOWEL SIGN NYO +103B..103C ; Consonant_Medial # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA +103D..103E ; Consonant_Medial # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +105E..1060 ; Consonant_Medial # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT 
SIGN MON MEDIAL LA +1082 ; Consonant_Medial # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +1A55 ; Consonant_Medial # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A56 ; Consonant_Medial # Mn TAI THAM CONSONANT SIGN MEDIAL LA +A8B4 ; Consonant_Medial # Mc SAURASHTRA CONSONANT SIGN HAARU +A9BD ; Consonant_Medial # Mn JAVANESE CONSONANT SIGN KERET +A9BE..A9BF ; Consonant_Medial # Mc [2] JAVANESE CONSONANT SIGN PENGKAL..JAVANESE CONSONANT SIGN CAKRA +AA33..AA34 ; Consonant_Medial # Mc [2] CHAM CONSONANT SIGN YA..CHAM CONSONANT SIGN RA +AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +1171D..1171F ; Consonant_Medial # Mn [3] AHOM CONSONANT SIGN MEDIAL LA..AHOM CONSONANT SIGN MEDIAL LIGATING RA +11940 ; Consonant_Medial # Mc DIVES AKURU MEDIAL YA +11942 ; Consonant_Medial # Mc DIVES AKURU MEDIAL RA +11A3B..11A3E ; Consonant_Medial # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11D47 ; Consonant_Medial # Mn MASARAM GONDI RA-KARA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Final + +# Final Consonant (special final forms which do not take vowels) + +# [Not derivable] + +1930..1931 ; Consonant_Final # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Consonant_Final # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +1939 ; Consonant_Final # Mn LIMBU SIGN MUKPHRENG +19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B +1A58..1A59 ; Consonant_Final # Mn [2] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN FINAL NGA +1B03 ; Consonant_Final # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Final # Mn SUNDANESE SIGN PANGLAYAR +1BBE..1BBF ; Consonant_Final # Lo [2] SUNDANESE LETTER FINAL K..SUNDANESE LETTER FINAL M +1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H +1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +A94F..A951 ; 
Consonant_Final # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A952 ; Consonant_Final # Mc REJANG CONSONANT SIGN H +A982 ; Consonant_Final # Mn JAVANESE SIGN LAYAR +AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG +AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG +AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS +AA4C ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL M +AA4D ; Consonant_Final # Mc CHAM CONSONANT SIGN FINAL H +ABDB..ABE2 ; Consonant_Final # Lo [8] MEETEI MAYEK LETTER KOK LONSUM..MEETEI MAYEK LETTER I LONSUM +11A8A..11A95 ; Consonant_Final # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Head_Letter + +# Head Letter (Tibetan) + +# [Not derivable] + +0F88..0F8C ; Consonant_Head_Letter # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN + +# ================================================ + +# Indic_Syllabic_Category=Modifying_Letter + +# Reanalyzed letters not participating in the abugida structure, but +# serving to modify the sound of an adjacent vowel or consonant. +# Note that this is not the same as General_Category=Modifier_Letter. 
+ +# [Not derivable] + +0B83 ; Modifying_Letter # Lo TAMIL SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Tone_Letter + +# Tone Letter (spacing lexical tone mark with status as a letter) + +# [Not derivable] + +1970..1974 ; Tone_Letter # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6 +AAC0 ; Tone_Letter # Lo TAI VIET TONE MAI NUENG +AAC2 ; Tone_Letter # Lo TAI VIET TONE MAI SONG + +# ================================================ + +# Indic_Syllabic_Category=Tone_Mark + +# Tone Mark (nonspacing or spacing lexical tone mark) + +# [Not derivable] + +0E48..0E4B ; Tone_Mark # Mn [4] THAI CHARACTER MAI EK..THAI CHARACTER MAI CHATTAWA +0EC8..0ECB ; Tone_Mark # Mn [4] LAO TONE MAI EK..LAO TONE MAI CATAWA +1037 ; Tone_Mark # Mn MYANMAR SIGN DOT BELOW +1063..1064 ; Tone_Mark # Mc [2] MYANMAR TONE MARK SGAW KAREN HATHI..MYANMAR TONE MARK SGAW KAREN KE PHO +1069..106D ; Tone_Mark # Mc [5] MYANMAR SIGN WESTERN PWO KAREN TONE-1..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1087..108C ; Tone_Mark # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108D ; Tone_Mark # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +108F ; Tone_Mark # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109B ; Tone_Mark # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 +19C8..19C9 ; Tone_Mark # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A75..1A79 ; Tone_Mark # Mn [5] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN TONE-5 +A92B..A92D ; Tone_Mark # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +AA7B ; Tone_Mark # Mc MYANMAR SIGN PAO KAREN TONE +AA7C ; Tone_Mark # Mn MYANMAR SIGN TAI LAING TONE-2 +AA7D ; Tone_Mark # Mc MYANMAR SIGN TAI LAING TONE-5 +AABF ; Tone_Mark # Mn TAI VIET TONE MAI EK +AAC1 ; Tone_Mark # Mn TAI VIET TONE MAI THO +ABEC ; Tone_Mark # Mc MEETEI MAYEK LUM IYEK + +# ================================================ + +# Indic_Syllabic_Category=Gemination_Mark + +# Gemination Mark (doubling of the 
preceding or following consonant) +# +# U+0A71 GURMUKHI ADDAK precedes the consonant it geminates, while the +# others follow the consonant they geminate. + +# [Not derivable] + +0A71 ; Gemination_Mark # Mn GURMUKHI ADDAK +0AFB ; Gemination_Mark # Mn GUJARATI SIGN SHADDA +11237 ; Gemination_Mark # Mn KHOJKI SIGN SHADDA +11A98 ; Gemination_Mark # Mn SOYOMBO GEMINATION MARK + +# ================================================ + +# Indic_Syllabic_Category=Cantillation_Mark + +# Cantillation Mark (recitation marks, such as svara markers for the Samaveda) + +# [Not derivable] + +0951..0952 ; Cantillation_Mark # Mn [2] DEVANAGARI STRESS SIGN UDATTA..DEVANAGARI STRESS SIGN ANUDATTA +0A51 ; Cantillation_Mark # Mn GURMUKHI SIGN UDAAT +0AFA ; Cantillation_Mark # Mn GUJARATI SIGN SUKUN +0AFC ; Cantillation_Mark # Mn GUJARATI SIGN MADDAH +1CD0..1CD2 ; Cantillation_Mark # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CD4..1CE0 ; Cantillation_Mark # Mn [13] VEDIC SIGN YAJURVEDIC MIDLINE SVARITA..VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CE1 ; Cantillation_Mark # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF4 ; Cantillation_Mark # Mn VEDIC TONE CANDRA ABOVE +1CF7 ; Cantillation_Mark # Mc VEDIC SIGN ATIKRAMA +1CF8..1CF9 ; Cantillation_Mark # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE +20F0 ; Cantillation_Mark # Mn COMBINING ASTERISK ABOVE +A8E0..A8F1 ; Cantillation_Mark # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +1123E ; Cantillation_Mark # Mn KHOJKI SIGN SUKUN +11366..1136C ; Cantillation_Mark # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Cantillation_Mark # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA + +# ================================================ + +# Indic_Syllabic_Category=Register_Shifter + +# Register Shifter (shifts register for consonants, akin to a tone mark) + +# [Not derivable] + +17C9..17CA ; Register_Shifter # Mn [2] KHMER SIGN 
MUUSIKATOAN..KHMER SIGN TRIISAP + +# ================================================ + +# Indic_Syllabic_Category=Syllable_Modifier + +# Syllable Modifier (miscellaneous combining characters that modify +# something in the orthographic syllable they succeed or appear in) + +# [Not derivable] + +00B2..00B3 ; Syllable_Modifier # No [2] SUPERSCRIPT TWO..SUPERSCRIPT THREE +09FE ; Syllable_Modifier # Mn BENGALI SANDHI MARK +0ECE ; Syllable_Modifier # Mn LAO YAMAKKAN +0F35 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0FC6 ; Syllable_Modifier # Mn TIBETAN SYMBOL PADMA GDAN +17CB ; Syllable_Modifier # Mn KHMER SIGN BANTOC +17CE..17D0 ; Syllable_Modifier # Mn [3] KHMER SIGN KAKABAT..KHMER SIGN SAMYOK SANNYA +17D3 ; Syllable_Modifier # Mn KHMER SIGN BATHAMASAT +17DD ; Syllable_Modifier # Mn KHMER SIGN ATTHACAN +193B ; Syllable_Modifier # Mn LIMBU SIGN SA-I +1A7B..1A7C ; Syllable_Modifier # Mn [2] TAI THAM SIGN MAI SAM..TAI THAM SIGN KHUEN-LUE KARAN +1A7F ; Syllable_Modifier # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1C36 ; Syllable_Modifier # Mn LEPCHA SIGN RAN +1DFB ; Syllable_Modifier # Mn COMBINING DELETION MARK +2074 ; Syllable_Modifier # No SUPERSCRIPT FOUR +2082..2084 ; Syllable_Modifier # No [3] SUBSCRIPT TWO..SUBSCRIPT FOUR +111C9 ; Syllable_Modifier # Mn SHARADA SANDHI MARK +1145E ; Syllable_Modifier # Mn NEWA SANDHI MARK +11A33 ; Syllable_Modifier # Mn ZANABAZAR SQUARE FINAL CONSONANT MARK + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Killer + +# Consonant Killer (signifies that the previous consonant or consonants are +# not pronounced) + +# [Not derivable] + +0E4C ; Consonant_Killer # Mn THAI CHARACTER THANTHAKHAT +17CD ; Consonant_Killer # Mn KHMER SIGN TOANDAKHIAT + +# ================================================ + +# Indic_Syllabic_Category=Non_Joiner + +# Non_Joiner (Zero Width Non-Joiner) + +# [Not derivable] + +200C ; Non_Joiner 
# Cf ZERO WIDTH NON-JOINER + +# ================================================ + +# Indic_Syllabic_Category=Joiner + +# Joiner (Zero Width Joiner) + +# [Not derivable] + +200D ; Joiner # Cf ZERO WIDTH JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number_Joiner + +# Number_Joiner (forms ligatures between numbers for multiplication) + +# [Not derivable] + +1107F ; Number_Joiner # Mn BRAHMI NUMBER JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number + +# Number (can be used as vowel-holders like consonant placeholders) +# Note: A number may even hold subjoined consonants which may in turn +# have been formed using a virama or a stacker, e.g. the sequence +# where THAI THAM LETTER LOW TA is subjoined to +# TAI THAM THAM DIGIT THREE using an invisible stacker. + +# [Not derivable] + +0030..0039 ; Number # Nd [10] DIGIT ZERO..DIGIT NINE +0966..096F ; Number # Nd [10] DEVANAGARI DIGIT ZERO..DEVANAGARI DIGIT NINE +09E6..09EF ; Number # Nd [10] BENGALI DIGIT ZERO..BENGALI DIGIT NINE +0A66..0A6F ; Number # Nd [10] GURMUKHI DIGIT ZERO..GURMUKHI DIGIT NINE +0AE6..0AEF ; Number # Nd [10] GUJARATI DIGIT ZERO..GUJARATI DIGIT NINE +0B66..0B6F ; Number # Nd [10] ORIYA DIGIT ZERO..ORIYA DIGIT NINE +0BE6..0BEF ; Number # Nd [10] TAMIL DIGIT ZERO..TAMIL DIGIT NINE +0C66..0C6F ; Number # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE +0CE6..0CEF ; Number # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE +0D66..0D6F ; Number # Nd [10] MALAYALAM DIGIT ZERO..MALAYALAM DIGIT NINE +0DE6..0DEF ; Number # Nd [10] SINHALA LITH DIGIT ZERO..SINHALA LITH DIGIT NINE +0E50..0E59 ; Number # Nd [10] THAI DIGIT ZERO..THAI DIGIT NINE +0ED0..0ED9 ; Number # Nd [10] LAO DIGIT ZERO..LAO DIGIT NINE +0F20..0F29 ; Number # Nd [10] TIBETAN DIGIT ZERO..TIBETAN DIGIT NINE +0F2A..0F33 ; Number # No [10] TIBETAN DIGIT HALF ONE..TIBETAN DIGIT HALF ZERO +1040..1049 ; Number # Nd [10] MYANMAR DIGIT ZERO..MYANMAR DIGIT NINE 
+1090..1099 ; Number # Nd [10] MYANMAR SHAN DIGIT ZERO..MYANMAR SHAN DIGIT NINE +17E0..17E9 ; Number # Nd [10] KHMER DIGIT ZERO..KHMER DIGIT NINE +1946..194F ; Number # Nd [10] LIMBU DIGIT ZERO..LIMBU DIGIT NINE +19D0..19D9 ; Number # Nd [10] NEW TAI LUE DIGIT ZERO..NEW TAI LUE DIGIT NINE +19DA ; Number # No NEW TAI LUE THAM DIGIT ONE +1A80..1A89 ; Number # Nd [10] TAI THAM HORA DIGIT ZERO..TAI THAM HORA DIGIT NINE +1A90..1A99 ; Number # Nd [10] TAI THAM THAM DIGIT ZERO..TAI THAM THAM DIGIT NINE +1B50..1B59 ; Number # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE +1BB0..1BB9 ; Number # Nd [10] SUNDANESE DIGIT ZERO..SUNDANESE DIGIT NINE +1C40..1C49 ; Number # Nd [10] LEPCHA DIGIT ZERO..LEPCHA DIGIT NINE +A8D0..A8D9 ; Number # Nd [10] SAURASHTRA DIGIT ZERO..SAURASHTRA DIGIT NINE +A900..A909 ; Number # Nd [10] KAYAH LI DIGIT ZERO..KAYAH LI DIGIT NINE +A9D0..A9D9 ; Number # Nd [10] JAVANESE DIGIT ZERO..JAVANESE DIGIT NINE +A9F0..A9F9 ; Number # Nd [10] MYANMAR TAI LAING DIGIT ZERO..MYANMAR TAI LAING DIGIT NINE +AA50..AA59 ; Number # Nd [10] CHAM DIGIT ZERO..CHAM DIGIT NINE +ABF0..ABF9 ; Number # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE +10A40..10A48 ; Number # No [9] KHAROSHTHI DIGIT ONE..KHAROSHTHI FRACTION ONE HALF +11066..1106F ; Number # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11136..1113F ; Number # Nd [10] CHAKMA DIGIT ZERO..CHAKMA DIGIT NINE +111D0..111D9 ; Number # Nd [10] SHARADA DIGIT ZERO..SHARADA DIGIT NINE +111E1..111F4 ; Number # No [20] SINHALA ARCHAIC DIGIT ONE..SINHALA ARCHAIC NUMBER ONE THOUSAND +112F0..112F9 ; Number # Nd [10] KHUDAWADI DIGIT ZERO..KHUDAWADI DIGIT NINE +11450..11459 ; Number # Nd [10] NEWA DIGIT ZERO..NEWA DIGIT NINE +114D0..114D9 ; Number # Nd [10] TIRHUTA DIGIT ZERO..TIRHUTA DIGIT NINE +11650..11659 ; Number # Nd [10] MODI DIGIT ZERO..MODI DIGIT NINE +116C0..116C9 ; Number # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE +11730..11739 ; Number # Nd [10] AHOM DIGIT ZERO..AHOM DIGIT NINE +1173A..1173B ; Number # 
No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY +11950..11959 ; Number # Nd [10] DIVES AKURU DIGIT ZERO..DIVES AKURU DIGIT NINE +11C50..11C59 ; Number # Nd [10] BHAIKSUKI DIGIT ZERO..BHAIKSUKI DIGIT NINE +11C5A..11C6C ; Number # No [19] BHAIKSUKI NUMBER ONE..BHAIKSUKI HUNDREDS UNIT MARK +11D50..11D59 ; Number # Nd [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE +11DA0..11DA9 ; Number # Nd [10] GUNJALA GONDI DIGIT ZERO..GUNJALA GONDI DIGIT NINE +11F50..11F59 ; Number # Nd [10] KAWI DIGIT ZERO..KAWI DIGIT NINE + +# ================================================ + +# Indic_Syllabic_Category=Brahmi_Joining_Number + +# Brahmi Joining Number (may be joined by a Number_Joiner of the same +# script, e.g. in Brahmi) +# +# Note: These are different from Numbers, in the way that there is no known +# evidence of Brahmi Joining Numbers taking vowels or subjoined consonants. +# Until such evidence is found, implementations may assume that Brahmi +# Joining Numbers only participate in shaping with other Brahmi Joining +# Numbers. + +# [Not derivable] + +11052..11065 ; Brahmi_Joining_Number # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND + +# EOF diff --git a/data/15.1.0-indic-positional-category.txt b/data/15.1.0-indic-positional-category.txt new file mode 100644 index 0000000..a7c5aef --- /dev/null +++ b/data/15.1.0-indic-positional-category.txt @@ -0,0 +1,808 @@ +# IndicPositionalCategory-15.1.0.txt +# Date: 2023-01-05 +# © 2023 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use, see https://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at https://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Positional_Category enumerated property +# +# Scope: This property is aimed at the problem of +# the specification of syllabic structure for Indic scripts. 
+# Because dependent vowels (matras), visible viramas, and other +# characters are placed in notional slots around the consonant (or +# consonant cluster) core of an Indic syllable, there may be +# cooccurrence constraints or other interactions. Also, it may be +# desirable, in cases where more than one such character may occur in +# sequence, as for example, in a top slot and a bottom slot, to +# specify preferred orders for spelling. As such, this property +# is designed primarily to supplement the Indic_Syllabic_Category +# property. +# +# In addition to combining marks associated with Indic scripts, the +# Indic_Positional_Category has non-trivial values for special signs +# associated with Indic_Syllabic_Category=Consonant_Prefixed +# or Indic_Syllabic_Category=Consonant_Preceding_Repha. Those signs +# have General_Category=Lo, rather than being combining marks. +# They occur in initial position in syllabic structure. However, when +# rendered, they appear as marks positioned with respect to another +# base letter (usually above it). Hence, having an explicit value for +# Indic_Positional_Category for those signs can be helpful. +# +# Note that this property is *not* intended as +# a prescriptive property regarding display or font design, +# for a number of reasons. Good font design requires information +# that is outside the context of a character encoding standard, +# and is best handled in other venues. For Indic dependent +# vowels and similar characters, in particular: +# +# 1. Matra placement may vary somewhat based on typeface design. +# 2. Matra placement, even within a single script, may vary +# somewhat according to historic period or local conventions. +# 3. Matra placement may be changed by explicit orthographic reform +# decisions. +# 4. Matras may ligate in various ways with a consonant (or even +# other elements of a syllable) instead of occurring in a +# discrete location. +# 5. Matra display may be contextually determined. 
This is +# notable, for example, in the Tamil script, where the shape +# and placement of -u and -uu vowels depends strongly on +# which consonant they adjoin. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Positional_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. +# +# The scripts assessed as containing dependent vowels or similar characters +# in the structural sense used for the Indic_Positional_Category are the +# following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dives Akuru, Dogra, Grantha, Gujarati, +# Gunjala Gondi, Gurmukhi, Hanunoo, Javanese, Kaithi, Kannada, Kawi, +# Kayah Li, Kharoshthi, Khmer, Khojki, Khudawadi, Lao, Lepcha, Limbu, +# Makasar, Malayalam, Marchen, Masaram Gondi, Meetei Mayek, Modi, +# Myanmar, Nandinagari, Newa, New Tai Lue, Oriya, Rejang, Saurashtra, +# Sharada, Siddham, Sinhala, Soyombo, Sundanese, Syloti Nagri, +# Tagalog, Tagbanwa, Tai Tham, Tai Viet, Takri, Tamil, Telugu, Thai, +# Tibetan, Tirhuta, and Zanabazar Square. +# +# All characters for all other scripts not in that list +# take the default value for this property. +# +# See IndicSyllabicCategory.txt for a slightly more extended +# list of Indic scripts, including those which do not have +# positional characters. Currently, those additional +# Indic scripts without positional characters are +# Multani, Phags-pa, and Tai Le. +# +# Notes: +# +# 1. The following characters are all assigned the positional category Right, +# but may have different positions in some cases: +# * U+0BC1 TAMIL VOWEL SIGN U and U+0BC2 TAMIL VOWEL SIGN UU have +# contextually variable placement in Tamil. 
+# * U+0D41 MALAYALAM VOWEL SIGN U and U+0D42 MALAYALAM VOWEL SIGN UU form +# complex ligatures with consonants in older Malayalam orthography. +# * U+11341 GRANTHA VOWEL SIGN U and U+11342 GRANTHA VOWEL SIGN UU have +# contextually variable placement in Grantha. +# * U+11440 NEWA VOWEL SIGN O and U+11441 NEWA VOWEL SIGN AU have contextually +# variable placement in Newa. +# +# 2. The following characters are all assigned the positional category Top, +# but may have different positions in some cases: +# * U+1143E NEWA VOWEL SIGN E and U+1143F NEWA VOWEL SIGN AI have contextually +# variable placement in Newa. +# +# 3. The following characters are all assigned the positional category Bottom, +# but may have different positions in some cases: +# * U+102F MYANMAR VOWEL SIGN U and U+1030 MYANMAR VOWEL SIGN UU have +# contextually variable placement in Myanmar. +# * U+1A69 TAI THAM VOWEL SIGN U and U+1A6A TAI THAM VOWEL SIGN UU have +# contextually variable placement in Tai Tham. +# +# 4. The following character is assigned the positional category Left, but +# may have different positions in different styles: +# * U+119D2 NANDINAGARI VOWEL SIGN I has stylistically variable placement +# in Nandinagari. + + +# ================================================ + +# Property: Indic_Positional_Category +# +# All code points not explicitly listed for Indic_Positional_Category +# have the value NA (not applicable). 
+# +# @missing: 0000..10FFFF; NA + +# ------------------------------------------------ + +# Indic_Positional_Category=Right + +0903 ; Right # Mc DEVANAGARI SIGN VISARGA +093B ; Right # Mc DEVANAGARI VOWEL SIGN OOE +093E ; Right # Mc DEVANAGARI VOWEL SIGN AA +0940 ; Right # Mc DEVANAGARI VOWEL SIGN II +0949..094C ; Right # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094F ; Right # Mc DEVANAGARI VOWEL SIGN AW +0982..0983 ; Right # Mc [2] BENGALI SIGN ANUSVARA..BENGALI SIGN VISARGA +09BE ; Right # Mc BENGALI VOWEL SIGN AA +09C0 ; Right # Mc BENGALI VOWEL SIGN II +09D7 ; Right # Mc BENGALI AU LENGTH MARK +0A03 ; Right # Mc GURMUKHI SIGN VISARGA +0A3E ; Right # Mc GURMUKHI VOWEL SIGN AA +0A40 ; Right # Mc GURMUKHI VOWEL SIGN II +0A83 ; Right # Mc GUJARATI SIGN VISARGA +0ABE ; Right # Mc GUJARATI VOWEL SIGN AA +0AC0 ; Right # Mc GUJARATI VOWEL SIGN II +0ACB..0ACC ; Right # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0B02..0B03 ; Right # Mc [2] ORIYA SIGN ANUSVARA..ORIYA SIGN VISARGA +0B3E ; Right # Mc ORIYA VOWEL SIGN AA +0B40 ; Right # Mc ORIYA VOWEL SIGN II +0BBE..0BBF ; Right # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC1..0BC2 ; Right # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BD7 ; Right # Mc TAMIL AU LENGTH MARK +0C01..0C03 ; Right # Mc [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN VISARGA +0C41..0C44 ; Right # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C82..0C83 ; Right # Mc [2] KANNADA SIGN ANUSVARA..KANNADA SIGN VISARGA +0CBE ; Right # Mc KANNADA VOWEL SIGN AA +0CC1..0CC4 ; Right # Mc [4] KANNADA VOWEL SIGN U..KANNADA VOWEL SIGN VOCALIC RR +0CD5..0CD6 ; Right # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CF3 ; Right # Mc KANNADA SIGN COMBINING ANUSVARA ABOVE RIGHT +0D02..0D03 ; Right # Mc [2] MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA +0D3E..0D40 ; Right # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D42 ; Right # Mn [2] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN UU 
+0D57 ; Right # Mc MALAYALAM AU LENGTH MARK +0D82..0D83 ; Right # Mc [2] SINHALA SIGN ANUSVARAYA..SINHALA SIGN VISARGAYA +0DCF..0DD1 ; Right # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD8 ; Right # Mc SINHALA VOWEL SIGN GAETTA-PILLA +0DDF ; Right # Mc SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Right # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Right # Lo THAI CHARACTER SARA A +0E32..0E33 ; Right # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E45 ; Right # Lo THAI CHARACTER LAKKHANGYAO +0EB0 ; Right # Lo LAO VOWEL SIGN A +0EB2..0EB3 ; Right # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0F3E ; Right # Mc TIBETAN SIGN YAR TSHES +0F7F ; Right # Mc TIBETAN SIGN RNAM BCAD +102B..102C ; Right # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +1038 ; Right # Mc MYANMAR SIGN VISARGA +103B ; Right # Mc MYANMAR CONSONANT SIGN MEDIAL YA +1056..1057 ; Right # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1062..1064 ; Right # Mc [3] MYANMAR VOWEL SIGN SGAW KAREN EU..MYANMAR TONE MARK SGAW KAREN KE PHO +1067..106D ; Right # Mc [7] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1083 ; Right # Mc MYANMAR VOWEL SIGN SHAN AA +1087..108C ; Right # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108F ; Right # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109C ; Right # Mc [3] MYANMAR SIGN KHAMTI TONE-1..MYANMAR VOWEL SIGN AITON A +1715 ; Right # Mc TAGALOG SIGN PAMUDPOD +1734 ; Right # Mc HANUNOO SIGN PAMUDPOD +17B6 ; Right # Mc KHMER VOWEL SIGN AA +17C7..17C8 ; Right # Mc [2] KHMER SIGN REAHMUK..KHMER SIGN YUUKALEAPINTU +1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI +1929..192B ; Right # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1930..1931 ; Right # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Right # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER 
LA +19B0..19B4 ; Right # Lo [5] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN UU +19B8..19B9 ; Right # Lo [2] NEW TAI LUE VOWEL SIGN OA..NEW TAI LUE VOWEL SIGN UE +19BB..19C0 ; Right # Lo [6] NEW TAI LUE VOWEL SIGN AAY..NEW TAI LUE VOWEL SIGN IY +19C8..19C9 ; Right # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A1A ; Right # Mc BUGINESE VOWEL SIGN O +1A57 ; Right # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A61 ; Right # Mc TAI THAM VOWEL SIGN A +1A63..1A64 ; Right # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A6D ; Right # Mc TAI THAM VOWEL SIGN OY +1B04 ; Right # Mc BALINESE SIGN BISAH +1B35 ; Right # Mc BALINESE VOWEL SIGN TEDUNG +1B44 ; Right # Mc BALINESE ADEG ADEG +1B82 ; Right # Mc SUNDANESE SIGN PANGWISAD +1BA1 ; Right # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA7 ; Right # Mc SUNDANESE VOWEL SIGN PANOLONG +1BAA ; Right # Mc SUNDANESE SIGN PAMAAEH +1BE7 ; Right # Mc BATAK VOWEL SIGN E +1BEA..1BEC ; Right # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BEE ; Right # Mc BATAK VOWEL SIGN U +1BF2..1BF3 ; Right # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +1C24..1C26 ; Right # Mc [3] LEPCHA SUBJOINED LETTER YA..LEPCHA VOWEL SIGN AA +1C2A..1C2B ; Right # Mc [2] LEPCHA VOWEL SIGN U..LEPCHA VOWEL SIGN UU +1CE1 ; Right # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF7 ; Right # Mc VEDIC SIGN ATIKRAMA +A823..A824 ; Right # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A827 ; Right # Mc SYLOTI NAGRI VOWEL SIGN OO +A880..A881 ; Right # Mc [2] SAURASHTRA SIGN ANUSVARA..SAURASHTRA SIGN VISARGA +A8B4..A8C3 ; Right # Mc [16] SAURASHTRA CONSONANT SIGN HAARU..SAURASHTRA VOWEL SIGN AU +A952..A953 ; Right # Mc [2] REJANG CONSONANT SIGN H..REJANG VIRAMA +A983 ; Right # Mc JAVANESE SIGN WIGNYAN +A9B4..A9B5 ; Right # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +AA33 ; Right # Mc CHAM CONSONANT SIGN YA +AA4D ; Right # Mc CHAM CONSONANT SIGN FINAL H +AA7B ; Right # Mc MYANMAR SIGN PAO KAREN TONE +AA7D 
; Right # Mc MYANMAR SIGN TAI LAING TONE-5 +AAB1 ; Right # Lo TAI VIET VOWEL AA +AABA ; Right # Lo TAI VIET VOWEL UA +AABD ; Right # Lo TAI VIET VOWEL AN +AAEF ; Right # Mc MEETEI MAYEK VOWEL SIGN AAU +AAF5 ; Right # Mc MEETEI MAYEK VOWEL SIGN VISARGA +ABE3..ABE4 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE6..ABE7 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE9..ABEA ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +ABEC ; Right # Mc MEETEI MAYEK LUM IYEK +11000 ; Right # Mc BRAHMI SIGN CANDRABINDU +11002 ; Right # Mc BRAHMI SIGN VISARGA +11082 ; Right # Mc KAITHI SIGN VISARGA +110B0 ; Right # Mc KAITHI VOWEL SIGN AA +110B2 ; Right # Mc KAITHI VOWEL SIGN II +110B7..110B8 ; Right # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11145..11146 ; Right # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +11182 ; Right # Mc SHARADA SIGN VISARGA +111B3 ; Right # Mc SHARADA VOWEL SIGN AA +111B5 ; Right # Mc SHARADA VOWEL SIGN II +111C0 ; Right # Mc SHARADA SIGN VIRAMA +1122C..1122E ; Right # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +11235 ; Right # Mc KHOJKI SIGN VIRAMA +112E0 ; Right # Mc KHUDAWADI VOWEL SIGN AA +112E2 ; Right # Mc KHUDAWADI VOWEL SIGN II +11302..11303 ; Right # Mc [2] GRANTHA SIGN ANUSVARA..GRANTHA SIGN VISARGA +1133E..1133F ; Right # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11341..11344 ; Right # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +1134D ; Right # Mc GRANTHA SIGN VIRAMA +11357 ; Right # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Right # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435 ; Right # Mc NEWA VOWEL SIGN AA +11437 ; Right # Mc NEWA VOWEL SIGN II +11440..11441 ; Right # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +11445 ; Right # Mc NEWA SIGN VISARGA +114B0 ; Right # Mc TIRHUTA VOWEL SIGN AA +114B2 ; Right # Mc TIRHUTA VOWEL SIGN II +114BD ; Right # Mc TIRHUTA VOWEL SIGN 
SHORT O +114C1 ; Right # Mc TIRHUTA SIGN VISARGA +115AF ; Right # Mc SIDDHAM VOWEL SIGN AA +115B1 ; Right # Mc SIDDHAM VOWEL SIGN II +115BE ; Right # Mc SIDDHAM SIGN VISARGA +11630..11632 ; Right # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +1163B..1163C ; Right # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +1163E ; Right # Mc MODI SIGN VISARGA +116AC ; Right # Mc TAKRI SIGN VISARGA +116AF ; Right # Mc TAKRI VOWEL SIGN II +116B6 ; Right # Mc TAKRI SIGN VIRAMA +11720..11721 ; Right # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +1182C ; Right # Mc DOGRA VOWEL SIGN AA +1182E ; Right # Mc DOGRA VOWEL SIGN II +11838 ; Right # Mc DOGRA SIGN VISARGA +11930..11934 ; Right # Mc [5] DIVES AKURU VOWEL SIGN AA..DIVES AKURU VOWEL SIGN UU +1193D ; Right # Mc DIVES AKURU SIGN HALANTA +11940 ; Right # Mc DIVES AKURU MEDIAL YA +119D1 ; Right # Mc NANDINAGARI VOWEL SIGN AA +119D3 ; Right # Mc NANDINAGARI VOWEL SIGN II +119DC..119DF ; Right # Mc [4] NANDINAGARI VOWEL SIGN O..NANDINAGARI SIGN VISARGA +11A39 ; Right # Mc ZANABAZAR SQUARE SIGN VISARGA +11A57..11A58 ; Right # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A97 ; Right # Mc SOYOMBO SIGN VISARGA +11C2F ; Right # Mc BHAIKSUKI VOWEL SIGN AA +11C3E ; Right # Mc BHAIKSUKI SIGN VISARGA +11CA9 ; Right # Mc MARCHEN SUBJOINED LETTER YA +11CB4 ; Right # Mc MARCHEN VOWEL SIGN O +11D46 ; Right # Lo MASARAM GONDI REPHA +11D8A..11D8E ; Right # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D93..11D94 ; Right # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11D96 ; Right # Mc GUNJALA GONDI SIGN VISARGA +11EF6 ; Right # Mc MAKASAR VOWEL SIGN O +11F03 ; Right # Mc KAWI SIGN VISARGA +11F34..11F35 ; Right # Mc [2] KAWI VOWEL SIGN AA..KAWI VOWEL SIGN ALTERNATE AA +11F41 ; Right # Mc KAWI SIGN KILLER + +# Indic_Positional_Category=Left + +093F ; Left # Mc DEVANAGARI VOWEL SIGN I +094E ; Left # Mc DEVANAGARI VOWEL SIGN PRISHTHAMATRA E +09BF ; Left # Mc BENGALI VOWEL SIGN I +09C7..09C8 ; Left # 
Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +0A3F ; Left # Mc GURMUKHI VOWEL SIGN I +0ABF ; Left # Mc GUJARATI VOWEL SIGN I +0B47 ; Left # Mc ORIYA VOWEL SIGN E +0BC6..0BC8 ; Left # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0D46..0D48 ; Left # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0DD9 ; Left # Mc SINHALA VOWEL SIGN KOMBUVA +0DDB ; Left # Mc SINHALA VOWEL SIGN KOMBU DEKA +0F3F ; Left # Mc TIBETAN SIGN MAR TSHES +1031 ; Left # Mc MYANMAR VOWEL SIGN E +1084 ; Left # Mc MYANMAR VOWEL SIGN SHAN E +17C1..17C3 ; Left # Mc [3] KHMER VOWEL SIGN E..KHMER VOWEL SIGN AI +1A19 ; Left # Mc BUGINESE VOWEL SIGN E +1A55 ; Left # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A6E..1A72 ; Left # Mc [5] TAI THAM VOWEL SIGN E..TAI THAM VOWEL SIGN THAM AI +1B3E..1B3F ; Left # Mc [2] BALINESE VOWEL SIGN TALING..BALINESE VOWEL SIGN TALING REPA +1BA6 ; Left # Mc SUNDANESE VOWEL SIGN PANAELAENG +1C27..1C28 ; Left # Mc [2] LEPCHA VOWEL SIGN I..LEPCHA VOWEL SIGN O +1C34..1C35 ; Left # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A9BA..A9BB ; Left # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +AA2F..AA30 ; Left # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA34 ; Left # Mc CHAM CONSONANT SIGN RA +AAEB ; Left # Mc MEETEI MAYEK VOWEL SIGN II +AAEE ; Left # Mc MEETEI MAYEK VOWEL SIGN AU +110B1 ; Left # Mc KAITHI VOWEL SIGN I +1112C ; Left # Mc CHAKMA VOWEL SIGN E +111B4 ; Left # Mc SHARADA VOWEL SIGN I +111CE ; Left # Mc SHARADA VOWEL SIGN PRISHTHAMATRA E +112E1 ; Left # Mc KHUDAWADI VOWEL SIGN I +11347..11348 ; Left # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +11436 ; Left # Mc NEWA VOWEL SIGN I +114B1 ; Left # Mc TIRHUTA VOWEL SIGN I +114B9 ; Left # Mc TIRHUTA VOWEL SIGN E +115B0 ; Left # Mc SIDDHAM VOWEL SIGN I +115B8 ; Left # Mc SIDDHAM VOWEL SIGN E +116AE ; Left # Mc TAKRI VOWEL SIGN I +11726 ; Left # Mc AHOM VOWEL SIGN E +1182D ; Left # Mc DOGRA VOWEL SIGN I +11935 ; Left # Mc DIVES AKURU VOWEL SIGN E +11937 ; 
Left # Mc DIVES AKURU VOWEL SIGN AI +119D2 ; Left # Mc NANDINAGARI VOWEL SIGN I +119E4 ; Left # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E +11CB1 ; Left # Mc MARCHEN VOWEL SIGN I +11EF5 ; Left # Mc MAKASAR VOWEL SIGN E +11F3E..11F3F ; Left # Mc [2] KAWI VOWEL SIGN E..KAWI VOWEL SIGN AI + +# Indic_Positional_Category=Visual_Order_Left + +# These are dependent vowels that occur to the left of the consonant +# letter in a syllable, but which occur in scripts using the visual order +# model, instead of the logical order model. Because of the different +# model, these left-side vowels occur first in the backing store (before +# the consonant letter) and are not reordered during text rendering. +# +# [Derivation: Logical_Order_Exception=Yes] + +0E40..0E44 ; Visual_Order_Left # Lo [5] THAI CHARACTER SARA E..THAI CHARACTER SARA AI MAIMALAI +0EC0..0EC4 ; Visual_Order_Left # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +19B5..19B7 ; Visual_Order_Left # Lo [3] NEW TAI LUE VOWEL SIGN E..NEW TAI LUE VOWEL SIGN O +19BA ; Visual_Order_Left # Lo NEW TAI LUE VOWEL SIGN AY +AAB5..AAB6 ; Visual_Order_Left # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB9 ; Visual_Order_Left # Lo TAI VIET VOWEL UEA +AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL AY + +# Indic_Positional_Category=Left_And_Right + +09CB..09CC ; Left_And_Right # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +0B4B ; Left_And_Right # Mc ORIYA VOWEL SIGN O +0BCA..0BCC ; Left_And_Right # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0D4A..0D4C ; Left_And_Right # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0DDC ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA +0DDE ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA +17C0 ; Left_And_Right # Mc KHMER VOWEL SIGN IE +17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU +1B40..1B41 ; Left_And_Right # Mc [2] BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG 
+1134B..1134C ; Left_And_Right # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +114BC ; Left_And_Right # Mc TIRHUTA VOWEL SIGN O +114BE ; Left_And_Right # Mc TIRHUTA VOWEL SIGN AU +115BA ; Left_And_Right # Mc SIDDHAM VOWEL SIGN O +11938 ; Left_And_Right # Mc DIVES AKURU VOWEL SIGN O + +# Indic_Positional_Category=Top + +0900..0902 ; Top # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +093A ; Top # Mn DEVANAGARI VOWEL SIGN OE +0945..0948 ; Top # Mn [4] DEVANAGARI VOWEL SIGN CANDRA E..DEVANAGARI VOWEL SIGN AI +0951 ; Top # Mn DEVANAGARI STRESS SIGN UDATTA +0955 ; Top # Mn DEVANAGARI VOWEL SIGN CANDRA LONG E +0981 ; Top # Mn BENGALI SIGN CANDRABINDU +09FE ; Top # Mn BENGALI SANDHI MARK +0A01..0A02 ; Top # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A47..0A48 ; Top # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Top # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0A70..0A71 ; Top # Mn [2] GURMUKHI TIPPI..GURMUKHI ADDAK +0A81..0A82 ; Top # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0AC5 ; Top # Mn GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Top # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AFA..0AFF ; Top # Mn [6] GUJARATI SIGN SUKUN..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B01 ; Top # Mn ORIYA SIGN CANDRABINDU +0B3F ; Top # Mn ORIYA VOWEL SIGN I +0B55..0B56 ; Top # Mn [2] ORIYA SIGN OVERLINE..ORIYA AI LENGTH MARK +0B82 ; Top # Mn TAMIL SIGN ANUSVARA +0BC0 ; Top # Mn TAMIL VOWEL SIGN II +0BCD ; Top # Mn TAMIL SIGN VIRAMA +0C00 ; Top # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C04 ; Top # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C3E..0C40 ; Top # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C46..0C47 ; Top # Mn [2] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN EE +0C4A..0C4D ; Top # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA +0C55 ; Top # Mn TELUGU LENGTH MARK +0C81 ; Top # Mn KANNADA SIGN CANDRABINDU +0CBF ; Top # Mn KANNADA VOWEL SIGN I +0CC6 ; Top # Mn KANNADA VOWEL 
SIGN E +0CCC..0CCD ; Top # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA +0D00..0D01 ; Top # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D3B..0D3C ; Top # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0D4D ; Top # Mn MALAYALAM SIGN VIRAMA +0D4E ; Top # Lo MALAYALAM LETTER DOT REPH +0D81 ; Top # Mn SINHALA SIGN CANDRABINDU +0DCA ; Top # Mn SINHALA SIGN AL-LAKUNA +0DD2..0DD3 ; Top # Mn [2] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN DIGA IS-PILLA +0E31 ; Top # Mn THAI CHARACTER MAI HAN-AKAT +0E34..0E37 ; Top # Mn [4] THAI CHARACTER SARA I..THAI CHARACTER SARA UEE +0E47..0E4E ; Top # Mn [8] THAI CHARACTER MAITAIKHU..THAI CHARACTER YAMAKKAN +0EB1 ; Top # Mn LAO VOWEL SIGN MAI KAN +0EB4..0EB7 ; Top # Mn [4] LAO VOWEL SIGN I..LAO VOWEL SIGN YY +0EBB ; Top # Mn LAO VOWEL SIGN MAI KON +0EC8..0ECE ; Top # Mn [7] LAO TONE MAI EK..LAO YAMAKKAN +0F39 ; Top # Mn TIBETAN MARK TSA -PHRU +0F72 ; Top # Mn TIBETAN VOWEL SIGN I +0F7A..0F7E ; Top # Mn [5] TIBETAN VOWEL SIGN E..TIBETAN SIGN RJES SU NGA RO +0F80 ; Top # Mn TIBETAN VOWEL SIGN REVERSED I +0F82..0F83 ; Top # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +0F86..0F87 ; Top # Mn [2] TIBETAN SIGN LCI RTAGS..TIBETAN SIGN YANG RTAGS +102D..102E ; Top # Mn [2] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN II +1032..1036 ; Top # Mn [5] MYANMAR VOWEL SIGN AI..MYANMAR SIGN ANUSVARA +103A ; Top # Mn MYANMAR SIGN ASAT +1071..1074 ; Top # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1085..1086 ; Top # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109D ; Top # Mn MYANMAR VOWEL SIGN AITON AI +1712 ; Top # Mn TAGALOG VOWEL SIGN I +1732 ; Top # Mn HANUNOO VOWEL SIGN I +1752 ; Top # Mn BUHID VOWEL SIGN I +1772 ; Top # Mn TAGBANWA VOWEL SIGN I +17B7..17BA ; Top # Mn [4] KHMER VOWEL SIGN I..KHMER VOWEL SIGN YY +17C6 ; Top # Mn KHMER SIGN NIKAHIT +17C9..17D1 ; Top # Mn [9] KHMER SIGN MUUSIKATOAN..KHMER SIGN 
VIRIAM +17D3 ; Top # Mn KHMER SIGN BATHAMASAT +17DD ; Top # Mn KHMER SIGN ATTHACAN +1920..1921 ; Top # Mn [2] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN I +1927..1928 ; Top # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Top # Mn LIMBU SIGN KEMPHRENG +1A17 ; Top # Mn BUGINESE VOWEL SIGN I +1A1B ; Top # Mn BUGINESE VOWEL SIGN AE +1A58..1A5A ; Top # Mn [3] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN LOW PA +1A62 ; Top # Mn TAI THAM VOWEL SIGN MAI SAT +1A65..1A68 ; Top # Mn [4] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN UUE +1A6B ; Top # Mn TAI THAM VOWEL SIGN O +1A73..1A7C ; Top # Mn [10] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN KHUEN-LUE KARAN +1B00..1B03 ; Top # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG +1B34 ; Top # Mn BALINESE SIGN REREKAN +1B36..1B37 ; Top # Mn [2] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN ULU SARI +1B42 ; Top # Mn BALINESE VOWEL SIGN PEPET +1B6B ; Top # Mn BALINESE MUSICAL SYMBOL COMBINING TEGEH +1B6D..1B73 ; Top # Mn [7] BALINESE MUSICAL SYMBOL COMBINING KEMPUL..BALINESE MUSICAL SYMBOL COMBINING GONG +1B80..1B81 ; Top # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR +1BA4 ; Top # Mn SUNDANESE VOWEL SIGN PANGHULU +1BA8..1BA9 ; Top # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE6 ; Top # Mn BATAK SIGN TOMPI +1BE8..1BE9 ; Top # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BED ; Top # Mn BATAK VOWEL SIGN KARO O +1BEF..1BF1 ; Top # Mn [3] BATAK VOWEL SIGN U FOR SIMALUNGUN SA..BATAK CONSONANT SIGN H +1C2D..1C33 ; Top # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +1C36 ; Top # Mn LEPCHA SIGN RAN +1CD0..1CD2 ; Top # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CDA..1CDB ; Top # Mn [2] VEDIC TONE DOUBLE SVARITA..VEDIC TONE TRIPLE SVARITA +1CE0 ; Top # Mn VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CF4 ; Top # Mn VEDIC TONE CANDRA ABOVE +1DFB ; Top # Mn COMBINING DELETION MARK +20F0 ; Top # Mn COMBINING ASTERISK ABOVE +A802 ; Top # Mn SYLOTI NAGRI SIGN 
DVISVARA +A806 ; Top # Mn SYLOTI NAGRI SIGN HASANTA +A80B ; Top # Mn SYLOTI NAGRI SIGN ANUSVARA +A826 ; Top # Mn SYLOTI NAGRI VOWEL SIGN E +A8C5 ; Top # Mn SAURASHTRA SIGN CANDRABINDU +A8E0..A8F1 ; Top # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +A8FF ; Top # Mn DEVANAGARI VOWEL SIGN AY +A926..A92A ; Top # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O +A94A ; Top # Mn REJANG VOWEL SIGN AI +A94F..A951 ; Top # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A980..A982 ; Top # Mn [3] JAVANESE SIGN PANYANGGA..JAVANESE SIGN LAYAR +A9B3 ; Top # Mn JAVANESE SIGN CECAK TELU +A9B6..A9B7 ; Top # Mn [2] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN WULU MELIK +A9BC ; Top # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Top # Mn MYANMAR SIGN SHAN SAW +AA29..AA2C ; Top # Mn [4] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN EI +AA2E ; Top # Mn CHAM VOWEL SIGN OE +AA31 ; Top # Mn CHAM VOWEL SIGN AU +AA43 ; Top # Mn CHAM CONSONANT SIGN FINAL NG +AA4C ; Top # Mn CHAM CONSONANT SIGN FINAL M +AA7C ; Top # Mn MYANMAR SIGN TAI LAING TONE-2 +AAB0 ; Top # Mn TAI VIET MAI KANG +AAB2..AAB3 ; Top # Mn [2] TAI VIET VOWEL I..TAI VIET VOWEL UE +AAB7..AAB8 ; Top # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AABE..AABF ; Top # Mn [2] TAI VIET VOWEL AM..TAI VIET TONE MAI EK +AAC1 ; Top # Mn TAI VIET TONE MAI THO +AAED ; Top # Mn MEETEI MAYEK VOWEL SIGN AAI +ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP +10A05 ; Top # Mn KHAROSHTHI VOWEL SIGN E +10A0F ; Top # Mn KHAROSHTHI SIGN VISARGA +10A38 ; Top # Mn KHAROSHTHI SIGN BAR ABOVE +11001 ; Top # Mn BRAHMI SIGN ANUSVARA +11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II +11042..11046 ; Top # Mn [5] BRAHMI VOWEL SIGN E..BRAHMI VIRAMA +11070 ; Top # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11073..11074 ; Top # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +11080..11081 ; Top # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI 
VOWEL SIGN AI +11100..11102 ; Top # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA +11127..11129 ; Top # Mn [3] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN II +1112D ; Top # Mn CHAKMA VOWEL SIGN AI +11130 ; Top # Mn CHAKMA VOWEL SIGN OI +11134 ; Top # Mn CHAKMA MAAYYAA +11180..11181 ; Top # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +111BC..111BE ; Top # Mn [3] SHARADA VOWEL SIGN E..SHARADA VOWEL SIGN O +111C2..111C3 ; Top # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA +111CB ; Top # Mn SHARADA VOWEL MODIFIER MARK +111CF ; Top # Mn SHARADA SIGN INVERTED CANDRABINDU +11230..11231 ; Top # Mn [2] KHOJKI VOWEL SIGN E..KHOJKI VOWEL SIGN AI +11234 ; Top # Mn KHOJKI SIGN ANUSVARA +11236..11237 ; Top # Mn [2] KHOJKI SIGN NUKTA..KHOJKI SIGN SHADDA +1123E ; Top # Mn KHOJKI SIGN SUKUN +112DF ; Top # Mn KHUDAWADI SIGN ANUSVARA +112E5..112E8 ; Top # Mn [4] KHUDAWADI VOWEL SIGN E..KHUDAWADI VOWEL SIGN AU +11300..11301 ; Top # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11340 ; Top # Mn GRANTHA VOWEL SIGN II +11366..1136C ; Top # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Top # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA +1143E..1143F ; Top # Mn [2] NEWA VOWEL SIGN E..NEWA VOWEL SIGN AI +11443..11444 ; Top # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +1145E ; Top # Mn NEWA SANDHI MARK +114BA ; Top # Mn TIRHUTA VOWEL SIGN SHORT E +114BF..114C0 ; Top # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Top # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +11639..1163A ; Top # Mn [2] MODI VOWEL SIGN E..MODI VOWEL SIGN AI +1163D ; Top # Mn MODI SIGN ANUSVARA +11640 ; Top # Mn MODI SIGN ARDHACANDRA +116AB ; Top # Mn TAKRI SIGN ANUSVARA +116AD ; Top # Mn TAKRI VOWEL SIGN AA +116B2..116B5 ; Top # Mn [4] TAKRI VOWEL SIGN E..TAKRI VOWEL SIGN AU +1171F ; Top # Mn AHOM CONSONANT SIGN MEDIAL LIGATING RA +11722..11723 ; Top # Mn [2] AHOM VOWEL SIGN 
I..AHOM VOWEL SIGN II +11727 ; Top # Mn AHOM VOWEL SIGN AW +11729..1172B ; Top # Mn [3] AHOM VOWEL SIGN AI..AHOM SIGN KILLER +11833..11837 ; Top # Mn [5] DOGRA VOWEL SIGN E..DOGRA SIGN ANUSVARA +1193B..1193C ; Top # Mn [2] DIVES AKURU SIGN ANUSVARA..DIVES AKURU SIGN CANDRABINDU +1193F ; Top # Lo DIVES AKURU PREFIXED NASAL SIGN +11941 ; Top # Lo DIVES AKURU INITIAL RA +119DA..119DB ; Top # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI +11A01 ; Top # Mn ZANABAZAR SQUARE VOWEL SIGN I +11A04..11A09 ; Top # Mn [6] ZANABAZAR SQUARE VOWEL SIGN E..ZANABAZAR SQUARE VOWEL SIGN REVERSED I +11A35..11A38 ; Top # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A3A ; Top # Lo ZANABAZAR SQUARE CLUSTER-INITIAL LETTER RA +11A51 ; Top # Mn SOYOMBO VOWEL SIGN I +11A54..11A56 ; Top # Mn [3] SOYOMBO VOWEL SIGN E..SOYOMBO VOWEL SIGN OE +11A84..11A89 ; Top # Lo [6] SOYOMBO SIGN JIHVAMULIYA..SOYOMBO CLUSTER-INITIAL LETTER SA +11A96 ; Top # Mn SOYOMBO SIGN ANUSVARA +11A98 ; Top # Mn SOYOMBO GEMINATION MARK +11C30..11C31 ; Top # Mn [2] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN II +11C38..11C3D ; Top # Mn [6] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI SIGN ANUSVARA +11CB3 ; Top # Mn MARCHEN VOWEL SIGN E +11CB5..11CB6 ; Top # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D31..11D35 ; Top # Mn [5] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN UU +11D3A ; Top # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Top # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F..11D41 ; Top # Mn [3] MASARAM GONDI VOWEL SIGN AU..MASARAM GONDI SIGN VISARGA +11D43 ; Top # Mn MASARAM GONDI SIGN CANDRA +11D90..11D91 ; Top # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI +11D95 ; Top # Mn GUNJALA GONDI SIGN ANUSVARA +11EF3 ; Top # Mn MAKASAR VOWEL SIGN I +11F00..11F01 ; Top # Mn [2] KAWI SIGN CANDRABINDU..KAWI SIGN ANUSVARA +11F02 ; Top # Lo KAWI SIGN REPHA +11F36..11F37 ; Top # Mn [2] KAWI VOWEL SIGN I..KAWI VOWEL SIGN II 
+11F40 ; Top # Mn KAWI VOWEL SIGN EU + +# Indic_Positional_Category=Bottom + +093C ; Bottom # Mn DEVANAGARI SIGN NUKTA +0941..0944 ; Bottom # Mn [4] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN VOCALIC RR +094D ; Bottom # Mn DEVANAGARI SIGN VIRAMA +0952 ; Bottom # Mn DEVANAGARI STRESS SIGN ANUDATTA +0956..0957 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN UE..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BC ; Bottom # Mn BENGALI SIGN NUKTA +09C1..09C4 ; Bottom # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09CD ; Bottom # Mn BENGALI SIGN VIRAMA +09E2..09E3 ; Bottom # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3C ; Bottom # Mn GURMUKHI SIGN NUKTA +0A41..0A42 ; Bottom # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A4D ; Bottom # Mn GURMUKHI SIGN VIRAMA +0A51 ; Bottom # Mn GURMUKHI SIGN UDAAT +0A75 ; Bottom # Mn GURMUKHI SIGN YAKASH +0ABC ; Bottom # Mn GUJARATI SIGN NUKTA +0AC1..0AC4 ; Bottom # Mn [4] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN VOCALIC RR +0ACD ; Bottom # Mn GUJARATI SIGN VIRAMA +0AE2..0AE3 ; Bottom # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3C ; Bottom # Mn ORIYA SIGN NUKTA +0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B4D ; Bottom # Mn ORIYA SIGN VIRAMA +0B62..0B63 ; Bottom # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0C3C ; Bottom # Mn TELUGU SIGN NUKTA +0C56 ; Bottom # Mn TELUGU AI LENGTH MARK +0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBC ; Bottom # Mn KANNADA SIGN NUKTA +0CE2..0CE3 ; Bottom # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D43..0D44 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC R..MALAYALAM VOWEL SIGN VOCALIC RR +0D62..0D63 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DD4 ; Bottom # Mn SINHALA VOWEL SIGN KETTI 
PAA-PILLA +0DD6 ; Bottom # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0E38..0E3A ; Bottom # Mn [3] THAI CHARACTER SARA U..THAI CHARACTER PHINTHU +0EB8..0EBA ; Bottom # Mn [3] LAO VOWEL SIGN U..LAO SIGN PALI VIRAMA +0EBC ; Bottom # Mn LAO SEMIVOWEL SIGN LO +0F18..0F19 ; Bottom # Mn [2] TIBETAN ASTROLOGICAL SIGN -KHYUD PA..TIBETAN ASTROLOGICAL SIGN SDONG TSHUGS +0F35 ; Bottom # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Bottom # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0F71 ; Bottom # Mn TIBETAN VOWEL SIGN AA +0F74..0F75 ; Bottom # Mn [2] TIBETAN VOWEL SIGN U..TIBETAN VOWEL SIGN UU +0F84 ; Bottom # Mn TIBETAN MARK HALANTA +0F8D..0F97 ; Bottom # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Bottom # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +0FC6 ; Bottom # Mn TIBETAN SYMBOL PADMA GDAN +102F..1030 ; Bottom # Mn [2] MYANMAR VOWEL SIGN U..MYANMAR VOWEL SIGN UU +1037 ; Bottom # Mn MYANMAR SIGN DOT BELOW +103D..103E ; Bottom # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +1058..1059 ; Bottom # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +105E..1060 ; Bottom # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Bottom # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +108D ; Bottom # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +1713..1714 ; Bottom # Mn [2] TAGALOG VOWEL SIGN U..TAGALOG SIGN VIRAMA +1733 ; Bottom # Mn HANUNOO VOWEL SIGN U +1753 ; Bottom # Mn BUHID VOWEL SIGN U +1773 ; Bottom # Mn TAGBANWA VOWEL SIGN U +17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA +1922 ; Bottom # Mn LIMBU VOWEL SIGN U +1932 ; Bottom # Mn LIMBU SMALL LETTER ANUSVARA +1939 ; Bottom # Mn LIMBU SIGN MUKPHRENG +193B ; Bottom # Mn LIMBU SIGN SA-I +1A18 ; Bottom # Mn BUGINESE VOWEL SIGN U +1A56 ; Bottom # Mn TAI THAM CONSONANT SIGN MEDIAL LA +1A5B..1A5E ; Bottom # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM 
CONSONANT SIGN SA +1A69..1A6A ; Bottom # Mn [2] TAI THAM VOWEL SIGN U..TAI THAM VOWEL SIGN UU +1A6C ; Bottom # Mn TAI THAM VOWEL SIGN OA BELOW +1A7F ; Bottom # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1B38..1B3A ; Bottom # Mn [3] BALINESE VOWEL SIGN SUKU..BALINESE VOWEL SIGN RA REPA +1B6C ; Bottom # Mn BALINESE MUSICAL SYMBOL COMBINING ENDEP +1BA2..1BA3 ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BA5 ; Bottom # Mn SUNDANESE VOWEL SIGN PANYUKU +1BAC..1BAD ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C2C ; Bottom # Mn LEPCHA VOWEL SIGN E +1C37 ; Bottom # Mn LEPCHA SIGN NUKTA +1CD5..1CD9 ; Bottom # Mn [5] VEDIC TONE YAJURVEDIC AGGRAVATED INDEPENDENT SVARITA..VEDIC TONE YAJURVEDIC KATHAKA INDEPENDENT SVARITA SCHROEDER +1CDC..1CDF ; Bottom # Mn [4] VEDIC TONE KATHAKA ANUDATTA..VEDIC TONE THREE DOTS BELOW +1CED ; Bottom # Mn VEDIC SIGN TIRYAK +A825 ; Bottom # Mn SYLOTI NAGRI VOWEL SIGN U +A82C ; Bottom # Mn SYLOTI NAGRI SIGN ALTERNATE HASANTA +A8C4 ; Bottom # Mn SAURASHTRA SIGN VIRAMA +A92B..A92D ; Bottom # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +A947..A949 ; Bottom # Mn [3] REJANG VOWEL SIGN I..REJANG VOWEL SIGN E +A94B..A94E ; Bottom # Mn [4] REJANG VOWEL SIGN O..REJANG VOWEL SIGN EA +A9B8..A9B9 ; Bottom # Mn [2] JAVANESE VOWEL SIGN SUKU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BD ; Bottom # Mn JAVANESE CONSONANT SIGN KERET +AA2D ; Bottom # Mn CHAM VOWEL SIGN U +AA32 ; Bottom # Mn CHAM VOWEL SIGN UE +AA35..AA36 ; Bottom # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +AAB4 ; Bottom # Mn TAI VIET VOWEL U +AAEC ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UU +ABE8 ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK +10A02..10A03 ; Bottom # Mn [2] KHAROSHTHI VOWEL SIGN U..KHAROSHTHI VOWEL SIGN VOCALIC R +10A0C..10A0E ; Bottom # Mn [3] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN ANUSVARA +10A39..10A3A ; Bottom # Mn [2] KHAROSHTHI 
SIGN CAUDA..KHAROSHTHI SIGN DOT BELOW +1103C..11041 ; Bottom # Mn [6] BRAHMI VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL +110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU +110B9..110BA ; Bottom # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +110C2 ; Bottom # Mn KAITHI VOWEL SIGN VOCALIC R +1112A..1112B ; Bottom # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU +11131..11132 ; Bottom # Mn [2] CHAKMA O MARK..CHAKMA AU MARK +11173 ; Bottom # Mn MAHAJANI SIGN NUKTA +111B6..111BB ; Bottom # Mn [6] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN VOCALIC LL +111C9..111CA ; Bottom # Mn [2] SHARADA SANDHI MARK..SHARADA SIGN NUKTA +111CC ; Bottom # Mn SHARADA EXTRA SHORT VOWEL MARK +1122F ; Bottom # Mn KHOJKI VOWEL SIGN U +11241 ; Bottom # Mn KHOJKI VOWEL SIGN VOCALIC R +112E3..112E4 ; Bottom # Mn [2] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN UU +112E9..112EA ; Bottom # Mn [2] KHUDAWADI SIGN NUKTA..KHUDAWADI SIGN VIRAMA +1133B..1133C ; Bottom # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +11438..1143D ; Bottom # Mn [6] NEWA VOWEL SIGN U..NEWA VOWEL SIGN VOCALIC LL +11442 ; Bottom # Mn NEWA SIGN VIRAMA +11446 ; Bottom # Mn NEWA SIGN NUKTA +114B3..114B8 ; Bottom # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114C2..114C3 ; Bottom # Mn [2] TIRHUTA SIGN VIRAMA..TIRHUTA SIGN NUKTA +115B2..115B5 ; Bottom # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115BF..115C0 ; Bottom # Mn [2] SIDDHAM SIGN VIRAMA..SIDDHAM SIGN NUKTA +115DC..115DD ; Bottom # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11633..11638 ; Bottom # Mn [6] MODI VOWEL SIGN U..MODI VOWEL SIGN VOCALIC LL +1163F ; Bottom # Mn MODI SIGN VIRAMA +116B0..116B1 ; Bottom # Mn [2] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN UU +116B7 ; Bottom # Mn TAKRI SIGN NUKTA +1171D ; Bottom # Mn AHOM CONSONANT SIGN MEDIAL LA +11724..11725 ; Bottom # Mn [2] AHOM VOWEL SIGN U..AHOM VOWEL SIGN UU +11728 ; Bottom # Mn AHOM VOWEL SIGN O +1182F..11832 ; Bottom # Mn [4] 
DOGRA VOWEL SIGN U..DOGRA VOWEL SIGN VOCALIC RR +11839..1183A ; Bottom # Mn [2] DOGRA SIGN VIRAMA..DOGRA SIGN NUKTA +11943 ; Bottom # Mn DIVES AKURU SIGN NUKTA +119D4..119D7 ; Bottom # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR +119E0 ; Bottom # Mn NANDINAGARI SIGN VIRAMA +11A02..11A03 ; Bottom # Mn [2] ZANABAZAR SQUARE VOWEL SIGN UE..ZANABAZAR SQUARE VOWEL SIGN U +11A0A ; Bottom # Mn ZANABAZAR SQUARE VOWEL LENGTH MARK +11A33..11A34 ; Bottom # Mn [2] ZANABAZAR SQUARE FINAL CONSONANT MARK..ZANABAZAR SQUARE SIGN VIRAMA +11A3B..11A3E ; Bottom # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11A52..11A53 ; Bottom # Mn [2] SOYOMBO VOWEL SIGN UE..SOYOMBO VOWEL SIGN U +11A59..11A5B ; Bottom # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11A8A..11A95 ; Bottom # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A +11C32..11C36 ; Bottom # Mn [5] BHAIKSUKI VOWEL SIGN U..BHAIKSUKI VOWEL SIGN VOCALIC L +11C3F ; Bottom # Mn BHAIKSUKI SIGN VIRAMA +11C92..11CA7 ; Bottom # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CAA..11CB0 ; Bottom # Mn [7] MARCHEN SUBJOINED LETTER RA..MARCHEN VOWEL SIGN AA +11CB2 ; Bottom # Mn MARCHEN VOWEL SIGN U +11D36 ; Bottom # Mn MASARAM GONDI VOWEL SIGN VOCALIC R +11D42 ; Bottom # Mn MASARAM GONDI SIGN NUKTA +11D44 ; Bottom # Mn MASARAM GONDI SIGN HALANTA +11D47 ; Bottom # Mn MASARAM GONDI RA-KARA +11EF4 ; Bottom # Mn MAKASAR VOWEL SIGN U +11F38..11F3A ; Bottom # Mn [3] KAWI VOWEL SIGN U..KAWI VOWEL SIGN VOCALIC R + +# Indic_Positional_Category=Top_And_Bottom + +0C48 ; Top_And_Bottom # Mn TELUGU VOWEL SIGN AI +0F73 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN II +0F76..0F79 ; Top_And_Bottom # Mn [4] TIBETAN VOWEL SIGN VOCALIC R..TIBETAN VOWEL SIGN VOCALIC LL +0F81 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN REVERSED II +1B3C ; Top_And_Bottom # Mn BALINESE VOWEL SIGN LA LENGA +1112E..1112F ; Top_And_Bottom # Mn [2] CHAKMA VOWEL SIGN 
O..CHAKMA VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Right + +0AC9 ; Top_And_Right # Mc GUJARATI VOWEL SIGN CANDRA O +0B57 ; Top_And_Right # Mc ORIYA AU LENGTH MARK +0CC0 ; Top_And_Right # Mc KANNADA VOWEL SIGN II +0CC7..0CC8 ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +1925..1926 ; Top_And_Right # Mc [2] LIMBU VOWEL SIGN OO..LIMBU VOWEL SIGN AU +1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG +111BF ; Top_And_Right # Mc SHARADA VOWEL SIGN AU +11232..11233 ; Top_And_Right # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Left + +0B48 ; Top_And_Left # Mc ORIYA VOWEL SIGN AI +0DDA ; Top_And_Left # Mc SINHALA VOWEL SIGN DIGA KOMBUVA +17BE ; Top_And_Left # Mc KHMER VOWEL SIGN OE +1C29 ; Top_And_Left # Mc LEPCHA VOWEL SIGN OO +114BB ; Top_And_Left # Mc TIRHUTA VOWEL SIGN AI +115B9 ; Top_And_Left # Mc SIDDHAM VOWEL SIGN AI + +# Indic_Positional_Category=Top_And_Left_And_Right + +0B4C ; Top_And_Left_And_Right # Mc ORIYA VOWEL SIGN AU +0DDD ; Top_And_Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA +17BF ; Top_And_Left_And_Right # Mc KHMER VOWEL SIGN YA +115BB ; Top_And_Left_And_Right # Mc SIDDHAM VOWEL SIGN AU + +# Indic_Positional_Category=Bottom_And_Right + +1B3B ; Bottom_And_Right # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +A9BE ; Bottom_And_Right # Mc JAVANESE CONSONANT SIGN PENGKAL +A9C0 ; Bottom_And_Right # Mc JAVANESE PANGKON +11942 ; Bottom_And_Right # Mc DIVES AKURU MEDIAL RA + +# Indic_Positional_Category=Bottom_And_Left + +A9BF ; Bottom_And_Left # Mc JAVANESE CONSONANT SIGN CAKRA + +# Indic_Positional_Category=Top_And_Bottom_And_Right + +1B3D ; Top_And_Bottom_And_Right # Mc BALINESE VOWEL SIGN LA LENGA TEDUNG + +# Indic_Positional_Category=Top_And_Bottom_And_Left + +103C ; Top_And_Bottom_And_Left # Mc MYANMAR CONSONANT SIGN MEDIAL RA +1171E ; Top_And_Bottom_And_Left # Mn AHOM 
CONSONANT SIGN MEDIAL RA + +# Indic_Positional_Category=Overstruck + +1CD4 ; Overstruck # Mn VEDIC SIGN YAJURVEDIC MIDLINE SVARITA +1CE2..1CE8 ; Overstruck # Mn [7] VEDIC SIGN VISARGA SVARITA..VEDIC SIGN VISARGA ANUDATTA WITH TAIL +10A01 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN I +10A06 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN O + +# EOF diff --git a/data/15.1.0-indic-syllabic-category.txt b/data/15.1.0-indic-syllabic-category.txt new file mode 100644 index 0000000..f2623b4 --- /dev/null +++ b/data/15.1.0-indic-syllabic-category.txt @@ -0,0 +1,1347 @@ +# IndicSyllabicCategory-15.1.0.txt +# Date: 2023-01-05 +# © 2023 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use, see https://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at https://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Syllabic_Category enumerated property +# +# Scope: This property is aimed at two general problem +# areas involving the analysis and processing of Indic scripts: +# +# 1. Specification of syllabic structure. +# 2. Specification of segmentation rules. +# +# Both of these problem areas may benefit from having defined subtypes +# of Indic script characters which are relevant to how Indic +# syllables (or aksaras) are constructed. Note that rules for +# syllabic structure in Indic scripts may differ significantly +# from how phonological syllables are defined. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Syllabic_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. 
+# +# The scripts assessed as Indic in the structural sense used for the +# Indic_Syllabic_Category are the following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dives Akuru, Dogra, Grantha, Gujarati, +# Gunjala Gondi, Gurmukhi, Hanunoo, Javanese, Kaithi, Kannada, Kawi, +# Kayah Li, Kharoshthi, Khmer, Khojki, Khudawadi, Lao, Lepcha, Limbu, +# Mahajani, Makasar, Malayalam, Marchen, Masaram Gondi, Meetei Mayek, +# Modi, Multani, Myanmar, Nandinagari, Newa, New Tai Lue, Oriya, +# Phags-pa, Rejang, Saurashtra, Sharada, Siddham, Sinhala, Soyombo, +# Sundanese, Syloti Nagri, Tagalog, Tagbanwa, Tai Le, Tai Tham, +# Tai Viet, Takri, Tamil, Telugu, Thai, Tibetan, Tirhuta, and +# Zanabazar Square. +# +# All characters for all other scripts not in that list +# take the default value for this property, unless they +# are individually listed in this data file. +# + +# ================================================ + +# Property: Indic_Syllabic_Category +# +# All code points not explicitly listed for Indic_Syllabic_Category +# have the value Other. 
+# +# @missing: 0000..10FFFF; Other + +# ================================================ + +# Indic_Syllabic_Category=Bindu + +# Bindu/Anusvara (nasalization or -n) + +# [Not derivable] + +0900..0902 ; Bindu # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +0981 ; Bindu # Mn BENGALI SIGN CANDRABINDU +0982 ; Bindu # Mc BENGALI SIGN ANUSVARA +09FC ; Bindu # Lo BENGALI LETTER VEDIC ANUSVARA +0A01..0A02 ; Bindu # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A70 ; Bindu # Mn GURMUKHI TIPPI +0A81..0A82 ; Bindu # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0B01 ; Bindu # Mn ORIYA SIGN CANDRABINDU +0B02 ; Bindu # Mc ORIYA SIGN ANUSVARA +0B82 ; Bindu # Mn TAMIL SIGN ANUSVARA +0C00 ; Bindu # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C01..0C02 ; Bindu # Mc [2] TELUGU SIGN CANDRABINDU..TELUGU SIGN ANUSVARA +0C04 ; Bindu # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C80 ; Bindu # Lo KANNADA SIGN SPACING CANDRABINDU +0C81 ; Bindu # Mn KANNADA SIGN CANDRABINDU +0C82 ; Bindu # Mc KANNADA SIGN ANUSVARA +0CF3 ; Bindu # Mc KANNADA SIGN COMBINING ANUSVARA ABOVE RIGHT +0D00..0D01 ; Bindu # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D02 ; Bindu # Mc MALAYALAM SIGN ANUSVARA +0D04 ; Bindu # Lo MALAYALAM LETTER VEDIC ANUSVARA +0D81 ; Bindu # Mn SINHALA SIGN CANDRABINDU +0D82 ; Bindu # Mc SINHALA SIGN ANUSVARAYA +0E4D ; Bindu # Mn THAI CHARACTER NIKHAHIT +0ECD ; Bindu # Mn LAO NIGGAHITA +0F7E ; Bindu # Mn TIBETAN SIGN RJES SU NGA RO +0F82..0F83 ; Bindu # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +1036 ; Bindu # Mn MYANMAR SIGN ANUSVARA +17C6 ; Bindu # Mn KHMER SIGN NIKAHIT +1932 ; Bindu # Mn LIMBU SMALL LETTER ANUSVARA +1A74 ; Bindu # Mn TAI THAM SIGN MAI KANG +1B00..1B02 ; Bindu # Mn [3] BALINESE SIGN ULU RICEM..BALINESE SIGN CECEK +1B80 ; Bindu # Mn SUNDANESE SIGN PANYECEK +1C34..1C35 ; Bindu # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A80B ; Bindu # Mn SYLOTI NAGRI 
SIGN ANUSVARA +A873 ; Bindu # Lo PHAGS-PA LETTER CANDRABINDU +A880 ; Bindu # Mc SAURASHTRA SIGN ANUSVARA +A8C5 ; Bindu # Mn SAURASHTRA SIGN CANDRABINDU +A8F2..A8F3 ; Bindu # Lo [2] DEVANAGARI SIGN SPACING CANDRABINDU..DEVANAGARI SIGN CANDRABINDU VIRAMA +A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK +10A0E ; Bindu # Mn KHAROSHTHI SIGN ANUSVARA +11000 ; Bindu # Mc BRAHMI SIGN CANDRABINDU +11001 ; Bindu # Mn BRAHMI SIGN ANUSVARA +11080..11081 ; Bindu # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +11100..11101 ; Bindu # Mn [2] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN ANUSVARA +11180..11181 ; Bindu # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +111CF ; Bindu # Mn SHARADA SIGN INVERTED CANDRABINDU +11234 ; Bindu # Mn KHOJKI SIGN ANUSVARA +112DF ; Bindu # Mn KHUDAWADI SIGN ANUSVARA +11300..11301 ; Bindu # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11302 ; Bindu # Mc GRANTHA SIGN ANUSVARA +1135E..1135F ; Bindu # Lo [2] GRANTHA LETTER VEDIC ANUSVARA..GRANTHA LETTER VEDIC DOUBLE ANUSVARA +11443..11444 ; Bindu # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +1145F ; Bindu # Lo NEWA LETTER VEDIC ANUSVARA +114BF..114C0 ; Bindu # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Bindu # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +1163D ; Bindu # Mn MODI SIGN ANUSVARA +116AB ; Bindu # Mn TAKRI SIGN ANUSVARA +11837 ; Bindu # Mn DOGRA SIGN ANUSVARA +1193B..1193C ; Bindu # Mn [2] DIVES AKURU SIGN ANUSVARA..DIVES AKURU SIGN CANDRABINDU +119DE ; Bindu # Mc NANDINAGARI SIGN ANUSVARA +11A35..11A38 ; Bindu # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A96 ; Bindu # Mn SOYOMBO SIGN ANUSVARA +11C3C..11C3D ; Bindu # Mn [2] BHAIKSUKI SIGN CANDRABINDU..BHAIKSUKI SIGN ANUSVARA +11CB5..11CB6 ; Bindu # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D40 ; Bindu # Mn MASARAM GONDI SIGN ANUSVARA +11D95 ; Bindu # Mn GUNJALA GONDI SIGN ANUSVARA 
+11F00..11F01 ; Bindu # Mn [2] KAWI SIGN CANDRABINDU..KAWI SIGN ANUSVARA + +# ================================================ + +# Indic_Syllabic_Category=Visarga + +# Visarga (-h) +# Excludes letters for jihvamuliya and upadhmaniya, which are +# related, but structured somewhat differently. + +# [Not derivable] + +0903 ; Visarga # Mc DEVANAGARI SIGN VISARGA +0983 ; Visarga # Mc BENGALI SIGN VISARGA +0A03 ; Visarga # Mc GURMUKHI SIGN VISARGA +0A83 ; Visarga # Mc GUJARATI SIGN VISARGA +0B03 ; Visarga # Mc ORIYA SIGN VISARGA +0C03 ; Visarga # Mc TELUGU SIGN VISARGA +0C83 ; Visarga # Mc KANNADA SIGN VISARGA +0D03 ; Visarga # Mc MALAYALAM SIGN VISARGA +0D83 ; Visarga # Mc SINHALA SIGN VISARGAYA +0F7F ; Visarga # Mc TIBETAN SIGN RNAM BCAD +1038 ; Visarga # Mc MYANMAR SIGN VISARGA +17C7 ; Visarga # Mc KHMER SIGN REAHMUK +1B04 ; Visarga # Mc BALINESE SIGN BISAH +1B82 ; Visarga # Mc SUNDANESE SIGN PANGWISAD +A881 ; Visarga # Mc SAURASHTRA SIGN VISARGA +A983 ; Visarga # Mc JAVANESE SIGN WIGNYAN +AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA +10A0F ; Visarga # Mn KHAROSHTHI SIGN VISARGA +11002 ; Visarga # Mc BRAHMI SIGN VISARGA +11082 ; Visarga # Mc KAITHI SIGN VISARGA +11102 ; Visarga # Mn CHAKMA SIGN VISARGA +11182 ; Visarga # Mc SHARADA SIGN VISARGA +11303 ; Visarga # Mc GRANTHA SIGN VISARGA +11445 ; Visarga # Mc NEWA SIGN VISARGA +114C1 ; Visarga # Mc TIRHUTA SIGN VISARGA +115BE ; Visarga # Mc SIDDHAM SIGN VISARGA +1163E ; Visarga # Mc MODI SIGN VISARGA +116AC ; Visarga # Mc TAKRI SIGN VISARGA +11838 ; Visarga # Mc DOGRA SIGN VISARGA +119DF ; Visarga # Mc NANDINAGARI SIGN VISARGA +11A39 ; Visarga # Mc ZANABAZAR SQUARE SIGN VISARGA +11A97 ; Visarga # Mc SOYOMBO SIGN VISARGA +11C3E ; Visarga # Mc BHAIKSUKI SIGN VISARGA +11D41 ; Visarga # Mn MASARAM GONDI SIGN VISARGA +11D96 ; Visarga # Mc GUNJALA GONDI SIGN VISARGA +11F03 ; Visarga # Mc KAWI SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Avagraha + +# Avagraha 
(elision of initial a- in sandhi) + +# [Not derivable] + +093D ; Avagraha # Lo DEVANAGARI SIGN AVAGRAHA +09BD ; Avagraha # Lo BENGALI SIGN AVAGRAHA +0ABD ; Avagraha # Lo GUJARATI SIGN AVAGRAHA +0B3D ; Avagraha # Lo ORIYA SIGN AVAGRAHA +0C3D ; Avagraha # Lo TELUGU SIGN AVAGRAHA +0CBD ; Avagraha # Lo KANNADA SIGN AVAGRAHA +0D3D ; Avagraha # Lo MALAYALAM SIGN AVAGRAHA +0F85 ; Avagraha # Po TIBETAN MARK PALUTA +17DC ; Avagraha # Lo KHMER SIGN AVAKRAHASANYA +1BBA ; Avagraha # Lo SUNDANESE AVAGRAHA +111C1 ; Avagraha # Lo SHARADA SIGN AVAGRAHA +1133D ; Avagraha # Lo GRANTHA SIGN AVAGRAHA +11447 ; Avagraha # Lo NEWA SIGN AVAGRAHA +114C4 ; Avagraha # Lo TIRHUTA SIGN AVAGRAHA +119E1 ; Avagraha # Lo NANDINAGARI SIGN AVAGRAHA +11A9D ; Avagraha # Lo SOYOMBO MARK PLUTA +11C40 ; Avagraha # Lo BHAIKSUKI SIGN AVAGRAHA + +# ================================================ + +# Indic_Syllabic_Category=Nukta + +# Nukta (diacritic for borrowed consonants or other consonant +# modifications). Note that while the resulting sound is typically a +# consonant, the base letter a nukta follows may be an independent +# vowel. For example, is used to transcribe ARABIC LETTER +# AIN. 
+ +# [Not derivable] + +093C ; Nukta # Mn DEVANAGARI SIGN NUKTA +09BC ; Nukta # Mn BENGALI SIGN NUKTA +0A3C ; Nukta # Mn GURMUKHI SIGN NUKTA +0ABC ; Nukta # Mn GUJARATI SIGN NUKTA +0AFD..0AFF ; Nukta # Mn [3] GUJARATI SIGN THREE-DOT NUKTA ABOVE..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0C3C ; Nukta # Mn TELUGU SIGN NUKTA +0CBC ; Nukta # Mn KANNADA SIGN NUKTA +0F39 ; Nukta # Mn TIBETAN MARK TSA -PHRU +1B34 ; Nukta # Mn BALINESE SIGN REREKAN +1BE6 ; Nukta # Mn BATAK SIGN TOMPI +1C37 ; Nukta # Mn LEPCHA SIGN NUKTA +A9B3 ; Nukta # Mn JAVANESE SIGN CECAK TELU +10A38..10A3A ; Nukta # Mn [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW +110BA ; Nukta # Mn KAITHI SIGN NUKTA +11173 ; Nukta # Mn MAHAJANI SIGN NUKTA +111CA ; Nukta # Mn SHARADA SIGN NUKTA +11236 ; Nukta # Mn KHOJKI SIGN NUKTA +112E9 ; Nukta # Mn KHUDAWADI SIGN NUKTA +1133B..1133C ; Nukta # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +11446 ; Nukta # Mn NEWA SIGN NUKTA +114C3 ; Nukta # Mn TIRHUTA SIGN NUKTA +115C0 ; Nukta # Mn SIDDHAM SIGN NUKTA +116B7 ; Nukta # Mn TAKRI SIGN NUKTA +1183A ; Nukta # Mn DOGRA SIGN NUKTA +11943 ; Nukta # Mn DIVES AKURU SIGN NUKTA +11D42 ; Nukta # Mn MASARAM GONDI SIGN NUKTA + +# ================================================ + +# Indic_Syllabic_Category=Virama + +# Virama (killing of inherent vowel in consonant sequence +# or consonant stacker) +# Only includes characters that can act both as visible killer viramas +# and consonant stackers. Separate property values exist for characters +# that can only act as pure killers or only as consonant stackers. 
+ +# [Derivation: (ccc=9) - (InSC=Pure_Killer) - (InSC=Invisible_Stacker) +# - (InSC=Number_Joiner) - 2D7F] + +094D ; Virama # Mn DEVANAGARI SIGN VIRAMA +09CD ; Virama # Mn BENGALI SIGN VIRAMA +0A4D ; Virama # Mn GURMUKHI SIGN VIRAMA +0ACD ; Virama # Mn GUJARATI SIGN VIRAMA +0B4D ; Virama # Mn ORIYA SIGN VIRAMA +0BCD ; Virama # Mn TAMIL SIGN VIRAMA +0C4D ; Virama # Mn TELUGU SIGN VIRAMA +0CCD ; Virama # Mn KANNADA SIGN VIRAMA +0D4D ; Virama # Mn MALAYALAM SIGN VIRAMA +0DCA ; Virama # Mn SINHALA SIGN AL-LAKUNA +1B44 ; Virama # Mc BALINESE ADEG ADEG +A806 ; Virama # Mn SYLOTI NAGRI SIGN HASANTA +A8C4 ; Virama # Mn SAURASHTRA SIGN VIRAMA +A9C0 ; Virama # Mc JAVANESE PANGKON +11046 ; Virama # Mn BRAHMI VIRAMA +110B9 ; Virama # Mn KAITHI SIGN VIRAMA +111C0 ; Virama # Mc SHARADA SIGN VIRAMA +11235 ; Virama # Mc KHOJKI SIGN VIRAMA +1134D ; Virama # Mc GRANTHA SIGN VIRAMA +11442 ; Virama # Mn NEWA SIGN VIRAMA +114C2 ; Virama # Mn TIRHUTA SIGN VIRAMA +115BF ; Virama # Mn SIDDHAM SIGN VIRAMA +1163F ; Virama # Mn MODI SIGN VIRAMA +116B6 ; Virama # Mc TAKRI SIGN VIRAMA +11839 ; Virama # Mn DOGRA SIGN VIRAMA +119E0 ; Virama # Mn NANDINAGARI SIGN VIRAMA +11C3F ; Virama # Mn BHAIKSUKI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Pure_Killer + +# Pure killer (killing of inherent vowel in consonant sequence, +# with no consonant stacking behavior) + +# [Not derivable] + +0D3B..0D3C ; Pure_Killer # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0E3A ; Pure_Killer # Mn THAI CHARACTER PHINTHU +0E4E ; Pure_Killer # Mn THAI CHARACTER YAMAKKAN +0EBA ; Pure_Killer # Mn LAO SIGN PALI VIRAMA +0F84 ; Pure_Killer # Mn TIBETAN MARK HALANTA +103A ; Pure_Killer # Mn MYANMAR SIGN ASAT +1714 ; Pure_Killer # Mn TAGALOG SIGN VIRAMA +1715 ; Pure_Killer # Mc TAGALOG SIGN PAMUDPOD +1734 ; Pure_Killer # Mc HANUNOO SIGN PAMUDPOD +17D1 ; Pure_Killer # Mn KHMER SIGN VIRIAM +1A7A ; Pure_Killer # Mn TAI THAM SIGN RA HAAM +1BAA ; 
Pure_Killer # Mc SUNDANESE SIGN PAMAAEH +1BF2..1BF3 ; Pure_Killer # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +A82C ; Pure_Killer # Mn SYLOTI NAGRI SIGN ALTERNATE HASANTA +A953 ; Pure_Killer # Mc REJANG VIRAMA +ABED ; Pure_Killer # Mn MEETEI MAYEK APUN IYEK +11070 ; Pure_Killer # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11134 ; Pure_Killer # Mn CHAKMA MAAYYAA +112EA ; Pure_Killer # Mn KHUDAWADI SIGN VIRAMA +1172B ; Pure_Killer # Mn AHOM SIGN KILLER +1193D ; Pure_Killer # Mc DIVES AKURU SIGN HALANTA +11A34 ; Pure_Killer # Mn ZANABAZAR SQUARE SIGN VIRAMA +11D44 ; Pure_Killer # Mn MASARAM GONDI SIGN HALANTA +11F41 ; Pure_Killer # Mc KAWI SIGN KILLER + +# ================================================ + +# Indic_Syllabic_Category=Invisible_Stacker + +# Invisible stacker (invisible consonant stacker virama). +# +# Note that in some scripts, such as Kharoshthi and Masaram Gondi, an invisible +# stacker may have a second function, changing the shape and/or location of the +# consonant preceding it, even when there is no consonant following the +# invisible stacker. 
+ +# [Not derivable] + +1039 ; Invisible_Stacker # Mn MYANMAR SIGN VIRAMA +17D2 ; Invisible_Stacker # Mn KHMER SIGN COENG +1A60 ; Invisible_Stacker # Mn TAI THAM SIGN SAKOT +1BAB ; Invisible_Stacker # Mn SUNDANESE SIGN VIRAMA +AAF6 ; Invisible_Stacker # Mn MEETEI MAYEK VIRAMA +10A3F ; Invisible_Stacker # Mn KHAROSHTHI VIRAMA +11133 ; Invisible_Stacker # Mn CHAKMA VIRAMA +1193E ; Invisible_Stacker # Mn DIVES AKURU VIRAMA +11A47 ; Invisible_Stacker # Mn ZANABAZAR SQUARE SUBJOINER +11A99 ; Invisible_Stacker # Mn SOYOMBO SUBJOINER +11D45 ; Invisible_Stacker # Mn MASARAM GONDI VIRAMA +11D97 ; Invisible_Stacker # Mn GUNJALA GONDI VIRAMA +11F42 ; Invisible_Stacker # Mn KAWI CONJOINER + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Independent + +# Independent Vowels (contrasted with matras) + +# [Not derivable] + +0904..0914 ; Vowel_Independent # Lo [17] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER AU +0960..0961 ; Vowel_Independent # Lo [2] DEVANAGARI LETTER VOCALIC RR..DEVANAGARI LETTER VOCALIC LL +0972..0977 ; Vowel_Independent # Lo [6] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER UUE +0985..098C ; Vowel_Independent # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L +098F..0990 ; Vowel_Independent # Lo [2] BENGALI LETTER E..BENGALI LETTER AI +0993..0994 ; Vowel_Independent # Lo [2] BENGALI LETTER O..BENGALI LETTER AU +09E0..09E1 ; Vowel_Independent # Lo [2] BENGALI LETTER VOCALIC RR..BENGALI LETTER VOCALIC LL +0A05..0A0A ; Vowel_Independent # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU +0A0F..0A10 ; Vowel_Independent # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI +0A13..0A14 ; Vowel_Independent # Lo [2] GURMUKHI LETTER OO..GURMUKHI LETTER AU +0A85..0A8D ; Vowel_Independent # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E +0A8F..0A91 ; Vowel_Independent # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O +0A93..0A94 ; Vowel_Independent # Lo [2] GUJARATI LETTER O..GUJARATI LETTER AU +0AE0..0AE1 ; Vowel_Independent # Lo [2] 
GUJARATI LETTER VOCALIC RR..GUJARATI LETTER VOCALIC LL +0B05..0B0C ; Vowel_Independent # Lo [8] ORIYA LETTER A..ORIYA LETTER VOCALIC L +0B0F..0B10 ; Vowel_Independent # Lo [2] ORIYA LETTER E..ORIYA LETTER AI +0B13..0B14 ; Vowel_Independent # Lo [2] ORIYA LETTER O..ORIYA LETTER AU +0B60..0B61 ; Vowel_Independent # Lo [2] ORIYA LETTER VOCALIC RR..ORIYA LETTER VOCALIC LL +0B85..0B8A ; Vowel_Independent # Lo [6] TAMIL LETTER A..TAMIL LETTER UU +0B8E..0B90 ; Vowel_Independent # Lo [3] TAMIL LETTER E..TAMIL LETTER AI +0B92..0B94 ; Vowel_Independent # Lo [3] TAMIL LETTER O..TAMIL LETTER AU +0C05..0C0C ; Vowel_Independent # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L +0C0E..0C10 ; Vowel_Independent # Lo [3] TELUGU LETTER E..TELUGU LETTER AI +0C12..0C14 ; Vowel_Independent # Lo [3] TELUGU LETTER O..TELUGU LETTER AU +0C60..0C61 ; Vowel_Independent # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL +0C85..0C8C ; Vowel_Independent # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L +0C8E..0C90 ; Vowel_Independent # Lo [3] KANNADA LETTER E..KANNADA LETTER AI +0C92..0C94 ; Vowel_Independent # Lo [3] KANNADA LETTER O..KANNADA LETTER AU +0CE0..0CE1 ; Vowel_Independent # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL +0D05..0D0C ; Vowel_Independent # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L +0D0E..0D10 ; Vowel_Independent # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI +0D12..0D14 ; Vowel_Independent # Lo [3] MALAYALAM LETTER O..MALAYALAM LETTER AU +0D5F..0D61 ; Vowel_Independent # Lo [3] MALAYALAM LETTER ARCHAIC II..MALAYALAM LETTER VOCALIC LL +0D85..0D96 ; Vowel_Independent # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA +1021..102A ; Vowel_Independent # Lo [10] MYANMAR LETTER A..MYANMAR LETTER AU +1052..1055 ; Vowel_Independent # Lo [4] MYANMAR LETTER VOCALIC R..MYANMAR LETTER VOCALIC LL +1700..1702 ; Vowel_Independent # Lo [3] TAGALOG LETTER A..TAGALOG LETTER U +1720..1722 ; Vowel_Independent # Lo [3] HANUNOO LETTER A..HANUNOO 
LETTER U +1740..1742 ; Vowel_Independent # Lo [3] BUHID LETTER A..BUHID LETTER U +1760..1762 ; Vowel_Independent # Lo [3] TAGBANWA LETTER A..TAGBANWA LETTER U +17A3..17B3 ; Vowel_Independent # Lo [17] KHMER INDEPENDENT VOWEL QAQ..KHMER INDEPENDENT VOWEL QAU +1A4D..1A52 ; Vowel_Independent # Lo [6] TAI THAM LETTER I..TAI THAM LETTER OO +1B05..1B12 ; Vowel_Independent # Lo [14] BALINESE LETTER AKARA..BALINESE LETTER OKARA TEDUNG +1B83..1B89 ; Vowel_Independent # Lo [7] SUNDANESE LETTER A..SUNDANESE LETTER EU +1BE4..1BE5 ; Vowel_Independent # Lo [2] BATAK LETTER I..BATAK LETTER U +A800..A801 ; Vowel_Independent # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I +A803..A805 ; Vowel_Independent # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O +A882..A891 ; Vowel_Independent # Lo [16] SAURASHTRA LETTER A..SAURASHTRA LETTER AU +A8FE ; Vowel_Independent # Lo DEVANAGARI LETTER AY +A984..A988 ; Vowel_Independent # Lo [5] JAVANESE LETTER A..JAVANESE LETTER U +A98C..A98E ; Vowel_Independent # Lo [3] JAVANESE LETTER E..JAVANESE LETTER O +AA00..AA05 ; Vowel_Independent # Lo [6] CHAM LETTER A..CHAM LETTER O +AAE0..AAE1 ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER E..MEETEI MAYEK LETTER O +ABCE..ABCF ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER UN..MEETEI MAYEK LETTER I +ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA +11005..11012 ; Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU +11071..11072 ; Vowel_Independent # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER A..KAITHI LETTER AU +11103..11106 ; Vowel_Independent # Lo [4] CHAKMA LETTER AA..CHAKMA LETTER E +11183..11190 ; Vowel_Independent # Lo [14] SHARADA LETTER A..SHARADA LETTER AU +11200..11207 ; Vowel_Independent # Lo [8] KHOJKI LETTER A..KHOJKI LETTER AU +11240 ; Vowel_Independent # Lo KHOJKI LETTER SHORT I +11280..11283 ; Vowel_Independent # Lo [4] MULTANI LETTER A..MULTANI LETTER E +112B0..112B9 ; 
Vowel_Independent # Lo [10] KHUDAWADI LETTER A..KHUDAWADI LETTER AU +11305..1130C ; Vowel_Independent # Lo [8] GRANTHA LETTER A..GRANTHA LETTER VOCALIC L +1130F..11310 ; Vowel_Independent # Lo [2] GRANTHA LETTER EE..GRANTHA LETTER AI +11313..11314 ; Vowel_Independent # Lo [2] GRANTHA LETTER OO..GRANTHA LETTER AU +11360..11361 ; Vowel_Independent # Lo [2] GRANTHA LETTER VOCALIC RR..GRANTHA LETTER VOCALIC LL +11400..1140D ; Vowel_Independent # Lo [14] NEWA LETTER A..NEWA LETTER AU +11481..1148E ; Vowel_Independent # Lo [14] TIRHUTA LETTER A..TIRHUTA LETTER AU +11580..1158D ; Vowel_Independent # Lo [14] SIDDHAM LETTER A..SIDDHAM LETTER AU +115D8..115DB ; Vowel_Independent # Lo [4] SIDDHAM LETTER THREE-CIRCLE ALTERNATE I..SIDDHAM LETTER ALTERNATE U +11600..1160D ; Vowel_Independent # Lo [14] MODI LETTER A..MODI LETTER AU +11680..11689 ; Vowel_Independent # Lo [10] TAKRI LETTER A..TAKRI LETTER AU +11800..11809 ; Vowel_Independent # Lo [10] DOGRA LETTER A..DOGRA LETTER AU +11900..11906 ; Vowel_Independent # Lo [7] DIVES AKURU LETTER A..DIVES AKURU LETTER E +11909 ; Vowel_Independent # Lo DIVES AKURU LETTER O +119A0..119A7 ; Vowel_Independent # Lo [8] NANDINAGARI LETTER A..NANDINAGARI LETTER VOCALIC RR +119AA..119AD ; Vowel_Independent # Lo [4] NANDINAGARI LETTER E..NANDINAGARI LETTER AU +11A00 ; Vowel_Independent # Lo ZANABAZAR SQUARE LETTER A +11A50 ; Vowel_Independent # Lo SOYOMBO LETTER A +11C00..11C08 ; Vowel_Independent # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L +11C0A..11C0D ; Vowel_Independent # Lo [4] BHAIKSUKI LETTER E..BHAIKSUKI LETTER AU +11D00..11D06 ; Vowel_Independent # Lo [7] MASARAM GONDI LETTER A..MASARAM GONDI LETTER E +11D08..11D09 ; Vowel_Independent # Lo [2] MASARAM GONDI LETTER AI..MASARAM GONDI LETTER O +11D0B ; Vowel_Independent # Lo MASARAM GONDI LETTER AU +11D60..11D65 ; Vowel_Independent # Lo [6] GUNJALA GONDI LETTER A..GUNJALA GONDI LETTER UU +11D67..11D68 ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER EE..GUNJALA GONDI LETTER 
AI +11D6A..11D6B ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER OO..GUNJALA GONDI LETTER AU +11F04..11F10 ; Vowel_Independent # Lo [13] KAWI LETTER A..KAWI LETTER O + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Dependent + +# Dependent Vowels (contrasted with independent vowels and/or with +# complex placement). Known as matras in Indic scripts. Also +# includes vowel modifiers that follow dependent (and sometimes +# independent) vowels. + +# [Not derivable] + +093A ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN OE +093B ; Vowel_Dependent # Mc DEVANAGARI VOWEL SIGN OOE +093E..0940 ; Vowel_Dependent # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II +0941..0948 ; Vowel_Dependent # Mn [8] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN AI +0949..094C ; Vowel_Dependent # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094E..094F ; Vowel_Dependent # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA E..DEVANAGARI VOWEL SIGN AW +0955..0957 ; Vowel_Dependent # Mn [3] DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Vowel_Dependent # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BE..09C0 ; Vowel_Dependent # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II +09C1..09C4 ; Vowel_Dependent # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09C7..09C8 ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +09CB..09CC ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +09D7 ; Vowel_Dependent # Mc BENGALI AU LENGTH MARK +09E2..09E3 ; Vowel_Dependent # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3E..0A40 ; Vowel_Dependent # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II +0A41..0A42 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A47..0A48 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Vowel_Dependent # Mn [2] 
GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0ABE..0AC0 ; Vowel_Dependent # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL SIGN II +0AC1..0AC5 ; Vowel_Dependent # Mn [5] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AC9 ; Vowel_Dependent # Mc GUJARATI VOWEL SIGN CANDRA O +0ACB..0ACC ; Vowel_Dependent # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0AE2..0AE3 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3E ; Vowel_Dependent # Mc ORIYA VOWEL SIGN AA +0B3F ; Vowel_Dependent # Mn ORIYA VOWEL SIGN I +0B40 ; Vowel_Dependent # Mc ORIYA VOWEL SIGN II +0B41..0B44 ; Vowel_Dependent # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B47..0B48 ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI +0B4B..0B4C ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU +0B55..0B56 ; Vowel_Dependent # Mn [2] ORIYA SIGN OVERLINE..ORIYA AI LENGTH MARK +0B57 ; Vowel_Dependent # Mc ORIYA AU LENGTH MARK +0B62..0B63 ; Vowel_Dependent # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BBE..0BBF ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC0 ; Vowel_Dependent # Mn TAMIL VOWEL SIGN II +0BC1..0BC2 ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BC6..0BC8 ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0BCA..0BCC ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0BD7 ; Vowel_Dependent # Mc TAMIL AU LENGTH MARK +0C3E..0C40 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C41..0C44 ; Vowel_Dependent # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C46..0C48 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI +0C4A..0C4C ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C55..0C56 ; Vowel_Dependent # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK 
+0C62..0C63 ; Vowel_Dependent # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBE ; Vowel_Dependent # Mc KANNADA VOWEL SIGN AA +0CBF ; Vowel_Dependent # Mn KANNADA VOWEL SIGN I +0CC0..0CC4 ; Vowel_Dependent # Mc [5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN VOCALIC RR +0CC6 ; Vowel_Dependent # Mn KANNADA VOWEL SIGN E +0CC7..0CC8 ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +0CCC ; Vowel_Dependent # Mn KANNADA VOWEL SIGN AU +0CD5..0CD6 ; Vowel_Dependent # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CE2..0CE3 ; Vowel_Dependent # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D3E..0D40 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D44 ; Vowel_Dependent # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D46..0D48 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0D4A..0D4C ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0D57 ; Vowel_Dependent # Mc MALAYALAM AU LENGTH MARK +0D62..0D63 ; Vowel_Dependent # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DCF..0DD1 ; Vowel_Dependent # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD2..0DD4 ; Vowel_Dependent # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Vowel_Dependent # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0DD8..0DDF ; Vowel_Dependent # Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Vowel_Dependent # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Vowel_Dependent # Lo THAI CHARACTER SARA A +0E31 ; Vowel_Dependent # Mn THAI CHARACTER MAI HAN-AKAT +0E32..0E33 ; Vowel_Dependent # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E34..0E39 ; Vowel_Dependent # Mn [6] THAI CHARACTER SARA 
I..THAI CHARACTER SARA UU +0E40..0E45 ; Vowel_Dependent # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO +0E47 ; Vowel_Dependent # Mn THAI CHARACTER MAITAIKHU +0EB0 ; Vowel_Dependent # Lo LAO VOWEL SIGN A +0EB1 ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KAN +0EB2..0EB3 ; Vowel_Dependent # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0EB4..0EB9 ; Vowel_Dependent # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU +0EBB ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KON +0EC0..0EC4 ; Vowel_Dependent # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +0F71..0F7D ; Vowel_Dependent # Mn [13] TIBETAN VOWEL SIGN AA..TIBETAN VOWEL SIGN OO +0F80..0F81 ; Vowel_Dependent # Mn [2] TIBETAN VOWEL SIGN REVERSED I..TIBETAN VOWEL SIGN REVERSED II +102B..102C ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +102D..1030 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN UU +1031 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN E +1032..1035 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +1056..1057 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1058..1059 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1062 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1071..1074 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1083..1084 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E +1085..1086 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109C ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN AITON A +109D ; Vowel_Dependent # Mn MYANMAR VOWEL SIGN AITON AI +1712..1713 ; Vowel_Dependent # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U +1732..1733 ; Vowel_Dependent # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U 
+1752..1753 ; Vowel_Dependent # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U +1772..1773 ; Vowel_Dependent # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U +17B6 ; Vowel_Dependent # Mc KHMER VOWEL SIGN AA +17B7..17BD ; Vowel_Dependent # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL SIGN UA +17BE..17C5 ; Vowel_Dependent # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU +17C8 ; Vowel_Dependent # Mc KHMER SIGN YUUKALEAPINTU +1920..1922 ; Vowel_Dependent # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U +1923..1926 ; Vowel_Dependent # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU +1927..1928 ; Vowel_Dependent # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Vowel_Dependent # Mn LIMBU SIGN KEMPHRENG +19B0..19C0 ; Vowel_Dependent # Lo [17] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN IY +1A17..1A18 ; Vowel_Dependent # Mn [2] BUGINESE VOWEL SIGN I..BUGINESE VOWEL SIGN U +1A19..1A1A ; Vowel_Dependent # Mc [2] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN O +1A1B ; Vowel_Dependent # Mn BUGINESE VOWEL SIGN AE +1A61 ; Vowel_Dependent # Mc TAI THAM VOWEL SIGN A +1A62 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN MAI SAT +1A63..1A64 ; Vowel_Dependent # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A65..1A6C ; Vowel_Dependent # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW +1A6D..1A72 ; Vowel_Dependent # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI +1A73 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN OA ABOVE +1B35 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN TEDUNG +1B36..1B3A ; Vowel_Dependent # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA +1B3B ; Vowel_Dependent # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +1B3C ; Vowel_Dependent # Mn BALINESE VOWEL SIGN LA LENGA +1B3D..1B41 ; Vowel_Dependent # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1B42 ; Vowel_Dependent # Mn BALINESE VOWEL SIGN PEPET +1B43 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN PEPET TEDUNG +1BA4..1BA5 ; 
Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PANGHULU..SUNDANESE VOWEL SIGN PANYUKU +1BA6..1BA7 ; Vowel_Dependent # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL SIGN PANOLONG +1BA8..1BA9 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE7 ; Vowel_Dependent # Mc BATAK VOWEL SIGN E +1BE8..1BE9 ; Vowel_Dependent # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BEA..1BEC ; Vowel_Dependent # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BED ; Vowel_Dependent # Mn BATAK VOWEL SIGN KARO O +1BEE ; Vowel_Dependent # Mc BATAK VOWEL SIGN U +1BEF ; Vowel_Dependent # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +1C26..1C2B ; Vowel_Dependent # Mc [6] LEPCHA VOWEL SIGN AA..LEPCHA VOWEL SIGN UU +1C2C ; Vowel_Dependent # Mn LEPCHA VOWEL SIGN E +A802 ; Vowel_Dependent # Mn SYLOTI NAGRI SIGN DVISVARA +A823..A824 ; Vowel_Dependent # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A825..A826 ; Vowel_Dependent # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E +A827 ; Vowel_Dependent # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Vowel_Dependent # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A8FF ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN AY +A947..A94E ; Vowel_Dependent # Mn [8] REJANG VOWEL SIGN I..REJANG VOWEL SIGN EA +A9B4..A9B5 ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9B6..A9B9 ; Vowel_Dependent # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BA..A9BB ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +A9BC ; Vowel_Dependent # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Vowel_Dependent # Mn MYANMAR SIGN SHAN SAW +AA29..AA2E ; Vowel_Dependent # Mn [6] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN OE +AA2F..AA30 ; Vowel_Dependent # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA31..AA32 ; Vowel_Dependent # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE +AAB0 ; Vowel_Dependent # Mn TAI VIET MAI KANG 
+AAB1 ; Vowel_Dependent # Lo TAI VIET VOWEL AA +AAB2..AAB4 ; Vowel_Dependent # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U +AAB5..AAB6 ; Vowel_Dependent # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB7..AAB8 ; Vowel_Dependent # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AAB9..AABD ; Vowel_Dependent # Lo [5] TAI VIET VOWEL UEA..TAI VIET VOWEL AN +AABE ; Vowel_Dependent # Mn TAI VIET VOWEL AM +AAEB ; Vowel_Dependent # Mc MEETEI MAYEK VOWEL SIGN II +AAEC..AAED ; Vowel_Dependent # Mn [2] MEETEI MAYEK VOWEL SIGN UU..MEETEI MAYEK VOWEL SIGN AAI +AAEE..AAEF ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN AU..MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE5 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN ANAP +ABE6..ABE7 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE8 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +10A01..10A03 ; Vowel_Dependent # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R +10A05..10A06 ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O +10A0C..10A0D ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN DOUBLE RING BELOW +11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +11073..11074 ; Vowel_Dependent # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +110B0..110B2 ; Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II +110B3..110B6 ; Vowel_Dependent # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI +110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +110C2 ; Vowel_Dependent # Mn KAITHI VOWEL SIGN VOCALIC R +11127..1112B ; Vowel_Dependent # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU +1112C ; Vowel_Dependent # Mc CHAKMA VOWEL SIGN E 
+1112D..11132 ; Vowel_Dependent # Mn [6] CHAKMA VOWEL SIGN AI..CHAKMA AU MARK +11145..11146 ; Vowel_Dependent # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +111B3..111B5 ; Vowel_Dependent # Mc [3] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN II +111B6..111BE ; Vowel_Dependent # Mn [9] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN O +111BF ; Vowel_Dependent # Mc SHARADA VOWEL SIGN AU +111CB..111CC ; Vowel_Dependent # Mn [2] SHARADA VOWEL MODIFIER MARK..SHARADA EXTRA SHORT VOWEL MARK +111CE ; Vowel_Dependent # Mc SHARADA VOWEL SIGN PRISHTHAMATRA E +1122C..1122E ; Vowel_Dependent # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +1122F..11231 ; Vowel_Dependent # Mn [3] KHOJKI VOWEL SIGN U..KHOJKI VOWEL SIGN AI +11232..11233 ; Vowel_Dependent # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU +11241 ; Vowel_Dependent # Mn KHOJKI VOWEL SIGN VOCALIC R +112E0..112E2 ; Vowel_Dependent # Mc [3] KHUDAWADI VOWEL SIGN AA..KHUDAWADI VOWEL SIGN II +112E3..112E8 ; Vowel_Dependent # Mn [6] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN AU +1133E..1133F ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11340 ; Vowel_Dependent # Mn GRANTHA VOWEL SIGN II +11341..11344 ; Vowel_Dependent # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +11347..11348 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +1134B..1134C ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +11357 ; Vowel_Dependent # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435..11437 ; Vowel_Dependent # Mc [3] NEWA VOWEL SIGN AA..NEWA VOWEL SIGN II +11438..1143F ; Vowel_Dependent # Mn [8] NEWA VOWEL SIGN U..NEWA VOWEL SIGN AI +11440..11441 ; Vowel_Dependent # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +114B0..114B2 ; Vowel_Dependent # Mc [3] TIRHUTA VOWEL SIGN AA..TIRHUTA VOWEL SIGN II +114B3..114B8 ; Vowel_Dependent # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN 
VOCALIC LL +114B9 ; Vowel_Dependent # Mc TIRHUTA VOWEL SIGN E +114BA ; Vowel_Dependent # Mn TIRHUTA VOWEL SIGN SHORT E +114BB..114BE ; Vowel_Dependent # Mc [4] TIRHUTA VOWEL SIGN AI..TIRHUTA VOWEL SIGN AU +115AF..115B1 ; Vowel_Dependent # Mc [3] SIDDHAM VOWEL SIGN AA..SIDDHAM VOWEL SIGN II +115B2..115B5 ; Vowel_Dependent # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115B8..115BB ; Vowel_Dependent # Mc [4] SIDDHAM VOWEL SIGN E..SIDDHAM VOWEL SIGN AU +115DC..115DD ; Vowel_Dependent # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11630..11632 ; Vowel_Dependent # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +11633..1163A ; Vowel_Dependent # Mn [8] MODI VOWEL SIGN U..MODI VOWEL SIGN AI +1163B..1163C ; Vowel_Dependent # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +11640 ; Vowel_Dependent # Mn MODI SIGN ARDHACANDRA +116AD ; Vowel_Dependent # Mn TAKRI VOWEL SIGN AA +116AE..116AF ; Vowel_Dependent # Mc [2] TAKRI VOWEL SIGN I..TAKRI VOWEL SIGN II +116B0..116B5 ; Vowel_Dependent # Mn [6] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN AU +11720..11721 ; Vowel_Dependent # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +11722..11725 ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN I..AHOM VOWEL SIGN UU +11726 ; Vowel_Dependent # Mc AHOM VOWEL SIGN E +11727..1172A ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN AW..AHOM VOWEL SIGN AM +1182C..1182E ; Vowel_Dependent # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II +1182F..11836 ; Vowel_Dependent # Mn [8] DOGRA VOWEL SIGN U..DOGRA VOWEL SIGN AU +11930..11935 ; Vowel_Dependent # Mc [6] DIVES AKURU VOWEL SIGN AA..DIVES AKURU VOWEL SIGN E +11937..11938 ; Vowel_Dependent # Mc [2] DIVES AKURU VOWEL SIGN AI..DIVES AKURU VOWEL SIGN O +119D1..119D3 ; Vowel_Dependent # Mc [3] NANDINAGARI VOWEL SIGN AA..NANDINAGARI VOWEL SIGN II +119D4..119D7 ; Vowel_Dependent # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR +119DA..119DB ; Vowel_Dependent # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI 
+119DC..119DD ; Vowel_Dependent # Mc [2] NANDINAGARI VOWEL SIGN O..NANDINAGARI VOWEL SIGN AU +119E4 ; Vowel_Dependent # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E +11A01..11A0A ; Vowel_Dependent # Mn [10] ZANABAZAR SQUARE VOWEL SIGN I..ZANABAZAR SQUARE VOWEL LENGTH MARK +11A51..11A56 ; Vowel_Dependent # Mn [6] SOYOMBO VOWEL SIGN I..SOYOMBO VOWEL SIGN OE +11A57..11A58 ; Vowel_Dependent # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A59..11A5B ; Vowel_Dependent # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11C2F ; Vowel_Dependent # Mc BHAIKSUKI VOWEL SIGN AA +11C30..11C36 ; Vowel_Dependent # Mn [7] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN VOCALIC L +11C38..11C3B ; Vowel_Dependent # Mn [4] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI VOWEL SIGN AU +11CB0 ; Vowel_Dependent # Mn MARCHEN VOWEL SIGN AA +11CB1 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN I +11CB2..11CB3 ; Vowel_Dependent # Mn [2] MARCHEN VOWEL SIGN U..MARCHEN VOWEL SIGN E +11CB4 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN O +11D31..11D36 ; Vowel_Dependent # Mn [6] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN VOCALIC R +11D3A ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Vowel_Dependent # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN AU +11D43 ; Vowel_Dependent # Mn MASARAM GONDI SIGN CANDRA +11D8A..11D8E ; Vowel_Dependent # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D90..11D91 ; Vowel_Dependent # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI +11D93..11D94 ; Vowel_Dependent # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11EF3..11EF4 ; Vowel_Dependent # Mn [2] MAKASAR VOWEL SIGN I..MAKASAR VOWEL SIGN U +11EF5..11EF6 ; Vowel_Dependent # Mc [2] MAKASAR VOWEL SIGN E..MAKASAR VOWEL SIGN O +11F34..11F35 ; Vowel_Dependent # Mc [2] KAWI VOWEL SIGN AA..KAWI VOWEL SIGN ALTERNATE AA +11F36..11F3A ; Vowel_Dependent # Mn [5] KAWI VOWEL SIGN 
I..KAWI VOWEL SIGN VOCALIC R +11F3E..11F3F ; Vowel_Dependent # Mc [2] KAWI VOWEL SIGN E..KAWI VOWEL SIGN AI +11F40 ; Vowel_Dependent # Mn KAWI VOWEL SIGN EU + +# ================================================ + +# Indic_Syllabic_Category=Vowel + +# (Other) Vowels (reanalyzed as ordinary alphabetic letters or marks) + +# [Not derivable] + +1963..196D ; Vowel # Lo [11] TAI LE LETTER A..TAI LE LETTER AI +A85E..A861 ; Vowel # Lo [4] PHAGS-PA LETTER I..PHAGS-PA LETTER O +A866 ; Vowel # Lo PHAGS-PA LETTER EE +A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO +A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O +11150..11154 ; Vowel # Lo [5] MAHAJANI LETTER A..MAHAJANI LETTER O + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Placeholder + +# Consonant Placeholder +# This includes generic placeholders used for +# Indic script layout (NBSP and dotted circle), as well as a few script- +# specific vowel-holder characters which are not technically +# consonants, but serve instead as bases for placement of vowel marks. 
+ +# [Not derivable] + +002D ; Consonant_Placeholder # Pd HYPHEN-MINUS +00A0 ; Consonant_Placeholder # Zs NO-BREAK SPACE +00D7 ; Consonant_Placeholder # Sm MULTIPLICATION SIGN +0980 ; Consonant_Placeholder # Lo BENGALI ANJI +0A72..0A73 ; Consonant_Placeholder # Lo [2] GURMUKHI IRI..GURMUKHI URA +104B ; Consonant_Placeholder # Po MYANMAR SIGN SECTION +104E ; Consonant_Placeholder # Po MYANMAR SYMBOL AFOREMENTIONED +1900 ; Consonant_Placeholder # Lo LIMBU VOWEL-CARRIER LETTER +1CFA ; Consonant_Placeholder # Lo VEDIC SIGN DOUBLE ANUSVARA ANTARGOMUKHA +2010..2014 ; Consonant_Placeholder # Pd [5] HYPHEN..EM DASH +25CC ; Consonant_Placeholder # So DOTTED CIRCLE +AA74..AA76 ; Consonant_Placeholder # Lo [3] MYANMAR LOGOGRAM KHAMTI OAY..MYANMAR LOGOGRAM KHAMTI HM +11A3F ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL HEAD MARK +11A45 ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL DOUBLE-LINED HEAD MARK +11EF2 ; Consonant_Placeholder # Lo MAKASAR ANGKA + +# ================================================ + +# Indic_Syllabic_Category=Consonant + +# Consonant (ordinary abugida consonants, with inherent vowels) + +# [Not derivable] + +0915..0939 ; Consonant # Lo [37] DEVANAGARI LETTER KA..DEVANAGARI LETTER HA +0958..095F ; Consonant # Lo [8] DEVANAGARI LETTER QA..DEVANAGARI LETTER YYA +0978..097F ; Consonant # Lo [8] DEVANAGARI LETTER MARWARI DDA..DEVANAGARI LETTER BBA +0995..09A8 ; Consonant # Lo [20] BENGALI LETTER KA..BENGALI LETTER NA +09AA..09B0 ; Consonant # Lo [7] BENGALI LETTER PA..BENGALI LETTER RA +09B2 ; Consonant # Lo BENGALI LETTER LA +09B6..09B9 ; Consonant # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA +09DC..09DD ; Consonant # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA +09DF ; Consonant # Lo BENGALI LETTER YYA +09F0..09F1 ; Consonant # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH LOWER DIAGONAL +0A15..0A28 ; Consonant # Lo [20] GURMUKHI LETTER KA..GURMUKHI LETTER NA +0A2A..0A30 ; Consonant # Lo [7] GURMUKHI LETTER 
PA..GURMUKHI LETTER RA +0A32..0A33 ; Consonant # Lo [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA +0A35..0A36 ; Consonant # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA +0A38..0A39 ; Consonant # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA +0A59..0A5C ; Consonant # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA +0A5E ; Consonant # Lo GURMUKHI LETTER FA +0A95..0AA8 ; Consonant # Lo [20] GUJARATI LETTER KA..GUJARATI LETTER NA +0AAA..0AB0 ; Consonant # Lo [7] GUJARATI LETTER PA..GUJARATI LETTER RA +0AB2..0AB3 ; Consonant # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA +0AB5..0AB9 ; Consonant # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA +0AF9 ; Consonant # Lo GUJARATI LETTER ZHA +0B15..0B28 ; Consonant # Lo [20] ORIYA LETTER KA..ORIYA LETTER NA +0B2A..0B30 ; Consonant # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA +0B32..0B33 ; Consonant # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA +0B35..0B39 ; Consonant # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA +0B5C..0B5D ; Consonant # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA +0B5F ; Consonant # Lo ORIYA LETTER YYA +0B71 ; Consonant # Lo ORIYA LETTER WA +0B95 ; Consonant # Lo TAMIL LETTER KA +0B99..0B9A ; Consonant # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA +0B9C ; Consonant # Lo TAMIL LETTER JA +0B9E..0B9F ; Consonant # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA +0BA3..0BA4 ; Consonant # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA +0BA8..0BAA ; Consonant # Lo [3] TAMIL LETTER NA..TAMIL LETTER PA +0BAE..0BB9 ; Consonant # Lo [12] TAMIL LETTER MA..TAMIL LETTER HA +0C15..0C28 ; Consonant # Lo [20] TELUGU LETTER KA..TELUGU LETTER NA +0C2A..0C39 ; Consonant # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C58..0C5A ; Consonant # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C95..0CA8 ; Consonant # Lo [20] KANNADA LETTER KA..KANNADA LETTER NA +0CAA..0CB3 ; Consonant # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA +0CB5..0CB9 ; Consonant # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA +0CDE ; Consonant # Lo KANNADA LETTER FA +0D15..0D3A ; 
Consonant # Lo [38] MALAYALAM LETTER KA..MALAYALAM LETTER TTTA +0D9A..0DB1 ; Consonant # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA +0DB3..0DBB ; Consonant # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA +0DBD ; Consonant # Lo SINHALA LETTER DANTAJA LAYANNA +0DC0..0DC6 ; Consonant # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA +0E01..0E2E ; Consonant # Lo [46] THAI CHARACTER KO KAI..THAI CHARACTER HO NOKHUK +0E81..0E82 ; Consonant # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG +0E84 ; Consonant # Lo LAO LETTER KHO TAM +0E86..0E8A ; Consonant # Lo [5] LAO LETTER PALI GHA..LAO LETTER SO TAM +0E8C..0EA3 ; Consonant # Lo [24] LAO LETTER PALI JHA..LAO LETTER LO LING +0EA5 ; Consonant # Lo LAO LETTER LO LOOT +0EA7..0EAE ; Consonant # Lo [8] LAO LETTER WO..LAO LETTER HO TAM +0EDC..0EDF ; Consonant # Lo [4] LAO HO NO..LAO LETTER KHMU NYO +0F40..0F47 ; Consonant # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA +0F49..0F6C ; Consonant # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA +1000..1020 ; Consonant # Lo [33] MYANMAR LETTER KA..MYANMAR LETTER LLA +103F ; Consonant # Lo MYANMAR LETTER GREAT SA +1050..1051 ; Consonant # Lo [2] MYANMAR LETTER SHA..MYANMAR LETTER SSA +105A..105D ; Consonant # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE +1061 ; Consonant # Lo MYANMAR LETTER SGAW KAREN SHA +1065..1066 ; Consonant # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER WESTERN PWO KAREN PWA +106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA +1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA +108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA +1703..1711 ; Consonant # Lo [15] TAGALOG LETTER KA..TAGALOG LETTER HA +171F ; Consonant # Lo TAGALOG LETTER ARCHAIC RA +1723..1731 ; Consonant # Lo [15] HANUNOO LETTER KA..HANUNOO LETTER HA +1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA +1763..176C ; Consonant # 
Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA +176E..1770 ; Consonant # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA +1780..17A2 ; Consonant # Lo [35] KHMER LETTER KA..KHMER LETTER QA +1901..191E ; Consonant # Lo [30] LIMBU LETTER KA..LIMBU LETTER TRA +1950..1962 ; Consonant # Lo [19] TAI LE LETTER KA..TAI LE LETTER NA +1980..19AB ; Consonant # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI LUE LETTER LOW SUA +1A00..1A16 ; Consonant # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA +1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA +1A53..1A54 ; Consonant # Lo [2] TAI THAM LETTER LAE..TAI THAM LETTER GREAT SA +1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA +1B45..1B4C ; Consonant # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA +1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA +1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA +1BBB..1BBD ; Consonant # Lo [3] SUNDANESE LETTER REU..SUNDANESE LETTER BHA +1BC0..1BE3 ; Consonant # Lo [36] BATAK LETTER A..BATAK LETTER MBA +1C00..1C23 ; Consonant # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A +1C4D..1C4F ; Consonant # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA +A807..A80A ; Consonant # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO +A80C..A822 ; Consonant # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO +A840..A85D ; Consonant # Lo [30] PHAGS-PA LETTER KA..PHAGS-PA LETTER A +A862..A865 ; Consonant # Lo [4] PHAGS-PA LETTER QA..PHAGS-PA LETTER GGA +A869..A870 ; Consonant # Lo [8] PHAGS-PA LETTER TTA..PHAGS-PA LETTER ASPIRATED FA +A872 ; Consonant # Lo PHAGS-PA SUPERFIXED LETTER RA +A892..A8B3 ; Consonant # Lo [34] SAURASHTRA LETTER KA..SAURASHTRA LETTER LLA +A90A..A921 ; Consonant # Lo [24] KAYAH LI LETTER KA..KAYAH LI LETTER CA +A930..A946 ; Consonant # Lo [23] REJANG LETTER KA..REJANG LETTER A +A989..A98B ; Consonant # Lo [3] JAVANESE LETTER PA CEREK..JAVANESE LETTER NGA LELET RASWADI 
+A98F..A9B2 ; Consonant # Lo [36] JAVANESE LETTER KA..JAVANESE LETTER HA +A9E0..A9E4 ; Consonant # Lo [5] MYANMAR LETTER SHAN GHA..MYANMAR LETTER SHAN BHA +A9E7..A9EF ; Consonant # Lo [9] MYANMAR LETTER TAI LAING NYA..MYANMAR LETTER TAI LAING NNA +A9FA..A9FE ; Consonant # Lo [5] MYANMAR LETTER TAI LAING LLA..MYANMAR LETTER TAI LAING BHA +AA06..AA28 ; Consonant # Lo [35] CHAM LETTER KA..CHAM LETTER HA +AA60..AA6F ; Consonant # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA +AA71..AA73 ; Consonant # Lo [3] MYANMAR LETTER KHAMTI XA..MYANMAR LETTER KHAMTI RA +AA7A ; Consonant # Lo MYANMAR LETTER AITON RA +AA7E..AA7F ; Consonant # Lo [2] MYANMAR LETTER SHWE PALAUNG CHA..MYANMAR LETTER SHWE PALAUNG SHA +AA80..AAAF ; Consonant # Lo [48] TAI VIET LETTER LOW KO..TAI VIET LETTER HIGH O +AAE2..AAEA ; Consonant # Lo [9] MEETEI MAYEK LETTER CHA..MEETEI MAYEK LETTER SSA +ABC0..ABCD ; Consonant # Lo [14] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER HUK +ABD0 ; Consonant # Lo MEETEI MAYEK LETTER PHAM +ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTER BHAM +10A00 ; Consonant # Lo KHAROSHTHI LETTER A +10A10..10A13 ; Consonant # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA +10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA +10A19..10A35 ; Consonant # Lo [29] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER VHA +11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER OLD TAMIL NNNA +11075 ; Consonant # Lo BRAHMI LETTER OLD TAMIL LLA +1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA +11107..11126 ; Consonant # Lo [32] CHAKMA LETTER KAA..CHAKMA LETTER HAA +11144 ; Consonant # Lo CHAKMA LETTER LHAA +11147 ; Consonant # Lo CHAKMA LETTER VAA +11155..11172 ; Consonant # Lo [30] MAHAJANI LETTER KA..MAHAJANI LETTER RRA +11191..111B2 ; Consonant # Lo [34] SHARADA LETTER KA..SHARADA LETTER HA +11208..11211 ; Consonant # Lo [10] KHOJKI LETTER KA..KHOJKI LETTER JJA +11213..1122B ; Consonant # Lo [25] 
KHOJKI LETTER NYA..KHOJKI LETTER LLA +1123F ; Consonant # Lo KHOJKI LETTER QA +11284..11286 ; Consonant # Lo [3] MULTANI LETTER KA..MULTANI LETTER GA +11288 ; Consonant # Lo MULTANI LETTER GHA +1128A..1128D ; Consonant # Lo [4] MULTANI LETTER CA..MULTANI LETTER JJA +1128F..1129D ; Consonant # Lo [15] MULTANI LETTER NYA..MULTANI LETTER BA +1129F..112A8 ; Consonant # Lo [10] MULTANI LETTER BHA..MULTANI LETTER RHA +112BA..112DE ; Consonant # Lo [37] KHUDAWADI LETTER KA..KHUDAWADI LETTER HA +11315..11328 ; Consonant # Lo [20] GRANTHA LETTER KA..GRANTHA LETTER NA +1132A..11330 ; Consonant # Lo [7] GRANTHA LETTER PA..GRANTHA LETTER RA +11332..11333 ; Consonant # Lo [2] GRANTHA LETTER LA..GRANTHA LETTER LLA +11335..11339 ; Consonant # Lo [5] GRANTHA LETTER VA..GRANTHA LETTER HA +1140E..11434 ; Consonant # Lo [39] NEWA LETTER KA..NEWA LETTER HA +1148F..114AF ; Consonant # Lo [33] TIRHUTA LETTER KA..TIRHUTA LETTER HA +1158E..115AE ; Consonant # Lo [33] SIDDHAM LETTER KA..SIDDHAM LETTER HA +1160E..1162F ; Consonant # Lo [34] MODI LETTER KA..MODI LETTER LLA +1168A..116AA ; Consonant # Lo [33] TAKRI LETTER KA..TAKRI LETTER RRA +116B8 ; Consonant # Lo TAKRI LETTER ARCHAIC KHA +11700..1171A ; Consonant # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA +11740..11746 ; Consonant # Lo [7] AHOM LETTER CA..AHOM LETTER LLA +1180A..1182B ; Consonant # Lo [34] DOGRA LETTER KA..DOGRA LETTER RRA +1190C..11913 ; Consonant # Lo [8] DIVES AKURU LETTER KA..DIVES AKURU LETTER JA +11915..11916 ; Consonant # Lo [2] DIVES AKURU LETTER NYA..DIVES AKURU LETTER TTA +11918..1192F ; Consonant # Lo [24] DIVES AKURU LETTER DDA..DIVES AKURU LETTER ZA +119AE..119D0 ; Consonant # Lo [35] NANDINAGARI LETTER KA..NANDINAGARI LETTER RRA +11A0B..11A32 ; Consonant # Lo [40] ZANABAZAR SQUARE LETTER KA..ZANABAZAR SQUARE LETTER KSSA +11A5C..11A83 ; Consonant # Lo [40] SOYOMBO LETTER KA..SOYOMBO LETTER KSSA +11C0E..11C2E ; Consonant # Lo [33] BHAIKSUKI LETTER KA..BHAIKSUKI LETTER HA +11C72..11C8F ; Consonant # Lo 
[30] MARCHEN LETTER KA..MARCHEN LETTER A +11D0C..11D30 ; Consonant # Lo [37] MASARAM GONDI LETTER KA..MASARAM GONDI LETTER TRA +11D6C..11D89 ; Consonant # Lo [30] GUNJALA GONDI LETTER YA..GUNJALA GONDI LETTER SA +11EE0..11EF1 ; Consonant # Lo [18] MAKASAR LETTER KA..MAKASAR LETTER A +11F12..11F33 ; Consonant # Lo [34] KAWI LETTER KA..KAWI LETTER JNYA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Dead + +# Dead Consonant (special consonant with killed vowel) + +# [Not derivable] + +09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0C5D ; Consonant_Dead # Lo TELUGU LETTER NAKAARA POLLU +0CDD ; Consonant_Dead # Lo KANNADA LETTER NAKAARA POLLU +0D54..0D56 ; Consonant_Dead # Lo [3] MALAYALAM LETTER CHILLU M..MALAYALAM LETTER CHILLU LLL +0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K +1CF2..1CF3 ; Consonant_Dead # Lo [2] VEDIC SIGN ARDHAVISARGA..VEDIC SIGN ROTATED ARDHAVISARGA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_With_Stacker + +# Consonants that may make stacked ligatures with the next consonant +# without the use of a virama + +# [Not derivable] + +0CF1..0CF2 ; Consonant_With_Stacker # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA +1CF5..1CF6 ; Consonant_With_Stacker # Lo [2] VEDIC SIGN JIHVAMULIYA..VEDIC SIGN UPADHMANIYA +11003..11004 ; Consonant_With_Stacker # Lo [2] BRAHMI SIGN JIHVAMULIYA..BRAHMI SIGN UPADHMANIYA +11460..11461 ; Consonant_With_Stacker # Lo [2] NEWA SIGN JIHVAMULIYA..NEWA SIGN UPADHMANIYA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Prefixed + +# Cluster-initial consonants + +# [Not derivable] + +111C2..111C3 ; Consonant_Prefixed # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA +1193F ; Consonant_Prefixed # Lo DIVES AKURU PREFIXED NASAL SIGN +11A3A ; Consonant_Prefixed # Lo ZANABAZAR SQUARE CLUSTER-INITIAL LETTER RA +11A84..11A89 ; 
Consonant_Prefixed # Lo [6] SOYOMBO SIGN JIHVAMULIYA..SOYOMBO CLUSTER-INITIAL LETTER SA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Preceding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when preceding the main +# consonant. + +# [Not derivable] + +0D4E ; Consonant_Preceding_Repha # Lo MALAYALAM LETTER DOT REPH +11941 ; Consonant_Preceding_Repha # Lo DIVES AKURU INITIAL RA +11D46 ; Consonant_Preceding_Repha # Lo MASARAM GONDI REPHA +11F02 ; Consonant_Preceding_Repha # Lo KAWI SIGN REPHA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Initial_Postfixed + +# Consonants that succeed the main consonant in character sequences, but are +# pronounced before it. + +# [Not derivable] + +1A5A ; Consonant_Initial_Postfixed # Mn TAI THAM CONSONANT SIGN LOW PA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Succeeding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when succeeding the main +# consonant. + +# [Not derivable] + +17CC ; Consonant_Succeeding_Repha # Mn KHMER SIGN ROBAT + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Subjoined + +# Subjoined Consonant (C2 form subtending a base consonant in Tibetan, etc.) 
+ +# [Not derivable] + +0F8D..0F97 ; Consonant_Subjoined # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Consonant_Subjoined # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +1929..192B ; Consonant_Subjoined # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1A57 ; Consonant_Subjoined # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A5B..1A5E ; Consonant_Subjoined # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1BA1 ; Consonant_Subjoined # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA2..1BA3 ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BAC..1BAD ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C24..1C25 ; Consonant_Subjoined # Mc [2] LEPCHA SUBJOINED LETTER YA..LEPCHA SUBJOINED LETTER RA +A867..A868 ; Consonant_Subjoined # Lo [2] PHAGS-PA SUBJOINED LETTER WA..PHAGS-PA SUBJOINED LETTER YA +A871 ; Consonant_Subjoined # Lo PHAGS-PA SUBJOINED LETTER RA +11C92..11CA7 ; Consonant_Subjoined # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CA9 ; Consonant_Subjoined # Mc MARCHEN SUBJOINED LETTER YA +11CAA..11CAF ; Consonant_Subjoined # Mn [6] MARCHEN SUBJOINED LETTER RA..MARCHEN SUBJOINED LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Medial + +# Medial Consonant (medial liquid, occurring in clusters) + +# [Not derivable] + +0A75 ; Consonant_Medial # Mn GURMUKHI SIGN YAKASH +0EBC ; Consonant_Medial # Mn LAO SEMIVOWEL SIGN LO +0EBD ; Consonant_Medial # Lo LAO SEMIVOWEL SIGN NYO +103B..103C ; Consonant_Medial # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA +103D..103E ; Consonant_Medial # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +105E..1060 ; Consonant_Medial # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT 
SIGN MON MEDIAL LA +1082 ; Consonant_Medial # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +1A55 ; Consonant_Medial # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A56 ; Consonant_Medial # Mn TAI THAM CONSONANT SIGN MEDIAL LA +A8B4 ; Consonant_Medial # Mc SAURASHTRA CONSONANT SIGN HAARU +A9BD ; Consonant_Medial # Mn JAVANESE CONSONANT SIGN KERET +A9BE..A9BF ; Consonant_Medial # Mc [2] JAVANESE CONSONANT SIGN PENGKAL..JAVANESE CONSONANT SIGN CAKRA +AA33..AA34 ; Consonant_Medial # Mc [2] CHAM CONSONANT SIGN YA..CHAM CONSONANT SIGN RA +AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +1171D..1171F ; Consonant_Medial # Mn [3] AHOM CONSONANT SIGN MEDIAL LA..AHOM CONSONANT SIGN MEDIAL LIGATING RA +11940 ; Consonant_Medial # Mc DIVES AKURU MEDIAL YA +11942 ; Consonant_Medial # Mc DIVES AKURU MEDIAL RA +11A3B..11A3E ; Consonant_Medial # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11D47 ; Consonant_Medial # Mn MASARAM GONDI RA-KARA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Final + +# Final Consonant (special final forms which do not take vowels) + +# [Not derivable] + +1930..1931 ; Consonant_Final # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Consonant_Final # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +1939 ; Consonant_Final # Mn LIMBU SIGN MUKPHRENG +19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B +1A58..1A59 ; Consonant_Final # Mn [2] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN FINAL NGA +1B03 ; Consonant_Final # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Final # Mn SUNDANESE SIGN PANGLAYAR +1BBE..1BBF ; Consonant_Final # Lo [2] SUNDANESE LETTER FINAL K..SUNDANESE LETTER FINAL M +1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H +1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +A94F..A951 ; 
Consonant_Final # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A952 ; Consonant_Final # Mc REJANG CONSONANT SIGN H +A982 ; Consonant_Final # Mn JAVANESE SIGN LAYAR +AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG +AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG +AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS +AA4C ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL M +AA4D ; Consonant_Final # Mc CHAM CONSONANT SIGN FINAL H +ABDB..ABE2 ; Consonant_Final # Lo [8] MEETEI MAYEK LETTER KOK LONSUM..MEETEI MAYEK LETTER I LONSUM +11A8A..11A95 ; Consonant_Final # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Head_Letter + +# Head Letter (Tibetan) + +# [Not derivable] + +0F88..0F8C ; Consonant_Head_Letter # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN + +# ================================================ + +# Indic_Syllabic_Category=Modifying_Letter + +# Reanalyzed letters not participating in the abugida structure, but +# serving to modify the sound of an adjacent vowel or consonant. +# Note that this is not the same as General_Category=Modifier_Letter. 
+ +# [Not derivable] + +0B83 ; Modifying_Letter # Lo TAMIL SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Tone_Letter + +# Tone Letter (spacing lexical tone mark with status as a letter) + +# [Not derivable] + +1970..1974 ; Tone_Letter # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6 +AAC0 ; Tone_Letter # Lo TAI VIET TONE MAI NUENG +AAC2 ; Tone_Letter # Lo TAI VIET TONE MAI SONG + +# ================================================ + +# Indic_Syllabic_Category=Tone_Mark + +# Tone Mark (nonspacing or spacing lexical tone mark) + +# [Not derivable] + +0E48..0E4B ; Tone_Mark # Mn [4] THAI CHARACTER MAI EK..THAI CHARACTER MAI CHATTAWA +0EC8..0ECB ; Tone_Mark # Mn [4] LAO TONE MAI EK..LAO TONE MAI CATAWA +1037 ; Tone_Mark # Mn MYANMAR SIGN DOT BELOW +1063..1064 ; Tone_Mark # Mc [2] MYANMAR TONE MARK SGAW KAREN HATHI..MYANMAR TONE MARK SGAW KAREN KE PHO +1069..106D ; Tone_Mark # Mc [5] MYANMAR SIGN WESTERN PWO KAREN TONE-1..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1087..108C ; Tone_Mark # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108D ; Tone_Mark # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +108F ; Tone_Mark # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109B ; Tone_Mark # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 +19C8..19C9 ; Tone_Mark # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A75..1A79 ; Tone_Mark # Mn [5] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN TONE-5 +A92B..A92D ; Tone_Mark # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +AA7B ; Tone_Mark # Mc MYANMAR SIGN PAO KAREN TONE +AA7C ; Tone_Mark # Mn MYANMAR SIGN TAI LAING TONE-2 +AA7D ; Tone_Mark # Mc MYANMAR SIGN TAI LAING TONE-5 +AABF ; Tone_Mark # Mn TAI VIET TONE MAI EK +AAC1 ; Tone_Mark # Mn TAI VIET TONE MAI THO +ABEC ; Tone_Mark # Mc MEETEI MAYEK LUM IYEK + +# ================================================ + +# Indic_Syllabic_Category=Gemination_Mark + +# Gemination Mark (doubling of the 
preceding or following consonant) +# +# U+0A71 GURMUKHI ADDAK precedes the consonant it geminates, while the +# others follow the consonant they geminate. + +# [Not derivable] + +0A71 ; Gemination_Mark # Mn GURMUKHI ADDAK +0AFB ; Gemination_Mark # Mn GUJARATI SIGN SHADDA +11237 ; Gemination_Mark # Mn KHOJKI SIGN SHADDA +11A98 ; Gemination_Mark # Mn SOYOMBO GEMINATION MARK + +# ================================================ + +# Indic_Syllabic_Category=Cantillation_Mark + +# Cantillation Mark (recitation marks, such as svara markers for the Samaveda) + +# [Not derivable] + +0951..0952 ; Cantillation_Mark # Mn [2] DEVANAGARI STRESS SIGN UDATTA..DEVANAGARI STRESS SIGN ANUDATTA +0A51 ; Cantillation_Mark # Mn GURMUKHI SIGN UDAAT +0AFA ; Cantillation_Mark # Mn GUJARATI SIGN SUKUN +0AFC ; Cantillation_Mark # Mn GUJARATI SIGN MADDAH +1CD0..1CD2 ; Cantillation_Mark # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CD4..1CE0 ; Cantillation_Mark # Mn [13] VEDIC SIGN YAJURVEDIC MIDLINE SVARITA..VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CE1 ; Cantillation_Mark # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF4 ; Cantillation_Mark # Mn VEDIC TONE CANDRA ABOVE +1CF7 ; Cantillation_Mark # Mc VEDIC SIGN ATIKRAMA +1CF8..1CF9 ; Cantillation_Mark # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE +20F0 ; Cantillation_Mark # Mn COMBINING ASTERISK ABOVE +A8E0..A8F1 ; Cantillation_Mark # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +1123E ; Cantillation_Mark # Mn KHOJKI SIGN SUKUN +11366..1136C ; Cantillation_Mark # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Cantillation_Mark # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA + +# ================================================ + +# Indic_Syllabic_Category=Register_Shifter + +# Register Shifter (shifts register for consonants, akin to a tone mark) + +# [Not derivable] + +17C9..17CA ; Register_Shifter # Mn [2] KHMER SIGN 
MUUSIKATOAN..KHMER SIGN TRIISAP + +# ================================================ + +# Indic_Syllabic_Category=Syllable_Modifier + +# Syllable Modifier (miscellaneous combining characters that modify +# something in the orthographic syllable they succeed or appear in) + +# [Not derivable] + +00B2..00B3 ; Syllable_Modifier # No [2] SUPERSCRIPT TWO..SUPERSCRIPT THREE +09FE ; Syllable_Modifier # Mn BENGALI SANDHI MARK +0ECE ; Syllable_Modifier # Mn LAO YAMAKKAN +0F35 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0FC6 ; Syllable_Modifier # Mn TIBETAN SYMBOL PADMA GDAN +17CB ; Syllable_Modifier # Mn KHMER SIGN BANTOC +17CE..17D0 ; Syllable_Modifier # Mn [3] KHMER SIGN KAKABAT..KHMER SIGN SAMYOK SANNYA +17D3 ; Syllable_Modifier # Mn KHMER SIGN BATHAMASAT +17DD ; Syllable_Modifier # Mn KHMER SIGN ATTHACAN +193B ; Syllable_Modifier # Mn LIMBU SIGN SA-I +1A7B..1A7C ; Syllable_Modifier # Mn [2] TAI THAM SIGN MAI SAM..TAI THAM SIGN KHUEN-LUE KARAN +1A7F ; Syllable_Modifier # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1C36 ; Syllable_Modifier # Mn LEPCHA SIGN RAN +1DFB ; Syllable_Modifier # Mn COMBINING DELETION MARK +2074 ; Syllable_Modifier # No SUPERSCRIPT FOUR +2082..2084 ; Syllable_Modifier # No [3] SUBSCRIPT TWO..SUBSCRIPT FOUR +111C9 ; Syllable_Modifier # Mn SHARADA SANDHI MARK +1145E ; Syllable_Modifier # Mn NEWA SANDHI MARK +11A33 ; Syllable_Modifier # Mn ZANABAZAR SQUARE FINAL CONSONANT MARK + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Killer + +# Consonant Killer (signifies that the previous consonant or consonants are +# not pronounced) + +# [Not derivable] + +0E4C ; Consonant_Killer # Mn THAI CHARACTER THANTHAKHAT +17CD ; Consonant_Killer # Mn KHMER SIGN TOANDAKHIAT + +# ================================================ + +# Indic_Syllabic_Category=Non_Joiner + +# Non_Joiner (Zero Width Non-Joiner) + +# [Not derivable] + +200C ; Non_Joiner 
# Cf ZERO WIDTH NON-JOINER + +# ================================================ + +# Indic_Syllabic_Category=Joiner + +# Joiner (Zero Width Joiner) + +# [Not derivable] + +200D ; Joiner # Cf ZERO WIDTH JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number_Joiner + +# Number_Joiner (forms ligatures between numbers for multiplication) + +# [Not derivable] + +1107F ; Number_Joiner # Mn BRAHMI NUMBER JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number + +# Number (can be used as vowel-holders like consonant placeholders) +# Note: A number may even hold subjoined consonants which may in turn +# have been formed using a virama or a stacker, e.g. the sequence +# where THAI THAM LETTER LOW TA is subjoined to +# TAI THAM THAM DIGIT THREE using an invisible stacker. + +# [Not derivable] + +0030..0039 ; Number # Nd [10] DIGIT ZERO..DIGIT NINE +0966..096F ; Number # Nd [10] DEVANAGARI DIGIT ZERO..DEVANAGARI DIGIT NINE +09E6..09EF ; Number # Nd [10] BENGALI DIGIT ZERO..BENGALI DIGIT NINE +0A66..0A6F ; Number # Nd [10] GURMUKHI DIGIT ZERO..GURMUKHI DIGIT NINE +0AE6..0AEF ; Number # Nd [10] GUJARATI DIGIT ZERO..GUJARATI DIGIT NINE +0B66..0B6F ; Number # Nd [10] ORIYA DIGIT ZERO..ORIYA DIGIT NINE +0BE6..0BEF ; Number # Nd [10] TAMIL DIGIT ZERO..TAMIL DIGIT NINE +0C66..0C6F ; Number # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE +0CE6..0CEF ; Number # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE +0D66..0D6F ; Number # Nd [10] MALAYALAM DIGIT ZERO..MALAYALAM DIGIT NINE +0DE6..0DEF ; Number # Nd [10] SINHALA LITH DIGIT ZERO..SINHALA LITH DIGIT NINE +0E50..0E59 ; Number # Nd [10] THAI DIGIT ZERO..THAI DIGIT NINE +0ED0..0ED9 ; Number # Nd [10] LAO DIGIT ZERO..LAO DIGIT NINE +0F20..0F29 ; Number # Nd [10] TIBETAN DIGIT ZERO..TIBETAN DIGIT NINE +0F2A..0F33 ; Number # No [10] TIBETAN DIGIT HALF ONE..TIBETAN DIGIT HALF ZERO +1040..1049 ; Number # Nd [10] MYANMAR DIGIT ZERO..MYANMAR DIGIT NINE 
+1090..1099 ; Number # Nd [10] MYANMAR SHAN DIGIT ZERO..MYANMAR SHAN DIGIT NINE +17E0..17E9 ; Number # Nd [10] KHMER DIGIT ZERO..KHMER DIGIT NINE +1946..194F ; Number # Nd [10] LIMBU DIGIT ZERO..LIMBU DIGIT NINE +19D0..19D9 ; Number # Nd [10] NEW TAI LUE DIGIT ZERO..NEW TAI LUE DIGIT NINE +19DA ; Number # No NEW TAI LUE THAM DIGIT ONE +1A80..1A89 ; Number # Nd [10] TAI THAM HORA DIGIT ZERO..TAI THAM HORA DIGIT NINE +1A90..1A99 ; Number # Nd [10] TAI THAM THAM DIGIT ZERO..TAI THAM THAM DIGIT NINE +1B50..1B59 ; Number # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE +1BB0..1BB9 ; Number # Nd [10] SUNDANESE DIGIT ZERO..SUNDANESE DIGIT NINE +1C40..1C49 ; Number # Nd [10] LEPCHA DIGIT ZERO..LEPCHA DIGIT NINE +A8D0..A8D9 ; Number # Nd [10] SAURASHTRA DIGIT ZERO..SAURASHTRA DIGIT NINE +A900..A909 ; Number # Nd [10] KAYAH LI DIGIT ZERO..KAYAH LI DIGIT NINE +A9D0..A9D9 ; Number # Nd [10] JAVANESE DIGIT ZERO..JAVANESE DIGIT NINE +A9F0..A9F9 ; Number # Nd [10] MYANMAR TAI LAING DIGIT ZERO..MYANMAR TAI LAING DIGIT NINE +AA50..AA59 ; Number # Nd [10] CHAM DIGIT ZERO..CHAM DIGIT NINE +ABF0..ABF9 ; Number # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE +10A40..10A48 ; Number # No [9] KHAROSHTHI DIGIT ONE..KHAROSHTHI FRACTION ONE HALF +11066..1106F ; Number # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11136..1113F ; Number # Nd [10] CHAKMA DIGIT ZERO..CHAKMA DIGIT NINE +111D0..111D9 ; Number # Nd [10] SHARADA DIGIT ZERO..SHARADA DIGIT NINE +111E1..111F4 ; Number # No [20] SINHALA ARCHAIC DIGIT ONE..SINHALA ARCHAIC NUMBER ONE THOUSAND +112F0..112F9 ; Number # Nd [10] KHUDAWADI DIGIT ZERO..KHUDAWADI DIGIT NINE +11450..11459 ; Number # Nd [10] NEWA DIGIT ZERO..NEWA DIGIT NINE +114D0..114D9 ; Number # Nd [10] TIRHUTA DIGIT ZERO..TIRHUTA DIGIT NINE +11650..11659 ; Number # Nd [10] MODI DIGIT ZERO..MODI DIGIT NINE +116C0..116C9 ; Number # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE +11730..11739 ; Number # Nd [10] AHOM DIGIT ZERO..AHOM DIGIT NINE +1173A..1173B ; Number # 
No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY +11950..11959 ; Number # Nd [10] DIVES AKURU DIGIT ZERO..DIVES AKURU DIGIT NINE +11C50..11C59 ; Number # Nd [10] BHAIKSUKI DIGIT ZERO..BHAIKSUKI DIGIT NINE +11C5A..11C6C ; Number # No [19] BHAIKSUKI NUMBER ONE..BHAIKSUKI HUNDREDS UNIT MARK +11D50..11D59 ; Number # Nd [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE +11DA0..11DA9 ; Number # Nd [10] GUNJALA GONDI DIGIT ZERO..GUNJALA GONDI DIGIT NINE +11F50..11F59 ; Number # Nd [10] KAWI DIGIT ZERO..KAWI DIGIT NINE + +# ================================================ + +# Indic_Syllabic_Category=Brahmi_Joining_Number + +# Brahmi Joining Number (may be joined by a Number_Joiner of the same +# script, e.g. in Brahmi) +# +# Note: These are different from Numbers, in the way that there is no known +# evidence of Brahmi Joining Numbers taking vowels or subjoined consonants. +# Until such evidence is found, implementations may assume that Brahmi +# Joining Numbers only participate in shaping with other Brahmi Joining +# Numbers. + +# [Not derivable] + +11052..11065 ; Brahmi_Joining_Number # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND + +# EOF diff --git a/data/16.0.0-indic-positional-category.txt b/data/16.0.0-indic-positional-category.txt new file mode 100644 index 0000000..7379b43 --- /dev/null +++ b/data/16.0.0-indic-positional-category.txt @@ -0,0 +1,836 @@ +# IndicPositionalCategory-16.0.0.txt +# Date: 2024-04-30, 21:48:21 GMT +# © 2024 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use and license, see https://www.unicode.org/terms_of_use.html +# +# Unicode Character Database +# For documentation, see https://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Positional_Category enumerated property +# +# Scope: This property is aimed at the problem of +# the specification of syllabic structure for Indic scripts. 
+# Because dependent vowels (matras), visible viramas, and other +# characters are placed in notional slots around the consonant (or +# consonant cluster) core of an Indic syllable, there may be +# cooccurrence constraints or other interactions. Also, it may be +# desirable, in cases where more than one such character may occur in +# sequence, as for example, in a top slot and a bottom slot, to +# specify preferred orders for spelling. As such, this property +# is designed primarily to supplement the Indic_Syllabic_Category +# property. +# +# In addition to combining marks associated with Indic scripts, the +# Indic_Positional_Category has non-trivial values for special signs +# associated with Indic_Syllabic_Category=Consonant_Prefixed +# or Indic_Syllabic_Category=Consonant_Preceding_Repha. Those signs +# have General_Category=Lo, rather than being combining marks. +# They occur in initial position in syllabic structure. However, when +# rendered, they appear as marks positioned with respect to another +# base letter (usually above it). Hence, having an explicit value for +# Indic_Positional_Category for those signs can be helpful. +# +# Note that this property is *not* intended as +# a prescriptive property regarding display or font design, +# for a number of reasons. Good font design requires information +# that is outside the context of a character encoding standard, +# and is best handled in other venues. For Indic dependent +# vowels and similar characters, in particular: +# +# 1. Matra placement may vary somewhat based on typeface design. +# 2. Matra placement, even within a single script, may vary +# somewhat according to historic period or local conventions. +# 3. Matra placement may be changed by explicit orthographic reform +# decisions. +# 4. Matras may ligate in various ways with a consonant (or even +# other elements of a syllable) instead of occurring in a +# discrete location. +# 5. Matra display may be contextually determined. 
This is +# notable, for example, in the Tamil script, where the shape +# and placement of -u and -uu vowels depends strongly on +# which consonant they adjoin. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Positional_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. +# +# The scripts assessed as containing dependent vowels or similar characters +# in the structural sense used for the Indic_Positional_Category are the +# following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dives Akuru, Dogra, Grantha, Gujarati, +# Gunjala Gondi, Gurmukhi, Gurung Khema, Hanunoo, Javanese, Kaithi, +# Kannada, Kawi, Kayah Li, Kharoshthi, Khmer, Khojki, Khudawadi, +# Kirat Rai, Lao, Lepcha, Limbu, Makasar, Malayalam, Marchen, +# Masaram Gondi, Meetei Mayek, Modi, Myanmar, Nandinagari, Newa, +# New Tai Lue, Oriya, Rejang, Saurashtra, Sharada, Siddham, Sinhala, +# Soyombo, Sundanese, Syloti Nagri, Tagalog, Tagbanwa, Tai Tham, +# Tai Viet, Takri, Tamil, Telugu, Thai, Tibetan, Tirhuta, +# Tulu-Tigalari, and Zanabazar Square. +# +# All characters for all other scripts not in that list +# take the default value for this property. +# +# See IndicSyllabicCategory.txt for a slightly more extended +# list of Indic scripts, including those which do not have +# positional characters. Currently, those additional +# Indic scripts without positional characters are +# Multani, Phags-pa, and Tai Le. +# +# Notes: +# +# 1. The following characters are all assigned the positional category Right, +# but may have different positions in some cases: +# * U+0BC1 TAMIL VOWEL SIGN U and U+0BC2 TAMIL VOWEL SIGN UU have +# contextually variable placement in Tamil. 
+# * U+11341 GRANTHA VOWEL SIGN U and U+11342 GRANTHA VOWEL SIGN UU have +# contextually variable placement in Grantha. +# * U+11440 NEWA VOWEL SIGN O and U+11441 NEWA VOWEL SIGN AU have contextually +# variable placement in Newa. +# +# 2. The following characters are all assigned the positional category Top, +# but may have different positions in some cases: +# * U+1143E NEWA VOWEL SIGN E and U+1143F NEWA VOWEL SIGN AI have contextually +# variable placement in Newa. +# +# 3. The following characters are all assigned the positional category Bottom, +# but may have different positions in some cases: +# * U+0D41 MALAYALAM VOWEL SIGN U and U+0D42 MALAYALAM VOWEL SIGN UU form +# complex ligatures with consonants in older Malayalam orthography, and +# are spacing marks to the right of the base in reformed Malayalam +# orthography. +# * U+102F MYANMAR VOWEL SIGN U and U+1030 MYANMAR VOWEL SIGN UU have +# contextually variable placement in Myanmar. +# * U+1A69 TAI THAM VOWEL SIGN U and U+1A6A TAI THAM VOWEL SIGN UU have +# contextually variable placement in Tai Tham. +# * U+113BB TULU-TIGALARI VOWEL SIGN U and +# U+113BC TULU-TIGALARI VOWEL SIGN UU form complex ligatures with +# consonants. +# +# 4. The following character is assigned the positional category Left, but +# may have different positions in different styles: +# * U+119D2 NANDINAGARI VOWEL SIGN I has stylistically variable placement +# in Nandinagari. + + +# ================================================ + +# Property: Indic_Positional_Category +# +# All code points not explicitly listed for Indic_Positional_Category +# have the value NA (not applicable). 
+# +# @missing: 0000..10FFFF; NA + +# ------------------------------------------------ + +# Indic_Positional_Category=Right + +0903 ; Right # Mc DEVANAGARI SIGN VISARGA +093B ; Right # Mc DEVANAGARI VOWEL SIGN OOE +093E ; Right # Mc DEVANAGARI VOWEL SIGN AA +0940 ; Right # Mc DEVANAGARI VOWEL SIGN II +0949..094C ; Right # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094F ; Right # Mc DEVANAGARI VOWEL SIGN AW +0982..0983 ; Right # Mc [2] BENGALI SIGN ANUSVARA..BENGALI SIGN VISARGA +09BE ; Right # Mc BENGALI VOWEL SIGN AA +09C0 ; Right # Mc BENGALI VOWEL SIGN II +09D7 ; Right # Mc BENGALI AU LENGTH MARK +0A03 ; Right # Mc GURMUKHI SIGN VISARGA +0A3E ; Right # Mc GURMUKHI VOWEL SIGN AA +0A40 ; Right # Mc GURMUKHI VOWEL SIGN II +0A83 ; Right # Mc GUJARATI SIGN VISARGA +0ABE ; Right # Mc GUJARATI VOWEL SIGN AA +0AC0 ; Right # Mc GUJARATI VOWEL SIGN II +0ACB..0ACC ; Right # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0B02..0B03 ; Right # Mc [2] ORIYA SIGN ANUSVARA..ORIYA SIGN VISARGA +0B3E ; Right # Mc ORIYA VOWEL SIGN AA +0B40 ; Right # Mc ORIYA VOWEL SIGN II +0BBE..0BBF ; Right # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC1..0BC2 ; Right # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BD7 ; Right # Mc TAMIL AU LENGTH MARK +0C01..0C03 ; Right # Mc [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN VISARGA +0C41..0C44 ; Right # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C82..0C83 ; Right # Mc [2] KANNADA SIGN ANUSVARA..KANNADA SIGN VISARGA +0CBE ; Right # Mc KANNADA VOWEL SIGN AA +0CC1..0CC4 ; Right # Mc [4] KANNADA VOWEL SIGN U..KANNADA VOWEL SIGN VOCALIC RR +0CD5..0CD6 ; Right # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CF3 ; Right # Mc KANNADA SIGN COMBINING ANUSVARA ABOVE RIGHT +0D02..0D03 ; Right # Mc [2] MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA +0D3E..0D40 ; Right # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D57 ; Right # Mc MALAYALAM AU LENGTH MARK +0D82..0D83 ; Right # Mc [2] SINHALA 
SIGN ANUSVARAYA..SINHALA SIGN VISARGAYA +0DCF..0DD1 ; Right # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD8 ; Right # Mc SINHALA VOWEL SIGN GAETTA-PILLA +0DDF ; Right # Mc SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Right # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Right # Lo THAI CHARACTER SARA A +0E32..0E33 ; Right # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E45 ; Right # Lo THAI CHARACTER LAKKHANGYAO +0EB0 ; Right # Lo LAO VOWEL SIGN A +0EB2..0EB3 ; Right # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0F3E ; Right # Mc TIBETAN SIGN YAR TSHES +0F7F ; Right # Mc TIBETAN SIGN RNAM BCAD +102B..102C ; Right # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +1038 ; Right # Mc MYANMAR SIGN VISARGA +103B ; Right # Mc MYANMAR CONSONANT SIGN MEDIAL YA +1056..1057 ; Right # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1062..1064 ; Right # Mc [3] MYANMAR VOWEL SIGN SGAW KAREN EU..MYANMAR TONE MARK SGAW KAREN KE PHO +1067..106D ; Right # Mc [7] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1083 ; Right # Mc MYANMAR VOWEL SIGN SHAN AA +1087..108C ; Right # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108F ; Right # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109C ; Right # Mc [3] MYANMAR SIGN KHAMTI TONE-1..MYANMAR VOWEL SIGN AITON A +1715 ; Right # Mc TAGALOG SIGN PAMUDPOD +1734 ; Right # Mc HANUNOO SIGN PAMUDPOD +17B6 ; Right # Mc KHMER VOWEL SIGN AA +17C7..17C8 ; Right # Mc [2] KHMER SIGN REAHMUK..KHMER SIGN YUUKALEAPINTU +1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI +1929..192B ; Right # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1930..1931 ; Right # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Right # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +19B0..19B4 ; Right # Lo [5] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI 
LUE VOWEL SIGN UU +19B8..19B9 ; Right # Lo [2] NEW TAI LUE VOWEL SIGN OA..NEW TAI LUE VOWEL SIGN UE +19BB..19C0 ; Right # Lo [6] NEW TAI LUE VOWEL SIGN AAY..NEW TAI LUE VOWEL SIGN IY +19C8..19C9 ; Right # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A1A ; Right # Mc BUGINESE VOWEL SIGN O +1A57 ; Right # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A61 ; Right # Mc TAI THAM VOWEL SIGN A +1A63..1A64 ; Right # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A6D ; Right # Mc TAI THAM VOWEL SIGN OY +1B04 ; Right # Mc BALINESE SIGN BISAH +1B35 ; Right # Mc BALINESE VOWEL SIGN TEDUNG +1B44 ; Right # Mc BALINESE ADEG ADEG +1B82 ; Right # Mc SUNDANESE SIGN PANGWISAD +1BA1 ; Right # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA7 ; Right # Mc SUNDANESE VOWEL SIGN PANOLONG +1BAA ; Right # Mc SUNDANESE SIGN PAMAAEH +1BE7 ; Right # Mc BATAK VOWEL SIGN E +1BEA..1BEC ; Right # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BEE ; Right # Mc BATAK VOWEL SIGN U +1BF2..1BF3 ; Right # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +1C24..1C26 ; Right # Mc [3] LEPCHA SUBJOINED LETTER YA..LEPCHA VOWEL SIGN AA +1C2A..1C2B ; Right # Mc [2] LEPCHA VOWEL SIGN U..LEPCHA VOWEL SIGN UU +1CE1 ; Right # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF7 ; Right # Mc VEDIC SIGN ATIKRAMA +A823..A824 ; Right # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A827 ; Right # Mc SYLOTI NAGRI VOWEL SIGN OO +A880..A881 ; Right # Mc [2] SAURASHTRA SIGN ANUSVARA..SAURASHTRA SIGN VISARGA +A8B4..A8C3 ; Right # Mc [16] SAURASHTRA CONSONANT SIGN HAARU..SAURASHTRA VOWEL SIGN AU +A952..A953 ; Right # Mc [2] REJANG CONSONANT SIGN H..REJANG VIRAMA +A983 ; Right # Mc JAVANESE SIGN WIGNYAN +A9B4..A9B5 ; Right # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +AA33 ; Right # Mc CHAM CONSONANT SIGN YA +AA4D ; Right # Mc CHAM CONSONANT SIGN FINAL H +AA7B ; Right # Mc MYANMAR SIGN PAO KAREN TONE +AA7D ; Right # Mc MYANMAR SIGN TAI LAING TONE-5 +AAB1 ; Right # Lo TAI VIET VOWEL AA 
+AABA ; Right # Lo TAI VIET VOWEL UA +AABD ; Right # Lo TAI VIET VOWEL AN +AAEF ; Right # Mc MEETEI MAYEK VOWEL SIGN AAU +AAF5 ; Right # Mc MEETEI MAYEK VOWEL SIGN VISARGA +ABE3..ABE4 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE6..ABE7 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE9..ABEA ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +ABEC ; Right # Mc MEETEI MAYEK LUM IYEK +11000 ; Right # Mc BRAHMI SIGN CANDRABINDU +11002 ; Right # Mc BRAHMI SIGN VISARGA +11082 ; Right # Mc KAITHI SIGN VISARGA +110B0 ; Right # Mc KAITHI VOWEL SIGN AA +110B2 ; Right # Mc KAITHI VOWEL SIGN II +110B7..110B8 ; Right # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11145..11146 ; Right # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +11182 ; Right # Mc SHARADA SIGN VISARGA +111B3 ; Right # Mc SHARADA VOWEL SIGN AA +111B5 ; Right # Mc SHARADA VOWEL SIGN II +111C0 ; Right # Mc SHARADA SIGN VIRAMA +1122C..1122E ; Right # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +11235 ; Right # Mc KHOJKI SIGN VIRAMA +112E0 ; Right # Mc KHUDAWADI VOWEL SIGN AA +112E2 ; Right # Mc KHUDAWADI VOWEL SIGN II +11302..11303 ; Right # Mc [2] GRANTHA SIGN ANUSVARA..GRANTHA SIGN VISARGA +1133E..1133F ; Right # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11341..11344 ; Right # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +1134D ; Right # Mc GRANTHA SIGN VIRAMA +11357 ; Right # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Right # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +113B8 ; Right # Mc TULU-TIGALARI VOWEL SIGN AA +113C9..113CA ; Right # Mc [2] TULU-TIGALARI AU LENGTH MARK..TULU-TIGALARI SIGN CANDRA ANUNASIKA +113CC..113CD ; Right # Mc [2] TULU-TIGALARI SIGN ANUSVARA..TULU-TIGALARI SIGN VISARGA +113CF ; Right # Mc TULU-TIGALARI SIGN LOOPED VIRAMA +11435 ; Right # Mc NEWA VOWEL SIGN AA +11437 ; Right # Mc NEWA VOWEL SIGN II +11440..11441 ; Right # Mc 
[2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +11445 ; Right # Mc NEWA SIGN VISARGA +114B0 ; Right # Mc TIRHUTA VOWEL SIGN AA +114B2 ; Right # Mc TIRHUTA VOWEL SIGN II +114BD ; Right # Mc TIRHUTA VOWEL SIGN SHORT O +114C1 ; Right # Mc TIRHUTA SIGN VISARGA +115AF ; Right # Mc SIDDHAM VOWEL SIGN AA +115B1 ; Right # Mc SIDDHAM VOWEL SIGN II +115BE ; Right # Mc SIDDHAM SIGN VISARGA +11630..11632 ; Right # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +1163B..1163C ; Right # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +1163E ; Right # Mc MODI SIGN VISARGA +116AC ; Right # Mc TAKRI SIGN VISARGA +116AF ; Right # Mc TAKRI VOWEL SIGN II +116B6 ; Right # Mc TAKRI SIGN VIRAMA +11720..11721 ; Right # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +1182C ; Right # Mc DOGRA VOWEL SIGN AA +1182E ; Right # Mc DOGRA VOWEL SIGN II +11838 ; Right # Mc DOGRA SIGN VISARGA +11930..11934 ; Right # Mc [5] DIVES AKURU VOWEL SIGN AA..DIVES AKURU VOWEL SIGN UU +1193D ; Right # Mc DIVES AKURU SIGN HALANTA +11940 ; Right # Mc DIVES AKURU MEDIAL YA +119D1 ; Right # Mc NANDINAGARI VOWEL SIGN AA +119D3 ; Right # Mc NANDINAGARI VOWEL SIGN II +119DC..119DF ; Right # Mc [4] NANDINAGARI VOWEL SIGN O..NANDINAGARI SIGN VISARGA +11A39 ; Right # Mc ZANABAZAR SQUARE SIGN VISARGA +11A57..11A58 ; Right # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A97 ; Right # Mc SOYOMBO SIGN VISARGA +11C2F ; Right # Mc BHAIKSUKI VOWEL SIGN AA +11C3E ; Right # Mc BHAIKSUKI SIGN VISARGA +11CA9 ; Right # Mc MARCHEN SUBJOINED LETTER YA +11CB4 ; Right # Mc MARCHEN VOWEL SIGN O +11D46 ; Right # Lo MASARAM GONDI REPHA +11D8A..11D8E ; Right # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D93..11D94 ; Right # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11D96 ; Right # Mc GUNJALA GONDI SIGN VISARGA +11EF6 ; Right # Mc MAKASAR VOWEL SIGN O +11F03 ; Right # Mc KAWI SIGN VISARGA +11F34..11F35 ; Right # Mc [2] KAWI VOWEL SIGN AA..KAWI VOWEL SIGN ALTERNATE AA +11F41 ; Right # Mc KAWI SIGN 
KILLER +1612C ; Right # Mc GURUNG KHEMA CONSONANT SIGN MEDIAL HA +16D40..16D42 ; Right # Lm [3] KIRAT RAI SIGN ANUSVARA..KIRAT RAI SIGN VISARGA +16D63..16D6A ; Right # Lo [8] KIRAT RAI VOWEL SIGN AA..KIRAT RAI VOWEL SIGN AU +16D6B..16D6C ; Right # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT + +# Indic_Positional_Category=Left + +093F ; Left # Mc DEVANAGARI VOWEL SIGN I +094E ; Left # Mc DEVANAGARI VOWEL SIGN PRISHTHAMATRA E +09BF ; Left # Mc BENGALI VOWEL SIGN I +09C7..09C8 ; Left # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +0A3F ; Left # Mc GURMUKHI VOWEL SIGN I +0ABF ; Left # Mc GUJARATI VOWEL SIGN I +0B47 ; Left # Mc ORIYA VOWEL SIGN E +0BC6..0BC8 ; Left # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0D46..0D48 ; Left # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0DD9 ; Left # Mc SINHALA VOWEL SIGN KOMBUVA +0DDB ; Left # Mc SINHALA VOWEL SIGN KOMBU DEKA +0F3F ; Left # Mc TIBETAN SIGN MAR TSHES +1031 ; Left # Mc MYANMAR VOWEL SIGN E +1084 ; Left # Mc MYANMAR VOWEL SIGN SHAN E +17C1..17C3 ; Left # Mc [3] KHMER VOWEL SIGN E..KHMER VOWEL SIGN AI +1A19 ; Left # Mc BUGINESE VOWEL SIGN E +1A55 ; Left # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A6E..1A72 ; Left # Mc [5] TAI THAM VOWEL SIGN E..TAI THAM VOWEL SIGN THAM AI +1B3E..1B3F ; Left # Mc [2] BALINESE VOWEL SIGN TALING..BALINESE VOWEL SIGN TALING REPA +1BA6 ; Left # Mc SUNDANESE VOWEL SIGN PANAELAENG +1C27..1C28 ; Left # Mc [2] LEPCHA VOWEL SIGN I..LEPCHA VOWEL SIGN O +1C34..1C35 ; Left # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A9BA..A9BB ; Left # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +AA2F..AA30 ; Left # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA34 ; Left # Mc CHAM CONSONANT SIGN RA +AAEB ; Left # Mc MEETEI MAYEK VOWEL SIGN II +AAEE ; Left # Mc MEETEI MAYEK VOWEL SIGN AU +110B1 ; Left # Mc KAITHI VOWEL SIGN I +1112C ; Left # Mc CHAKMA VOWEL SIGN E +111B4 ; Left # Mc SHARADA VOWEL SIGN I +111CE ; Left # Mc SHARADA VOWEL SIGN 
PRISHTHAMATRA E +112E1 ; Left # Mc KHUDAWADI VOWEL SIGN I +11347..11348 ; Left # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +113C2 ; Left # Mc TULU-TIGALARI VOWEL SIGN EE +113C5 ; Left # Mc TULU-TIGALARI VOWEL SIGN AI +11436 ; Left # Mc NEWA VOWEL SIGN I +114B1 ; Left # Mc TIRHUTA VOWEL SIGN I +114B9 ; Left # Mc TIRHUTA VOWEL SIGN E +115B0 ; Left # Mc SIDDHAM VOWEL SIGN I +115B8 ; Left # Mc SIDDHAM VOWEL SIGN E +116AE ; Left # Mc TAKRI VOWEL SIGN I +11726 ; Left # Mc AHOM VOWEL SIGN E +1182D ; Left # Mc DOGRA VOWEL SIGN I +11935 ; Left # Mc DIVES AKURU VOWEL SIGN E +11937 ; Left # Mc DIVES AKURU VOWEL SIGN AI +119D2 ; Left # Mc NANDINAGARI VOWEL SIGN I +119E4 ; Left # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E +11CB1 ; Left # Mc MARCHEN VOWEL SIGN I +11EF5 ; Left # Mc MAKASAR VOWEL SIGN E +11F3E..11F3F ; Left # Mc [2] KAWI VOWEL SIGN E..KAWI VOWEL SIGN AI +1612A..1612B ; Left # Mc [2] GURUNG KHEMA CONSONANT SIGN MEDIAL YA..GURUNG KHEMA CONSONANT SIGN MEDIAL VA + +# Indic_Positional_Category=Visual_Order_Left + +# These are dependent vowels that occur to the left of the consonant +# letter in a syllable, but which occur in scripts using the visual order +# model, instead of the logical order model. Because of the different +# model, these left-side vowels occur first in the backing store (before +# the consonant letter) and are not reordered during text rendering. 
+# +# [Derivation: Logical_Order_Exception=Yes] + +0E40..0E44 ; Visual_Order_Left # Lo [5] THAI CHARACTER SARA E..THAI CHARACTER SARA AI MAIMALAI +0EC0..0EC4 ; Visual_Order_Left # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +19B5..19B7 ; Visual_Order_Left # Lo [3] NEW TAI LUE VOWEL SIGN E..NEW TAI LUE VOWEL SIGN O +19BA ; Visual_Order_Left # Lo NEW TAI LUE VOWEL SIGN AY +AAB5..AAB6 ; Visual_Order_Left # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB9 ; Visual_Order_Left # Lo TAI VIET VOWEL UEA +AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL AY + +# Indic_Positional_Category=Left_And_Right + +09CB..09CC ; Left_And_Right # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +0B4B ; Left_And_Right # Mc ORIYA VOWEL SIGN O +0BCA..0BCC ; Left_And_Right # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0D4A..0D4C ; Left_And_Right # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0DDC ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA +0DDE ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA +17C0 ; Left_And_Right # Mc KHMER VOWEL SIGN IE +17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU +1B40..1B41 ; Left_And_Right # Mc [2] BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1134B..1134C ; Left_And_Right # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +113C7..113C8 ; Left_And_Right # Mc [2] TULU-TIGALARI VOWEL SIGN OO..TULU-TIGALARI VOWEL SIGN AU +114BC ; Left_And_Right # Mc TIRHUTA VOWEL SIGN O +114BE ; Left_And_Right # Mc TIRHUTA VOWEL SIGN AU +115BA ; Left_And_Right # Mc SIDDHAM VOWEL SIGN O +11938 ; Left_And_Right # Mc DIVES AKURU VOWEL SIGN O + +# Indic_Positional_Category=Top + +0900..0902 ; Top # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +093A ; Top # Mn DEVANAGARI VOWEL SIGN OE +0945..0948 ; Top # Mn [4] DEVANAGARI VOWEL SIGN CANDRA E..DEVANAGARI VOWEL SIGN AI +0951 ; Top # Mn DEVANAGARI STRESS SIGN UDATTA +0955 ; Top # 
Mn DEVANAGARI VOWEL SIGN CANDRA LONG E +0981 ; Top # Mn BENGALI SIGN CANDRABINDU +09FE ; Top # Mn BENGALI SANDHI MARK +0A01..0A02 ; Top # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A47..0A48 ; Top # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Top # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0A70..0A71 ; Top # Mn [2] GURMUKHI TIPPI..GURMUKHI ADDAK +0A81..0A82 ; Top # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0AC5 ; Top # Mn GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Top # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AFA..0AFF ; Top # Mn [6] GUJARATI SIGN SUKUN..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B01 ; Top # Mn ORIYA SIGN CANDRABINDU +0B3F ; Top # Mn ORIYA VOWEL SIGN I +0B55..0B56 ; Top # Mn [2] ORIYA SIGN OVERLINE..ORIYA AI LENGTH MARK +0B82 ; Top # Mn TAMIL SIGN ANUSVARA +0BC0 ; Top # Mn TAMIL VOWEL SIGN II +0BCD ; Top # Mn TAMIL SIGN VIRAMA +0C00 ; Top # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C04 ; Top # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C3E..0C40 ; Top # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C46..0C47 ; Top # Mn [2] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN EE +0C4A..0C4D ; Top # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA +0C55 ; Top # Mn TELUGU LENGTH MARK +0C81 ; Top # Mn KANNADA SIGN CANDRABINDU +0CBF ; Top # Mn KANNADA VOWEL SIGN I +0CC6 ; Top # Mn KANNADA VOWEL SIGN E +0CCC..0CCD ; Top # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA +0D00..0D01 ; Top # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D3B..0D3C ; Top # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0D4D ; Top # Mn MALAYALAM SIGN VIRAMA +0D4E ; Top # Lo MALAYALAM LETTER DOT REPH +0D81 ; Top # Mn SINHALA SIGN CANDRABINDU +0DCA ; Top # Mn SINHALA SIGN AL-LAKUNA +0DD2..0DD3 ; Top # Mn [2] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN DIGA IS-PILLA +0E31 ; Top # Mn THAI CHARACTER MAI HAN-AKAT +0E34..0E37 ; Top # Mn [4] THAI 
CHARACTER SARA I..THAI CHARACTER SARA UEE +0E47..0E4E ; Top # Mn [8] THAI CHARACTER MAITAIKHU..THAI CHARACTER YAMAKKAN +0EB1 ; Top # Mn LAO VOWEL SIGN MAI KAN +0EB4..0EB7 ; Top # Mn [4] LAO VOWEL SIGN I..LAO VOWEL SIGN YY +0EBB ; Top # Mn LAO VOWEL SIGN MAI KON +0EC8..0ECE ; Top # Mn [7] LAO TONE MAI EK..LAO YAMAKKAN +0F39 ; Top # Mn TIBETAN MARK TSA -PHRU +0F72 ; Top # Mn TIBETAN VOWEL SIGN I +0F7A..0F7E ; Top # Mn [5] TIBETAN VOWEL SIGN E..TIBETAN SIGN RJES SU NGA RO +0F80 ; Top # Mn TIBETAN VOWEL SIGN REVERSED I +0F82..0F83 ; Top # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +0F86..0F87 ; Top # Mn [2] TIBETAN SIGN LCI RTAGS..TIBETAN SIGN YANG RTAGS +102D..102E ; Top # Mn [2] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN II +1032..1036 ; Top # Mn [5] MYANMAR VOWEL SIGN AI..MYANMAR SIGN ANUSVARA +103A ; Top # Mn MYANMAR SIGN ASAT +1071..1074 ; Top # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1085..1086 ; Top # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109D ; Top # Mn MYANMAR VOWEL SIGN AITON AI +1712 ; Top # Mn TAGALOG VOWEL SIGN I +1732 ; Top # Mn HANUNOO VOWEL SIGN I +1752 ; Top # Mn BUHID VOWEL SIGN I +1772 ; Top # Mn TAGBANWA VOWEL SIGN I +17B7..17BA ; Top # Mn [4] KHMER VOWEL SIGN I..KHMER VOWEL SIGN YY +17C6 ; Top # Mn KHMER SIGN NIKAHIT +17C9..17D1 ; Top # Mn [9] KHMER SIGN MUUSIKATOAN..KHMER SIGN VIRIAM +17D3 ; Top # Mn KHMER SIGN BATHAMASAT +17DD ; Top # Mn KHMER SIGN ATTHACAN +1920..1921 ; Top # Mn [2] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN I +1927..1928 ; Top # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Top # Mn LIMBU SIGN KEMPHRENG +1A17 ; Top # Mn BUGINESE VOWEL SIGN I +1A1B ; Top # Mn BUGINESE VOWEL SIGN AE +1A58..1A5A ; Top # Mn [3] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN LOW PA +1A62 ; Top # Mn TAI THAM VOWEL SIGN MAI SAT +1A65..1A68 ; Top # Mn [4] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN UUE +1A6B ; Top # Mn TAI THAM VOWEL SIGN O +1A73..1A7C ; Top # Mn [10] 
TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN KHUEN-LUE KARAN +1B00..1B03 ; Top # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG +1B34 ; Top # Mn BALINESE SIGN REREKAN +1B36..1B37 ; Top # Mn [2] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN ULU SARI +1B42 ; Top # Mn BALINESE VOWEL SIGN PEPET +1B6B ; Top # Mn BALINESE MUSICAL SYMBOL COMBINING TEGEH +1B6D..1B73 ; Top # Mn [7] BALINESE MUSICAL SYMBOL COMBINING KEMPUL..BALINESE MUSICAL SYMBOL COMBINING GONG +1B80..1B81 ; Top # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR +1BA4 ; Top # Mn SUNDANESE VOWEL SIGN PANGHULU +1BA8..1BA9 ; Top # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE6 ; Top # Mn BATAK SIGN TOMPI +1BE8..1BE9 ; Top # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BED ; Top # Mn BATAK VOWEL SIGN KARO O +1BEF..1BF1 ; Top # Mn [3] BATAK VOWEL SIGN U FOR SIMALUNGUN SA..BATAK CONSONANT SIGN H +1C2D..1C33 ; Top # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +1C36 ; Top # Mn LEPCHA SIGN RAN +1CD0..1CD2 ; Top # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CDA..1CDB ; Top # Mn [2] VEDIC TONE DOUBLE SVARITA..VEDIC TONE TRIPLE SVARITA +1CE0 ; Top # Mn VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CF4 ; Top # Mn VEDIC TONE CANDRA ABOVE +1DFB ; Top # Mn COMBINING DELETION MARK +20F0 ; Top # Mn COMBINING ASTERISK ABOVE +A802 ; Top # Mn SYLOTI NAGRI SIGN DVISVARA +A806 ; Top # Mn SYLOTI NAGRI SIGN HASANTA +A80B ; Top # Mn SYLOTI NAGRI SIGN ANUSVARA +A826 ; Top # Mn SYLOTI NAGRI VOWEL SIGN E +A8C5 ; Top # Mn SAURASHTRA SIGN CANDRABINDU +A8E0..A8F1 ; Top # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +A8FF ; Top # Mn DEVANAGARI VOWEL SIGN AY +A926..A92A ; Top # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O +A94A ; Top # Mn REJANG VOWEL SIGN AI +A94F..A951 ; Top # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A980..A982 ; Top # Mn [3] JAVANESE SIGN PANYANGGA..JAVANESE SIGN LAYAR +A9B3 ; Top # Mn JAVANESE SIGN 
CECAK TELU +A9B6..A9B7 ; Top # Mn [2] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN WULU MELIK +A9BC ; Top # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Top # Mn MYANMAR SIGN SHAN SAW +AA29..AA2C ; Top # Mn [4] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN EI +AA2E ; Top # Mn CHAM VOWEL SIGN OE +AA31 ; Top # Mn CHAM VOWEL SIGN AU +AA43 ; Top # Mn CHAM CONSONANT SIGN FINAL NG +AA4C ; Top # Mn CHAM CONSONANT SIGN FINAL M +AA7C ; Top # Mn MYANMAR SIGN TAI LAING TONE-2 +AAB0 ; Top # Mn TAI VIET MAI KANG +AAB2..AAB3 ; Top # Mn [2] TAI VIET VOWEL I..TAI VIET VOWEL UE +AAB7..AAB8 ; Top # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AABE..AABF ; Top # Mn [2] TAI VIET VOWEL AM..TAI VIET TONE MAI EK +AAC1 ; Top # Mn TAI VIET TONE MAI THO +AAED ; Top # Mn MEETEI MAYEK VOWEL SIGN AAI +ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP +10A05 ; Top # Mn KHAROSHTHI VOWEL SIGN E +10A0F ; Top # Mn KHAROSHTHI SIGN VISARGA +10A38 ; Top # Mn KHAROSHTHI SIGN BAR ABOVE +11001 ; Top # Mn BRAHMI SIGN ANUSVARA +11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II +11042..11046 ; Top # Mn [5] BRAHMI VOWEL SIGN E..BRAHMI VIRAMA +11070 ; Top # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11073..11074 ; Top # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +11080..11081 ; Top # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI VOWEL SIGN AI +11100..11102 ; Top # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA +11127..11129 ; Top # Mn [3] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN II +1112D ; Top # Mn CHAKMA VOWEL SIGN AI +11130 ; Top # Mn CHAKMA VOWEL SIGN OI +11134 ; Top # Mn CHAKMA MAAYYAA +11180..11181 ; Top # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +111BC..111BE ; Top # Mn [3] SHARADA VOWEL SIGN E..SHARADA VOWEL SIGN O +111C2..111C3 ; Top # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA +111CB ; Top # Mn SHARADA VOWEL MODIFIER MARK +111CF ; Top # Mn SHARADA SIGN INVERTED CANDRABINDU 
+11230..11231 ; Top # Mn [2] KHOJKI VOWEL SIGN E..KHOJKI VOWEL SIGN AI +11234 ; Top # Mn KHOJKI SIGN ANUSVARA +11236..11237 ; Top # Mn [2] KHOJKI SIGN NUKTA..KHOJKI SIGN SHADDA +1123E ; Top # Mn KHOJKI SIGN SUKUN +112DF ; Top # Mn KHUDAWADI SIGN ANUSVARA +112E5..112E8 ; Top # Mn [4] KHUDAWADI VOWEL SIGN E..KHUDAWADI VOWEL SIGN AU +11300..11301 ; Top # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11340 ; Top # Mn GRANTHA VOWEL SIGN II +11366..1136C ; Top # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Top # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA +113CE ; Top # Mn TULU-TIGALARI SIGN VIRAMA +113D1 ; Top # Lo TULU-TIGALARI REPHA +113E1 ; Top # Mn TULU-TIGALARI VEDIC TONE SVARITA +1143E..1143F ; Top # Mn [2] NEWA VOWEL SIGN E..NEWA VOWEL SIGN AI +11443..11444 ; Top # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +1145E ; Top # Mn NEWA SANDHI MARK +114BA ; Top # Mn TIRHUTA VOWEL SIGN SHORT E +114BF..114C0 ; Top # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Top # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +11639..1163A ; Top # Mn [2] MODI VOWEL SIGN E..MODI VOWEL SIGN AI +1163D ; Top # Mn MODI SIGN ANUSVARA +11640 ; Top # Mn MODI SIGN ARDHACANDRA +116AB ; Top # Mn TAKRI SIGN ANUSVARA +116AD ; Top # Mn TAKRI VOWEL SIGN AA +116B2..116B5 ; Top # Mn [4] TAKRI VOWEL SIGN E..TAKRI VOWEL SIGN AU +1171F ; Top # Mn AHOM CONSONANT SIGN MEDIAL LIGATING RA +11722..11723 ; Top # Mn [2] AHOM VOWEL SIGN I..AHOM VOWEL SIGN II +11727 ; Top # Mn AHOM VOWEL SIGN AW +11729..1172B ; Top # Mn [3] AHOM VOWEL SIGN AI..AHOM SIGN KILLER +11833..11837 ; Top # Mn [5] DOGRA VOWEL SIGN E..DOGRA SIGN ANUSVARA +1193B..1193C ; Top # Mn [2] DIVES AKURU SIGN ANUSVARA..DIVES AKURU SIGN CANDRABINDU +1193F ; Top # Lo DIVES AKURU PREFIXED NASAL SIGN +11941 ; Top # Lo DIVES AKURU INITIAL RA +119DA..119DB ; Top # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI +11A01 ; Top # 
Mn ZANABAZAR SQUARE VOWEL SIGN I +11A04..11A09 ; Top # Mn [6] ZANABAZAR SQUARE VOWEL SIGN E..ZANABAZAR SQUARE VOWEL SIGN REVERSED I +11A35..11A38 ; Top # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A3A ; Top # Lo ZANABAZAR SQUARE CLUSTER-INITIAL LETTER RA +11A51 ; Top # Mn SOYOMBO VOWEL SIGN I +11A54..11A56 ; Top # Mn [3] SOYOMBO VOWEL SIGN E..SOYOMBO VOWEL SIGN OE +11A84..11A89 ; Top # Lo [6] SOYOMBO SIGN JIHVAMULIYA..SOYOMBO CLUSTER-INITIAL LETTER SA +11A96 ; Top # Mn SOYOMBO SIGN ANUSVARA +11A98 ; Top # Mn SOYOMBO GEMINATION MARK +11C30..11C31 ; Top # Mn [2] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN II +11C38..11C3D ; Top # Mn [6] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI SIGN ANUSVARA +11CB3 ; Top # Mn MARCHEN VOWEL SIGN E +11CB5..11CB6 ; Top # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D31..11D35 ; Top # Mn [5] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN UU +11D3A ; Top # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Top # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F..11D41 ; Top # Mn [3] MASARAM GONDI VOWEL SIGN AU..MASARAM GONDI SIGN VISARGA +11D43 ; Top # Mn MASARAM GONDI SIGN CANDRA +11D90..11D91 ; Top # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI +11D95 ; Top # Mn GUNJALA GONDI SIGN ANUSVARA +11EF3 ; Top # Mn MAKASAR VOWEL SIGN I +11F00..11F01 ; Top # Mn [2] KAWI SIGN CANDRABINDU..KAWI SIGN ANUSVARA +11F02 ; Top # Lo KAWI SIGN REPHA +11F36..11F37 ; Top # Mn [2] KAWI VOWEL SIGN I..KAWI VOWEL SIGN II +11F40 ; Top # Mn KAWI VOWEL SIGN EU +11F5A ; Top # Mn KAWI SIGN NUKTA +1611E..16129 ; Top # Mn [12] GURUNG KHEMA VOWEL SIGN AA..GURUNG KHEMA VOWEL LENGTH MARK +1612D ; Top # Mn GURUNG KHEMA SIGN ANUSVARA + +# Indic_Positional_Category=Bottom + +093C ; Bottom # Mn DEVANAGARI SIGN NUKTA +0941..0944 ; Bottom # Mn [4] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN VOCALIC RR +094D ; Bottom # Mn DEVANAGARI SIGN VIRAMA +0952 ; Bottom # Mn DEVANAGARI STRESS SIGN ANUDATTA 
+0956..0957 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN UE..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BC ; Bottom # Mn BENGALI SIGN NUKTA +09C1..09C4 ; Bottom # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09CD ; Bottom # Mn BENGALI SIGN VIRAMA +09E2..09E3 ; Bottom # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3C ; Bottom # Mn GURMUKHI SIGN NUKTA +0A41..0A42 ; Bottom # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A4D ; Bottom # Mn GURMUKHI SIGN VIRAMA +0A51 ; Bottom # Mn GURMUKHI SIGN UDAAT +0A75 ; Bottom # Mn GURMUKHI SIGN YAKASH +0ABC ; Bottom # Mn GUJARATI SIGN NUKTA +0AC1..0AC4 ; Bottom # Mn [4] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN VOCALIC RR +0ACD ; Bottom # Mn GUJARATI SIGN VIRAMA +0AE2..0AE3 ; Bottom # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3C ; Bottom # Mn ORIYA SIGN NUKTA +0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B4D ; Bottom # Mn ORIYA SIGN VIRAMA +0B62..0B63 ; Bottom # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0C3C ; Bottom # Mn TELUGU SIGN NUKTA +0C56 ; Bottom # Mn TELUGU AI LENGTH MARK +0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBC ; Bottom # Mn KANNADA SIGN NUKTA +0CE2..0CE3 ; Bottom # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D41..0D44 ; Bottom # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D62..0D63 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DD4 ; Bottom # Mn SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Bottom # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0E38..0E3A ; Bottom # Mn [3] THAI CHARACTER SARA U..THAI CHARACTER PHINTHU +0EB8..0EBA ; Bottom # Mn [3] LAO VOWEL SIGN U..LAO SIGN PALI VIRAMA +0EBC ; Bottom # Mn LAO SEMIVOWEL SIGN LO +0F18..0F19 ; Bottom # Mn [2] TIBETAN ASTROLOGICAL SIGN -KHYUD 
PA..TIBETAN ASTROLOGICAL SIGN SDONG TSHUGS +0F35 ; Bottom # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Bottom # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0F71 ; Bottom # Mn TIBETAN VOWEL SIGN AA +0F74..0F75 ; Bottom # Mn [2] TIBETAN VOWEL SIGN U..TIBETAN VOWEL SIGN UU +0F84 ; Bottom # Mn TIBETAN MARK HALANTA +0F8D..0F97 ; Bottom # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Bottom # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +0FC6 ; Bottom # Mn TIBETAN SYMBOL PADMA GDAN +102F..1030 ; Bottom # Mn [2] MYANMAR VOWEL SIGN U..MYANMAR VOWEL SIGN UU +1037 ; Bottom # Mn MYANMAR SIGN DOT BELOW +103D..103E ; Bottom # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +1058..1059 ; Bottom # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +105E..1060 ; Bottom # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Bottom # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +108D ; Bottom # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +1713..1714 ; Bottom # Mn [2] TAGALOG VOWEL SIGN U..TAGALOG SIGN VIRAMA +1733 ; Bottom # Mn HANUNOO VOWEL SIGN U +1753 ; Bottom # Mn BUHID VOWEL SIGN U +1773 ; Bottom # Mn TAGBANWA VOWEL SIGN U +17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA +1922 ; Bottom # Mn LIMBU VOWEL SIGN U +1932 ; Bottom # Mn LIMBU SMALL LETTER ANUSVARA +1939 ; Bottom # Mn LIMBU SIGN MUKPHRENG +193B ; Bottom # Mn LIMBU SIGN SA-I +1A18 ; Bottom # Mn BUGINESE VOWEL SIGN U +1A56 ; Bottom # Mn TAI THAM CONSONANT SIGN MEDIAL LA +1A5B..1A5E ; Bottom # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1A69..1A6A ; Bottom # Mn [2] TAI THAM VOWEL SIGN U..TAI THAM VOWEL SIGN UU +1A6C ; Bottom # Mn TAI THAM VOWEL SIGN OA BELOW +1A7F ; Bottom # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1B38..1B3A ; Bottom # Mn [3] BALINESE VOWEL SIGN SUKU..BALINESE VOWEL SIGN RA REPA +1B6C ; Bottom # Mn BALINESE 
MUSICAL SYMBOL COMBINING ENDEP +1BA2..1BA3 ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BA5 ; Bottom # Mn SUNDANESE VOWEL SIGN PANYUKU +1BAC..1BAD ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C2C ; Bottom # Mn LEPCHA VOWEL SIGN E +1C37 ; Bottom # Mn LEPCHA SIGN NUKTA +1CD5..1CD9 ; Bottom # Mn [5] VEDIC TONE YAJURVEDIC AGGRAVATED INDEPENDENT SVARITA..VEDIC TONE YAJURVEDIC KATHAKA INDEPENDENT SVARITA SCHROEDER +1CDC..1CDF ; Bottom # Mn [4] VEDIC TONE KATHAKA ANUDATTA..VEDIC TONE THREE DOTS BELOW +1CED ; Bottom # Mn VEDIC SIGN TIRYAK +A825 ; Bottom # Mn SYLOTI NAGRI VOWEL SIGN U +A82C ; Bottom # Mn SYLOTI NAGRI SIGN ALTERNATE HASANTA +A8C4 ; Bottom # Mn SAURASHTRA SIGN VIRAMA +A92B..A92D ; Bottom # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +A947..A949 ; Bottom # Mn [3] REJANG VOWEL SIGN I..REJANG VOWEL SIGN E +A94B..A94E ; Bottom # Mn [4] REJANG VOWEL SIGN O..REJANG VOWEL SIGN EA +A9B8..A9B9 ; Bottom # Mn [2] JAVANESE VOWEL SIGN SUKU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BD ; Bottom # Mn JAVANESE CONSONANT SIGN KERET +AA2D ; Bottom # Mn CHAM VOWEL SIGN U +AA32 ; Bottom # Mn CHAM VOWEL SIGN UE +AA35..AA36 ; Bottom # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +AAB4 ; Bottom # Mn TAI VIET VOWEL U +AAEC ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UU +ABE8 ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK +10A02..10A03 ; Bottom # Mn [2] KHAROSHTHI VOWEL SIGN U..KHAROSHTHI VOWEL SIGN VOCALIC R +10A0C..10A0E ; Bottom # Mn [3] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN ANUSVARA +10A39..10A3A ; Bottom # Mn [2] KHAROSHTHI SIGN CAUDA..KHAROSHTHI SIGN DOT BELOW +1103C..11041 ; Bottom # Mn [6] BRAHMI VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL +110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU +110B9..110BA ; Bottom # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +110C2 ; Bottom # Mn KAITHI VOWEL SIGN VOCALIC R 
+1112A..1112B ; Bottom # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU +11131..11132 ; Bottom # Mn [2] CHAKMA O MARK..CHAKMA AU MARK +11173 ; Bottom # Mn MAHAJANI SIGN NUKTA +111B6..111BB ; Bottom # Mn [6] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN VOCALIC LL +111C9..111CA ; Bottom # Mn [2] SHARADA SANDHI MARK..SHARADA SIGN NUKTA +111CC ; Bottom # Mn SHARADA EXTRA SHORT VOWEL MARK +1122F ; Bottom # Mn KHOJKI VOWEL SIGN U +11241 ; Bottom # Mn KHOJKI VOWEL SIGN VOCALIC R +112E3..112E4 ; Bottom # Mn [2] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN UU +112E9..112EA ; Bottom # Mn [2] KHUDAWADI SIGN NUKTA..KHUDAWADI SIGN VIRAMA +1133B..1133C ; Bottom # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +113BB..113C0 ; Bottom # Mn [6] TULU-TIGALARI VOWEL SIGN U..TULU-TIGALARI VOWEL SIGN VOCALIC LL +113D2 ; Bottom # Mn TULU-TIGALARI GEMINATION MARK +113E2 ; Bottom # Mn TULU-TIGALARI VEDIC TONE ANUDATTA +11438..1143D ; Bottom # Mn [6] NEWA VOWEL SIGN U..NEWA VOWEL SIGN VOCALIC LL +11442 ; Bottom # Mn NEWA SIGN VIRAMA +11446 ; Bottom # Mn NEWA SIGN NUKTA +114B3..114B8 ; Bottom # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114C2..114C3 ; Bottom # Mn [2] TIRHUTA SIGN VIRAMA..TIRHUTA SIGN NUKTA +115B2..115B5 ; Bottom # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115BF..115C0 ; Bottom # Mn [2] SIDDHAM SIGN VIRAMA..SIDDHAM SIGN NUKTA +115DC..115DD ; Bottom # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11633..11638 ; Bottom # Mn [6] MODI VOWEL SIGN U..MODI VOWEL SIGN VOCALIC LL +1163F ; Bottom # Mn MODI SIGN VIRAMA +116B0..116B1 ; Bottom # Mn [2] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN UU +116B7 ; Bottom # Mn TAKRI SIGN NUKTA +1171D ; Bottom # Mn AHOM CONSONANT SIGN MEDIAL LA +11724..11725 ; Bottom # Mn [2] AHOM VOWEL SIGN U..AHOM VOWEL SIGN UU +11728 ; Bottom # Mn AHOM VOWEL SIGN O +1182F..11832 ; Bottom # Mn [4] DOGRA VOWEL SIGN U..DOGRA VOWEL SIGN VOCALIC RR +11839..1183A ; Bottom # Mn [2] DOGRA SIGN VIRAMA..DOGRA SIGN 
NUKTA +11943 ; Bottom # Mn DIVES AKURU SIGN NUKTA +119D4..119D7 ; Bottom # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR +119E0 ; Bottom # Mn NANDINAGARI SIGN VIRAMA +11A02..11A03 ; Bottom # Mn [2] ZANABAZAR SQUARE VOWEL SIGN UE..ZANABAZAR SQUARE VOWEL SIGN U +11A0A ; Bottom # Mn ZANABAZAR SQUARE VOWEL LENGTH MARK +11A33..11A34 ; Bottom # Mn [2] ZANABAZAR SQUARE FINAL CONSONANT MARK..ZANABAZAR SQUARE SIGN VIRAMA +11A3B..11A3E ; Bottom # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11A52..11A53 ; Bottom # Mn [2] SOYOMBO VOWEL SIGN UE..SOYOMBO VOWEL SIGN U +11A59..11A5B ; Bottom # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11A8A..11A95 ; Bottom # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A +11C32..11C36 ; Bottom # Mn [5] BHAIKSUKI VOWEL SIGN U..BHAIKSUKI VOWEL SIGN VOCALIC L +11C3F ; Bottom # Mn BHAIKSUKI SIGN VIRAMA +11C92..11CA7 ; Bottom # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CAA..11CB0 ; Bottom # Mn [7] MARCHEN SUBJOINED LETTER RA..MARCHEN VOWEL SIGN AA +11CB2 ; Bottom # Mn MARCHEN VOWEL SIGN U +11D36 ; Bottom # Mn MASARAM GONDI VOWEL SIGN VOCALIC R +11D42 ; Bottom # Mn MASARAM GONDI SIGN NUKTA +11D44 ; Bottom # Mn MASARAM GONDI SIGN HALANTA +11D47 ; Bottom # Mn MASARAM GONDI RA-KARA +11EF4 ; Bottom # Mn MAKASAR VOWEL SIGN U +11F38..11F3A ; Bottom # Mn [3] KAWI VOWEL SIGN U..KAWI VOWEL SIGN VOCALIC R +1612E..1612F ; Bottom # Mn [2] GURUNG KHEMA CONSONANT SIGN MEDIAL RA..GURUNG KHEMA SIGN THOLHOMA + +# Indic_Positional_Category=Top_And_Bottom + +0C48 ; Top_And_Bottom # Mn TELUGU VOWEL SIGN AI +0F73 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN II +0F76..0F79 ; Top_And_Bottom # Mn [4] TIBETAN VOWEL SIGN VOCALIC R..TIBETAN VOWEL SIGN VOCALIC LL +0F81 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN REVERSED II +1B3C ; Top_And_Bottom # Mn BALINESE VOWEL SIGN LA LENGA +1112E..1112F ; Top_And_Bottom # Mn [2] CHAKMA VOWEL SIGN O..CHAKMA 
VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Right + +0AC9 ; Top_And_Right # Mc GUJARATI VOWEL SIGN CANDRA O +0B57 ; Top_And_Right # Mc ORIYA AU LENGTH MARK +0CC0 ; Top_And_Right # Mc KANNADA VOWEL SIGN II +0CC7..0CC8 ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +1925..1926 ; Top_And_Right # Mc [2] LIMBU VOWEL SIGN OO..LIMBU VOWEL SIGN AU +1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG +111BF ; Top_And_Right # Mc SHARADA VOWEL SIGN AU +11232..11233 ; Top_And_Right # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU +113B9..113BA ; Top_And_Right # Mc [2] TULU-TIGALARI VOWEL SIGN I..TULU-TIGALARI VOWEL SIGN II + +# Indic_Positional_Category=Top_And_Left + +0B48 ; Top_And_Left # Mc ORIYA VOWEL SIGN AI +0DDA ; Top_And_Left # Mc SINHALA VOWEL SIGN DIGA KOMBUVA +17BE ; Top_And_Left # Mc KHMER VOWEL SIGN OE +1C29 ; Top_And_Left # Mc LEPCHA VOWEL SIGN OO +114BB ; Top_And_Left # Mc TIRHUTA VOWEL SIGN AI +115B9 ; Top_And_Left # Mc SIDDHAM VOWEL SIGN AI + +# Indic_Positional_Category=Top_And_Left_And_Right + +0B4C ; Top_And_Left_And_Right # Mc ORIYA VOWEL SIGN AU +0DDD ; Top_And_Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA +17BF ; Top_And_Left_And_Right # Mc KHMER VOWEL SIGN YA +115BB ; Top_And_Left_And_Right # Mc SIDDHAM VOWEL SIGN AU + +# Indic_Positional_Category=Bottom_And_Right + +1B3B ; Bottom_And_Right # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +A9BE ; Bottom_And_Right # Mc JAVANESE CONSONANT SIGN PENGKAL +A9C0 ; Bottom_And_Right # Mc JAVANESE PANGKON +11942 ; Bottom_And_Right # Mc DIVES AKURU MEDIAL RA + +# Indic_Positional_Category=Bottom_And_Left + +A9BF ; Bottom_And_Left # Mc JAVANESE CONSONANT SIGN CAKRA + +# Indic_Positional_Category=Top_And_Bottom_And_Right + +1B3D ; Top_And_Bottom_And_Right # Mc BALINESE VOWEL SIGN LA LENGA TEDUNG + +# Indic_Positional_Category=Top_And_Bottom_And_Left + +103C ; Top_And_Bottom_And_Left # 
Mc MYANMAR CONSONANT SIGN MEDIAL RA +1171E ; Top_And_Bottom_And_Left # Mc AHOM CONSONANT SIGN MEDIAL RA + +# Indic_Positional_Category=Overstruck + +1CD4 ; Overstruck # Mn VEDIC SIGN YAJURVEDIC MIDLINE SVARITA +1CE2..1CE8 ; Overstruck # Mn [7] VEDIC SIGN VISARGA SVARITA..VEDIC SIGN VISARGA ANUDATTA WITH TAIL +10A01 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN I +10A06 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN O + +# EOF diff --git a/data/16.0.0-indic-syllabic-category.txt b/data/16.0.0-indic-syllabic-category.txt new file mode 100644 index 0000000..dc07604 --- /dev/null +++ b/data/16.0.0-indic-syllabic-category.txt @@ -0,0 +1,1400 @@ +# IndicSyllabicCategory-16.0.0.txt +# Date: 2024-04-30, 21:48:21 GMT +# © 2024 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use and license, see https://www.unicode.org/terms_of_use.html +# +# Unicode Character Database +# For documentation, see https://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Syllabic_Category enumerated property +# +# Scope: This property is aimed at two general problem +# areas involving the analysis and processing of Indic scripts: +# +# 1. Specification of syllabic structure. +# 2. Specification of segmentation rules. +# +# Both of these problem areas may benefit from having defined subtypes +# of Indic script characters which are relevant to how Indic +# syllables (or aksaras) are constructed. Note that rules for +# syllabic structure in Indic scripts may differ significantly +# from how phonological syllables are defined. 
+# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Syllabic_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. +# +# The scripts assessed as Indic in the structural sense used for the +# Indic_Syllabic_Category are the following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dives Akuru, Dogra, Grantha, Gujarati, +# Gunjala Gondi, Gurmukhi, Gurung Khema, Hanunoo, Javanese, Kaithi, +# Kannada, Kawi, Kayah Li, Kharoshthi, Khmer, Khojki, Khudawadi, +# Kirat Rai, Lao, Lepcha, Limbu, Mahajani, Makasar, Malayalam, +# Marchen, Masaram Gondi, Meetei Mayek, Modi, Multani, Myanmar, +# Nandinagari, Newa, New Tai Lue, Oriya, Phags-pa, Rejang, +# Saurashtra, Sharada, Siddham, Sinhala, Soyombo, Sundanese, +# Syloti Nagri, Tagalog, Tagbanwa, Tai Le, Tai Tham, Tai Viet, Takri, +# Tamil, Telugu, Thai, Tibetan, Tirhuta, Tulu-Tigalari, and +# Zanabazar Square. +# +# All characters for all other scripts not in that list +# take the default value for this property, unless they +# are individually listed in this data file. +# + +# ================================================ + +# Property: Indic_Syllabic_Category +# +# All code points not explicitly listed for Indic_Syllabic_Category +# have the value Other. 
+# +# @missing: 0000..10FFFF; Other + +# ================================================ + +# Indic_Syllabic_Category=Bindu + +# Bindu/Anusvara (nasalization or -n) + +# [Not derivable] + +0900..0902 ; Bindu # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +0981 ; Bindu # Mn BENGALI SIGN CANDRABINDU +0982 ; Bindu # Mc BENGALI SIGN ANUSVARA +09FC ; Bindu # Lo BENGALI LETTER VEDIC ANUSVARA +0A01..0A02 ; Bindu # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A70 ; Bindu # Mn GURMUKHI TIPPI +0A81..0A82 ; Bindu # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0B01 ; Bindu # Mn ORIYA SIGN CANDRABINDU +0B02 ; Bindu # Mc ORIYA SIGN ANUSVARA +0B82 ; Bindu # Mn TAMIL SIGN ANUSVARA +0C00 ; Bindu # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C01..0C02 ; Bindu # Mc [2] TELUGU SIGN CANDRABINDU..TELUGU SIGN ANUSVARA +0C04 ; Bindu # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C80 ; Bindu # Lo KANNADA SIGN SPACING CANDRABINDU +0C81 ; Bindu # Mn KANNADA SIGN CANDRABINDU +0C82 ; Bindu # Mc KANNADA SIGN ANUSVARA +0CF3 ; Bindu # Mc KANNADA SIGN COMBINING ANUSVARA ABOVE RIGHT +0D00..0D01 ; Bindu # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D02 ; Bindu # Mc MALAYALAM SIGN ANUSVARA +0D04 ; Bindu # Lo MALAYALAM LETTER VEDIC ANUSVARA +0D81 ; Bindu # Mn SINHALA SIGN CANDRABINDU +0D82 ; Bindu # Mc SINHALA SIGN ANUSVARAYA +0E4D ; Bindu # Mn THAI CHARACTER NIKHAHIT +0ECD ; Bindu # Mn LAO NIGGAHITA +0F7E ; Bindu # Mn TIBETAN SIGN RJES SU NGA RO +0F82..0F83 ; Bindu # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +1036 ; Bindu # Mn MYANMAR SIGN ANUSVARA +17C6 ; Bindu # Mn KHMER SIGN NIKAHIT +1932 ; Bindu # Mn LIMBU SMALL LETTER ANUSVARA +1A74 ; Bindu # Mn TAI THAM SIGN MAI KANG +1B00..1B02 ; Bindu # Mn [3] BALINESE SIGN ULU RICEM..BALINESE SIGN CECEK +1B80 ; Bindu # Mn SUNDANESE SIGN PANYECEK +1C34..1C35 ; Bindu # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A80B ; Bindu # Mn SYLOTI NAGRI 
SIGN ANUSVARA +A873 ; Bindu # Lo PHAGS-PA LETTER CANDRABINDU +A880 ; Bindu # Mc SAURASHTRA SIGN ANUSVARA +A8C5 ; Bindu # Mn SAURASHTRA SIGN CANDRABINDU +A8F2..A8F3 ; Bindu # Lo [2] DEVANAGARI SIGN SPACING CANDRABINDU..DEVANAGARI SIGN CANDRABINDU VIRAMA +A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK +10A0E ; Bindu # Mn KHAROSHTHI SIGN ANUSVARA +11000 ; Bindu # Mc BRAHMI SIGN CANDRABINDU +11001 ; Bindu # Mn BRAHMI SIGN ANUSVARA +11080..11081 ; Bindu # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +11100..11101 ; Bindu # Mn [2] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN ANUSVARA +11180..11181 ; Bindu # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +111CF ; Bindu # Mn SHARADA SIGN INVERTED CANDRABINDU +11234 ; Bindu # Mn KHOJKI SIGN ANUSVARA +112DF ; Bindu # Mn KHUDAWADI SIGN ANUSVARA +11300..11301 ; Bindu # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11302 ; Bindu # Mc GRANTHA SIGN ANUSVARA +1135E..1135F ; Bindu # Lo [2] GRANTHA LETTER VEDIC ANUSVARA..GRANTHA LETTER VEDIC DOUBLE ANUSVARA +113CA ; Bindu # Mc TULU-TIGALARI SIGN CANDRA ANUNASIKA +113CC ; Bindu # Mc TULU-TIGALARI SIGN ANUSVARA +11443..11444 ; Bindu # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +1145F ; Bindu # Lo NEWA LETTER VEDIC ANUSVARA +114BF..114C0 ; Bindu # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Bindu # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +1163D ; Bindu # Mn MODI SIGN ANUSVARA +116AB ; Bindu # Mn TAKRI SIGN ANUSVARA +11837 ; Bindu # Mn DOGRA SIGN ANUSVARA +1193B..1193C ; Bindu # Mn [2] DIVES AKURU SIGN ANUSVARA..DIVES AKURU SIGN CANDRABINDU +119DE ; Bindu # Mc NANDINAGARI SIGN ANUSVARA +11A35..11A38 ; Bindu # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A96 ; Bindu # Mn SOYOMBO SIGN ANUSVARA +11C3C..11C3D ; Bindu # Mn [2] BHAIKSUKI SIGN CANDRABINDU..BHAIKSUKI SIGN ANUSVARA +11CB5..11CB6 ; Bindu # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU 
+11D40 ; Bindu # Mn MASARAM GONDI SIGN ANUSVARA +11D95 ; Bindu # Mn GUNJALA GONDI SIGN ANUSVARA +11F00..11F01 ; Bindu # Mn [2] KAWI SIGN CANDRABINDU..KAWI SIGN ANUSVARA +1612D ; Bindu # Mn GURUNG KHEMA SIGN ANUSVARA +16D40..16D41 ; Bindu # Lm [2] KIRAT RAI SIGN ANUSVARA..KIRAT RAI SIGN TONPI + +# ================================================ + +# Indic_Syllabic_Category=Visarga + +# Visarga (-h) +# Excludes letters for jihvamuliya and upadhmaniya, which are +# related, but structured somewhat differently. + +# [Not derivable] + +0903 ; Visarga # Mc DEVANAGARI SIGN VISARGA +0983 ; Visarga # Mc BENGALI SIGN VISARGA +0A03 ; Visarga # Mc GURMUKHI SIGN VISARGA +0A83 ; Visarga # Mc GUJARATI SIGN VISARGA +0B03 ; Visarga # Mc ORIYA SIGN VISARGA +0C03 ; Visarga # Mc TELUGU SIGN VISARGA +0C83 ; Visarga # Mc KANNADA SIGN VISARGA +0D03 ; Visarga # Mc MALAYALAM SIGN VISARGA +0D83 ; Visarga # Mc SINHALA SIGN VISARGAYA +0F7F ; Visarga # Mc TIBETAN SIGN RNAM BCAD +1038 ; Visarga # Mc MYANMAR SIGN VISARGA +17C7 ; Visarga # Mc KHMER SIGN REAHMUK +1B04 ; Visarga # Mc BALINESE SIGN BISAH +1B82 ; Visarga # Mc SUNDANESE SIGN PANGWISAD +A881 ; Visarga # Mc SAURASHTRA SIGN VISARGA +A983 ; Visarga # Mc JAVANESE SIGN WIGNYAN +AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA +10A0F ; Visarga # Mn KHAROSHTHI SIGN VISARGA +11002 ; Visarga # Mc BRAHMI SIGN VISARGA +11082 ; Visarga # Mc KAITHI SIGN VISARGA +11102 ; Visarga # Mn CHAKMA SIGN VISARGA +11182 ; Visarga # Mc SHARADA SIGN VISARGA +11303 ; Visarga # Mc GRANTHA SIGN VISARGA +113CD ; Visarga # Mc TULU-TIGALARI SIGN VISARGA +11445 ; Visarga # Mc NEWA SIGN VISARGA +114C1 ; Visarga # Mc TIRHUTA SIGN VISARGA +115BE ; Visarga # Mc SIDDHAM SIGN VISARGA +1163E ; Visarga # Mc MODI SIGN VISARGA +116AC ; Visarga # Mc TAKRI SIGN VISARGA +11838 ; Visarga # Mc DOGRA SIGN VISARGA +119DF ; Visarga # Mc NANDINAGARI SIGN VISARGA +11A39 ; Visarga # Mc ZANABAZAR SQUARE SIGN VISARGA +11A97 ; Visarga # Mc SOYOMBO SIGN VISARGA +11C3E ; Visarga # Mc 
BHAIKSUKI SIGN VISARGA +11D41 ; Visarga # Mn MASARAM GONDI SIGN VISARGA +11D96 ; Visarga # Mc GUNJALA GONDI SIGN VISARGA +11F03 ; Visarga # Mc KAWI SIGN VISARGA +16D42 ; Visarga # Lm KIRAT RAI SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Avagraha + +# Avagraha (elision of initial a- in sandhi) + +# [Not derivable] + +093D ; Avagraha # Lo DEVANAGARI SIGN AVAGRAHA +09BD ; Avagraha # Lo BENGALI SIGN AVAGRAHA +0ABD ; Avagraha # Lo GUJARATI SIGN AVAGRAHA +0B3D ; Avagraha # Lo ORIYA SIGN AVAGRAHA +0C3D ; Avagraha # Lo TELUGU SIGN AVAGRAHA +0CBD ; Avagraha # Lo KANNADA SIGN AVAGRAHA +0D3D ; Avagraha # Lo MALAYALAM SIGN AVAGRAHA +0F85 ; Avagraha # Po TIBETAN MARK PALUTA +17DC ; Avagraha # Lo KHMER SIGN AVAKRAHASANYA +1BBA ; Avagraha # Lo SUNDANESE AVAGRAHA +111C1 ; Avagraha # Lo SHARADA SIGN AVAGRAHA +1133D ; Avagraha # Lo GRANTHA SIGN AVAGRAHA +113B7 ; Avagraha # Lo TULU-TIGALARI SIGN AVAGRAHA +11447 ; Avagraha # Lo NEWA SIGN AVAGRAHA +114C4 ; Avagraha # Lo TIRHUTA SIGN AVAGRAHA +119E1 ; Avagraha # Lo NANDINAGARI SIGN AVAGRAHA +11A9D ; Avagraha # Lo SOYOMBO MARK PLUTA +11C40 ; Avagraha # Lo BHAIKSUKI SIGN AVAGRAHA + +# ================================================ + +# Indic_Syllabic_Category=Nukta + +# Nukta (diacritic for borrowed consonants or other consonant +# modifications). Note that while the resulting sound is typically a +# consonant, the base letter a nukta follows may be an independent +# vowel. For example, is used to transcribe ARABIC LETTER +# AIN. 
+ +# [Not derivable] + +093C ; Nukta # Mn DEVANAGARI SIGN NUKTA +09BC ; Nukta # Mn BENGALI SIGN NUKTA +0A3C ; Nukta # Mn GURMUKHI SIGN NUKTA +0ABC ; Nukta # Mn GUJARATI SIGN NUKTA +0AFD..0AFF ; Nukta # Mn [3] GUJARATI SIGN THREE-DOT NUKTA ABOVE..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0C3C ; Nukta # Mn TELUGU SIGN NUKTA +0CBC ; Nukta # Mn KANNADA SIGN NUKTA +0F39 ; Nukta # Mn TIBETAN MARK TSA -PHRU +1B34 ; Nukta # Mn BALINESE SIGN REREKAN +1BE6 ; Nukta # Mn BATAK SIGN TOMPI +1C37 ; Nukta # Mn LEPCHA SIGN NUKTA +A9B3 ; Nukta # Mn JAVANESE SIGN CECAK TELU +10A38..10A3A ; Nukta # Mn [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW +110BA ; Nukta # Mn KAITHI SIGN NUKTA +11173 ; Nukta # Mn MAHAJANI SIGN NUKTA +111CA ; Nukta # Mn SHARADA SIGN NUKTA +11236 ; Nukta # Mn KHOJKI SIGN NUKTA +112E9 ; Nukta # Mn KHUDAWADI SIGN NUKTA +1133B..1133C ; Nukta # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +11446 ; Nukta # Mn NEWA SIGN NUKTA +114C3 ; Nukta # Mn TIRHUTA SIGN NUKTA +115C0 ; Nukta # Mn SIDDHAM SIGN NUKTA +116B7 ; Nukta # Mn TAKRI SIGN NUKTA +1183A ; Nukta # Mn DOGRA SIGN NUKTA +11943 ; Nukta # Mn DIVES AKURU SIGN NUKTA +11D42 ; Nukta # Mn MASARAM GONDI SIGN NUKTA +11F5A ; Nukta # Mn KAWI SIGN NUKTA + +# ================================================ + +# Indic_Syllabic_Category=Virama + +# Virama (kills inherent vowel of consonant; may act as a Pure_Killer +# or Invisible_Stacker depending on context) +# Only includes characters that can act both as visible killer viramas +# and consonant stackers. Separate property values exist for characters +# that can only act as pure killers, only as reordering killers, or only +# as consonant stackers. 
+ +# [Derivation: (ccc=9) - (InSC=Pure_Killer) - (InSC=Invisible_Stacker) +# - (InSC=Reordering_Killer) - (InSC=Number_Joiner) - 2D7F] + +094D ; Virama # Mn DEVANAGARI SIGN VIRAMA +09CD ; Virama # Mn BENGALI SIGN VIRAMA +0A4D ; Virama # Mn GURMUKHI SIGN VIRAMA +0ACD ; Virama # Mn GUJARATI SIGN VIRAMA +0B4D ; Virama # Mn ORIYA SIGN VIRAMA +0BCD ; Virama # Mn TAMIL SIGN VIRAMA +0C4D ; Virama # Mn TELUGU SIGN VIRAMA +0CCD ; Virama # Mn KANNADA SIGN VIRAMA +0D4D ; Virama # Mn MALAYALAM SIGN VIRAMA +0DCA ; Virama # Mn SINHALA SIGN AL-LAKUNA +1B44 ; Virama # Mc BALINESE ADEG ADEG +A806 ; Virama # Mn SYLOTI NAGRI SIGN HASANTA +A8C4 ; Virama # Mn SAURASHTRA SIGN VIRAMA +A9C0 ; Virama # Mc JAVANESE PANGKON +11046 ; Virama # Mn BRAHMI VIRAMA +110B9 ; Virama # Mn KAITHI SIGN VIRAMA +111C0 ; Virama # Mc SHARADA SIGN VIRAMA +11235 ; Virama # Mc KHOJKI SIGN VIRAMA +1134D ; Virama # Mc GRANTHA SIGN VIRAMA +11442 ; Virama # Mn NEWA SIGN VIRAMA +114C2 ; Virama # Mn TIRHUTA SIGN VIRAMA +115BF ; Virama # Mn SIDDHAM SIGN VIRAMA +1163F ; Virama # Mn MODI SIGN VIRAMA +116B6 ; Virama # Mc TAKRI SIGN VIRAMA +11839 ; Virama # Mn DOGRA SIGN VIRAMA +119E0 ; Virama # Mn NANDINAGARI SIGN VIRAMA +11C3F ; Virama # Mn BHAIKSUKI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Pure_Killer + +# Pure killer (kills inherent vowel of consonant; always visible; +# has no conjuct formation, consonant stacking, or reordering +# behavior) + +# [Not derivable] + +0D3B..0D3C ; Pure_Killer # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0E3A ; Pure_Killer # Mn THAI CHARACTER PHINTHU +0E4E ; Pure_Killer # Mn THAI CHARACTER YAMAKKAN +0EBA ; Pure_Killer # Mn LAO SIGN PALI VIRAMA +0F84 ; Pure_Killer # Mn TIBETAN MARK HALANTA +103A ; Pure_Killer # Mn MYANMAR SIGN ASAT +1714 ; Pure_Killer # Mn TAGALOG SIGN VIRAMA +1715 ; Pure_Killer # Mc TAGALOG SIGN PAMUDPOD +1734 ; Pure_Killer # Mc HANUNOO SIGN PAMUDPOD +17D1 ; Pure_Killer # Mn KHMER SIGN 
VIRIAM +1A7A ; Pure_Killer # Mn TAI THAM SIGN RA HAAM +1BAA ; Pure_Killer # Mc SUNDANESE SIGN PAMAAEH +A82C ; Pure_Killer # Mn SYLOTI NAGRI SIGN ALTERNATE HASANTA +A953 ; Pure_Killer # Mc REJANG VIRAMA +ABED ; Pure_Killer # Mn MEETEI MAYEK APUN IYEK +11070 ; Pure_Killer # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11134 ; Pure_Killer # Mn CHAKMA MAAYYAA +112EA ; Pure_Killer # Mn KHUDAWADI SIGN VIRAMA +113CE ; Pure_Killer # Mn TULU-TIGALARI SIGN VIRAMA +113CF ; Pure_Killer # Mc TULU-TIGALARI SIGN LOOPED VIRAMA +1172B ; Pure_Killer # Mn AHOM SIGN KILLER +1193D ; Pure_Killer # Mc DIVES AKURU SIGN HALANTA +11A34 ; Pure_Killer # Mn ZANABAZAR SQUARE SIGN VIRAMA +11D44 ; Pure_Killer # Mn MASARAM GONDI SIGN HALANTA +11F41 ; Pure_Killer # Mc KAWI SIGN KILLER +1612F ; Pure_Killer # Mn GURUNG KHEMA SIGN THOLHOMA +16D6B..16D6C ; Pure_Killer # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT + +# ================================================ + +# Indic_Syllabic_Category=Reordering_Killer + +# Reordering killer (kills inherent vowel of consonant; always visible; +# may cause consonant reordering) + +# [Not derivable] + +1BF2..1BF3 ; Reordering_Killer # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN + +# ================================================ + +# Indic_Syllabic_Category=Invisible_Stacker + +# Invisible stacker (usually kills inherent vowel of consonant; is not visible +# by itself; causes conjunct formation or consonant +# stacking) +# +# Note that in some scripts, such as Kharoshthi and Masaram Gondi, an invisible +# stacker may have a second function, changing the shape and/or location of the +# consonant preceding it, even when there is no consonant following the +# invisible stacker. 
+ +# [Not derivable] + +1039 ; Invisible_Stacker # Mn MYANMAR SIGN VIRAMA +17D2 ; Invisible_Stacker # Mn KHMER SIGN COENG +1A60 ; Invisible_Stacker # Mn TAI THAM SIGN SAKOT +1BAB ; Invisible_Stacker # Mn SUNDANESE SIGN VIRAMA +AAF6 ; Invisible_Stacker # Mn MEETEI MAYEK VIRAMA +10A3F ; Invisible_Stacker # Mn KHAROSHTHI VIRAMA +11133 ; Invisible_Stacker # Mn CHAKMA VIRAMA +113D0 ; Invisible_Stacker # Mn TULU-TIGALARI CONJOINER +1193E ; Invisible_Stacker # Mn DIVES AKURU VIRAMA +11A47 ; Invisible_Stacker # Mn ZANABAZAR SQUARE SUBJOINER +11A99 ; Invisible_Stacker # Mn SOYOMBO SUBJOINER +11D45 ; Invisible_Stacker # Mn MASARAM GONDI VIRAMA +11D97 ; Invisible_Stacker # Mn GUNJALA GONDI VIRAMA +11F42 ; Invisible_Stacker # Mn KAWI CONJOINER + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Independent + +# Independent Vowels (contrasted with matras) + +# [Not derivable] + +0904..0914 ; Vowel_Independent # Lo [17] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER AU +0960..0961 ; Vowel_Independent # Lo [2] DEVANAGARI LETTER VOCALIC RR..DEVANAGARI LETTER VOCALIC LL +0972..0977 ; Vowel_Independent # Lo [6] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER UUE +0985..098C ; Vowel_Independent # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L +098F..0990 ; Vowel_Independent # Lo [2] BENGALI LETTER E..BENGALI LETTER AI +0993..0994 ; Vowel_Independent # Lo [2] BENGALI LETTER O..BENGALI LETTER AU +09E0..09E1 ; Vowel_Independent # Lo [2] BENGALI LETTER VOCALIC RR..BENGALI LETTER VOCALIC LL +0A05..0A0A ; Vowel_Independent # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU +0A0F..0A10 ; Vowel_Independent # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI +0A13..0A14 ; Vowel_Independent # Lo [2] GURMUKHI LETTER OO..GURMUKHI LETTER AU +0A85..0A8D ; Vowel_Independent # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E +0A8F..0A91 ; Vowel_Independent # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O +0A93..0A94 ; Vowel_Independent # Lo [2] GUJARATI LETTER 
O..GUJARATI LETTER AU +0AE0..0AE1 ; Vowel_Independent # Lo [2] GUJARATI LETTER VOCALIC RR..GUJARATI LETTER VOCALIC LL +0B05..0B0C ; Vowel_Independent # Lo [8] ORIYA LETTER A..ORIYA LETTER VOCALIC L +0B0F..0B10 ; Vowel_Independent # Lo [2] ORIYA LETTER E..ORIYA LETTER AI +0B13..0B14 ; Vowel_Independent # Lo [2] ORIYA LETTER O..ORIYA LETTER AU +0B60..0B61 ; Vowel_Independent # Lo [2] ORIYA LETTER VOCALIC RR..ORIYA LETTER VOCALIC LL +0B85..0B8A ; Vowel_Independent # Lo [6] TAMIL LETTER A..TAMIL LETTER UU +0B8E..0B90 ; Vowel_Independent # Lo [3] TAMIL LETTER E..TAMIL LETTER AI +0B92..0B94 ; Vowel_Independent # Lo [3] TAMIL LETTER O..TAMIL LETTER AU +0C05..0C0C ; Vowel_Independent # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L +0C0E..0C10 ; Vowel_Independent # Lo [3] TELUGU LETTER E..TELUGU LETTER AI +0C12..0C14 ; Vowel_Independent # Lo [3] TELUGU LETTER O..TELUGU LETTER AU +0C60..0C61 ; Vowel_Independent # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL +0C85..0C8C ; Vowel_Independent # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L +0C8E..0C90 ; Vowel_Independent # Lo [3] KANNADA LETTER E..KANNADA LETTER AI +0C92..0C94 ; Vowel_Independent # Lo [3] KANNADA LETTER O..KANNADA LETTER AU +0CE0..0CE1 ; Vowel_Independent # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL +0D05..0D0C ; Vowel_Independent # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L +0D0E..0D10 ; Vowel_Independent # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI +0D12..0D14 ; Vowel_Independent # Lo [3] MALAYALAM LETTER O..MALAYALAM LETTER AU +0D5F..0D61 ; Vowel_Independent # Lo [3] MALAYALAM LETTER ARCHAIC II..MALAYALAM LETTER VOCALIC LL +0D85..0D96 ; Vowel_Independent # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA +1021..102A ; Vowel_Independent # Lo [10] MYANMAR LETTER A..MYANMAR LETTER AU +1052..1055 ; Vowel_Independent # Lo [4] MYANMAR LETTER VOCALIC R..MYANMAR LETTER VOCALIC LL +1700..1702 ; Vowel_Independent # Lo [3] TAGALOG LETTER A..TAGALOG LETTER U 
+1720..1722 ; Vowel_Independent # Lo [3] HANUNOO LETTER A..HANUNOO LETTER U +1740..1742 ; Vowel_Independent # Lo [3] BUHID LETTER A..BUHID LETTER U +1760..1762 ; Vowel_Independent # Lo [3] TAGBANWA LETTER A..TAGBANWA LETTER U +17A3..17B3 ; Vowel_Independent # Lo [17] KHMER INDEPENDENT VOWEL QAQ..KHMER INDEPENDENT VOWEL QAU +1A4D..1A52 ; Vowel_Independent # Lo [6] TAI THAM LETTER I..TAI THAM LETTER OO +1B05..1B12 ; Vowel_Independent # Lo [14] BALINESE LETTER AKARA..BALINESE LETTER OKARA TEDUNG +1B83..1B89 ; Vowel_Independent # Lo [7] SUNDANESE LETTER A..SUNDANESE LETTER EU +1BE4..1BE5 ; Vowel_Independent # Lo [2] BATAK LETTER I..BATAK LETTER U +A800..A801 ; Vowel_Independent # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I +A803..A805 ; Vowel_Independent # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O +A882..A891 ; Vowel_Independent # Lo [16] SAURASHTRA LETTER A..SAURASHTRA LETTER AU +A8FE ; Vowel_Independent # Lo DEVANAGARI LETTER AY +A984..A988 ; Vowel_Independent # Lo [5] JAVANESE LETTER A..JAVANESE LETTER U +A98C..A98E ; Vowel_Independent # Lo [3] JAVANESE LETTER E..JAVANESE LETTER O +AA00..AA05 ; Vowel_Independent # Lo [6] CHAM LETTER A..CHAM LETTER O +AAE0..AAE1 ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER E..MEETEI MAYEK LETTER O +ABCE..ABCF ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER UN..MEETEI MAYEK LETTER I +ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA +11005..11012 ; Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU +11071..11072 ; Vowel_Independent # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER A..KAITHI LETTER AU +11103..11106 ; Vowel_Independent # Lo [4] CHAKMA LETTER AA..CHAKMA LETTER E +11183..11190 ; Vowel_Independent # Lo [14] SHARADA LETTER A..SHARADA LETTER AU +11200..11207 ; Vowel_Independent # Lo [8] KHOJKI LETTER A..KHOJKI LETTER AU +11240 ; Vowel_Independent # Lo KHOJKI LETTER SHORT I +11280..11283 ; 
Vowel_Independent # Lo [4] MULTANI LETTER A..MULTANI LETTER E +112B0..112B9 ; Vowel_Independent # Lo [10] KHUDAWADI LETTER A..KHUDAWADI LETTER AU +11305..1130C ; Vowel_Independent # Lo [8] GRANTHA LETTER A..GRANTHA LETTER VOCALIC L +1130F..11310 ; Vowel_Independent # Lo [2] GRANTHA LETTER EE..GRANTHA LETTER AI +11313..11314 ; Vowel_Independent # Lo [2] GRANTHA LETTER OO..GRANTHA LETTER AU +11360..11361 ; Vowel_Independent # Lo [2] GRANTHA LETTER VOCALIC RR..GRANTHA LETTER VOCALIC LL +11380..11389 ; Vowel_Independent # Lo [10] TULU-TIGALARI LETTER A..TULU-TIGALARI LETTER VOCALIC LL +1138B ; Vowel_Independent # Lo TULU-TIGALARI LETTER EE +1138E ; Vowel_Independent # Lo TULU-TIGALARI LETTER AI +11390..11391 ; Vowel_Independent # Lo [2] TULU-TIGALARI LETTER OO..TULU-TIGALARI LETTER AU +11400..1140D ; Vowel_Independent # Lo [14] NEWA LETTER A..NEWA LETTER AU +11481..1148E ; Vowel_Independent # Lo [14] TIRHUTA LETTER A..TIRHUTA LETTER AU +11580..1158D ; Vowel_Independent # Lo [14] SIDDHAM LETTER A..SIDDHAM LETTER AU +115D8..115DB ; Vowel_Independent # Lo [4] SIDDHAM LETTER THREE-CIRCLE ALTERNATE I..SIDDHAM LETTER ALTERNATE U +11600..1160D ; Vowel_Independent # Lo [14] MODI LETTER A..MODI LETTER AU +11680..11689 ; Vowel_Independent # Lo [10] TAKRI LETTER A..TAKRI LETTER AU +11800..11809 ; Vowel_Independent # Lo [10] DOGRA LETTER A..DOGRA LETTER AU +11900..11906 ; Vowel_Independent # Lo [7] DIVES AKURU LETTER A..DIVES AKURU LETTER E +11909 ; Vowel_Independent # Lo DIVES AKURU LETTER O +119A0..119A7 ; Vowel_Independent # Lo [8] NANDINAGARI LETTER A..NANDINAGARI LETTER VOCALIC RR +119AA..119AD ; Vowel_Independent # Lo [4] NANDINAGARI LETTER E..NANDINAGARI LETTER AU +11A00 ; Vowel_Independent # Lo ZANABAZAR SQUARE LETTER A +11A50 ; Vowel_Independent # Lo SOYOMBO LETTER A +11C00..11C08 ; Vowel_Independent # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L +11C0A..11C0D ; Vowel_Independent # Lo [4] BHAIKSUKI LETTER E..BHAIKSUKI LETTER AU +11D00..11D06 ; Vowel_Independent # 
Lo [7] MASARAM GONDI LETTER A..MASARAM GONDI LETTER E +11D08..11D09 ; Vowel_Independent # Lo [2] MASARAM GONDI LETTER AI..MASARAM GONDI LETTER O +11D0B ; Vowel_Independent # Lo MASARAM GONDI LETTER AU +11D60..11D65 ; Vowel_Independent # Lo [6] GUNJALA GONDI LETTER A..GUNJALA GONDI LETTER UU +11D67..11D68 ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER EE..GUNJALA GONDI LETTER AI +11D6A..11D6B ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER OO..GUNJALA GONDI LETTER AU +11F04..11F10 ; Vowel_Independent # Lo [13] KAWI LETTER A..KAWI LETTER O +16100 ; Vowel_Independent # Lo GURUNG KHEMA LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Dependent + +# Dependent Vowels (contrasted with independent vowels and/or with +# complex placement). Known as matras in Indic scripts. Also +# includes vowel modifiers that follow dependent (and sometimes +# independent) vowels. + +# [Not derivable] + +093A ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN OE +093B ; Vowel_Dependent # Mc DEVANAGARI VOWEL SIGN OOE +093E..0940 ; Vowel_Dependent # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II +0941..0948 ; Vowel_Dependent # Mn [8] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN AI +0949..094C ; Vowel_Dependent # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094E..094F ; Vowel_Dependent # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA E..DEVANAGARI VOWEL SIGN AW +0955..0957 ; Vowel_Dependent # Mn [3] DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Vowel_Dependent # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BE..09C0 ; Vowel_Dependent # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II +09C1..09C4 ; Vowel_Dependent # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09C7..09C8 ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +09CB..09CC ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +09D7 ; 
Vowel_Dependent # Mc BENGALI AU LENGTH MARK +09E2..09E3 ; Vowel_Dependent # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3E..0A40 ; Vowel_Dependent # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II +0A41..0A42 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A47..0A48 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0ABE..0AC0 ; Vowel_Dependent # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL SIGN II +0AC1..0AC5 ; Vowel_Dependent # Mn [5] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AC9 ; Vowel_Dependent # Mc GUJARATI VOWEL SIGN CANDRA O +0ACB..0ACC ; Vowel_Dependent # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0AE2..0AE3 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3E ; Vowel_Dependent # Mc ORIYA VOWEL SIGN AA +0B3F ; Vowel_Dependent # Mn ORIYA VOWEL SIGN I +0B40 ; Vowel_Dependent # Mc ORIYA VOWEL SIGN II +0B41..0B44 ; Vowel_Dependent # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B47..0B48 ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI +0B4B..0B4C ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU +0B55..0B56 ; Vowel_Dependent # Mn [2] ORIYA SIGN OVERLINE..ORIYA AI LENGTH MARK +0B57 ; Vowel_Dependent # Mc ORIYA AU LENGTH MARK +0B62..0B63 ; Vowel_Dependent # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BBE..0BBF ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC0 ; Vowel_Dependent # Mn TAMIL VOWEL SIGN II +0BC1..0BC2 ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BC6..0BC8 ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0BCA..0BCC ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0BD7 ; Vowel_Dependent # 
Mc TAMIL AU LENGTH MARK +0C3E..0C40 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C41..0C44 ; Vowel_Dependent # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C46..0C48 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI +0C4A..0C4C ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C55..0C56 ; Vowel_Dependent # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK +0C62..0C63 ; Vowel_Dependent # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBE ; Vowel_Dependent # Mc KANNADA VOWEL SIGN AA +0CBF ; Vowel_Dependent # Mn KANNADA VOWEL SIGN I +0CC0..0CC4 ; Vowel_Dependent # Mc [5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN VOCALIC RR +0CC6 ; Vowel_Dependent # Mn KANNADA VOWEL SIGN E +0CC7..0CC8 ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +0CCC ; Vowel_Dependent # Mn KANNADA VOWEL SIGN AU +0CD5..0CD6 ; Vowel_Dependent # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CE2..0CE3 ; Vowel_Dependent # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D3E..0D40 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D44 ; Vowel_Dependent # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D46..0D48 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0D4A..0D4C ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0D57 ; Vowel_Dependent # Mc MALAYALAM AU LENGTH MARK +0D62..0D63 ; Vowel_Dependent # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DCF..0DD1 ; Vowel_Dependent # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD2..0DD4 ; Vowel_Dependent # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Vowel_Dependent # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0DD8..0DDF ; Vowel_Dependent 
# Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Vowel_Dependent # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Vowel_Dependent # Lo THAI CHARACTER SARA A +0E31 ; Vowel_Dependent # Mn THAI CHARACTER MAI HAN-AKAT +0E32..0E33 ; Vowel_Dependent # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E34..0E39 ; Vowel_Dependent # Mn [6] THAI CHARACTER SARA I..THAI CHARACTER SARA UU +0E40..0E45 ; Vowel_Dependent # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO +0E47 ; Vowel_Dependent # Mn THAI CHARACTER MAITAIKHU +0EB0 ; Vowel_Dependent # Lo LAO VOWEL SIGN A +0EB1 ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KAN +0EB2..0EB3 ; Vowel_Dependent # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0EB4..0EB9 ; Vowel_Dependent # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU +0EBB ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KON +0EC0..0EC4 ; Vowel_Dependent # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +0F71..0F7D ; Vowel_Dependent # Mn [13] TIBETAN VOWEL SIGN AA..TIBETAN VOWEL SIGN OO +0F80..0F81 ; Vowel_Dependent # Mn [2] TIBETAN VOWEL SIGN REVERSED I..TIBETAN VOWEL SIGN REVERSED II +102B..102C ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +102D..1030 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN UU +1031 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN E +1032..1035 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +1056..1057 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1058..1059 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1062 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1071..1074 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1083..1084 ; Vowel_Dependent # Mc [2] 
MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E +1085..1086 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109C ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN AITON A +109D ; Vowel_Dependent # Mn MYANMAR VOWEL SIGN AITON AI +1712..1713 ; Vowel_Dependent # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U +1732..1733 ; Vowel_Dependent # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1752..1753 ; Vowel_Dependent # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U +1772..1773 ; Vowel_Dependent # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U +17B6 ; Vowel_Dependent # Mc KHMER VOWEL SIGN AA +17B7..17BD ; Vowel_Dependent # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL SIGN UA +17BE..17C5 ; Vowel_Dependent # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU +17C8 ; Vowel_Dependent # Mc KHMER SIGN YUUKALEAPINTU +1920..1922 ; Vowel_Dependent # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U +1923..1926 ; Vowel_Dependent # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU +1927..1928 ; Vowel_Dependent # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Vowel_Dependent # Mn LIMBU SIGN KEMPHRENG +19B0..19C0 ; Vowel_Dependent # Lo [17] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN IY +1A17..1A18 ; Vowel_Dependent # Mn [2] BUGINESE VOWEL SIGN I..BUGINESE VOWEL SIGN U +1A19..1A1A ; Vowel_Dependent # Mc [2] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN O +1A1B ; Vowel_Dependent # Mn BUGINESE VOWEL SIGN AE +1A61 ; Vowel_Dependent # Mc TAI THAM VOWEL SIGN A +1A62 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN MAI SAT +1A63..1A64 ; Vowel_Dependent # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A65..1A6C ; Vowel_Dependent # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW +1A6D..1A72 ; Vowel_Dependent # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI +1A73 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN OA ABOVE +1B35 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN TEDUNG +1B36..1B3A ; Vowel_Dependent # 
Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA +1B3B ; Vowel_Dependent # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +1B3C ; Vowel_Dependent # Mn BALINESE VOWEL SIGN LA LENGA +1B3D..1B41 ; Vowel_Dependent # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1B42 ; Vowel_Dependent # Mn BALINESE VOWEL SIGN PEPET +1B43 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN PEPET TEDUNG +1BA4..1BA5 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PANGHULU..SUNDANESE VOWEL SIGN PANYUKU +1BA6..1BA7 ; Vowel_Dependent # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL SIGN PANOLONG +1BA8..1BA9 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE7 ; Vowel_Dependent # Mc BATAK VOWEL SIGN E +1BE8..1BE9 ; Vowel_Dependent # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BEA..1BEC ; Vowel_Dependent # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BED ; Vowel_Dependent # Mn BATAK VOWEL SIGN KARO O +1BEE ; Vowel_Dependent # Mc BATAK VOWEL SIGN U +1BEF ; Vowel_Dependent # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +1C26..1C2B ; Vowel_Dependent # Mc [6] LEPCHA VOWEL SIGN AA..LEPCHA VOWEL SIGN UU +1C2C ; Vowel_Dependent # Mn LEPCHA VOWEL SIGN E +A802 ; Vowel_Dependent # Mn SYLOTI NAGRI SIGN DVISVARA +A823..A824 ; Vowel_Dependent # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A825..A826 ; Vowel_Dependent # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E +A827 ; Vowel_Dependent # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Vowel_Dependent # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A8FF ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN AY +A947..A94E ; Vowel_Dependent # Mn [8] REJANG VOWEL SIGN I..REJANG VOWEL SIGN EA +A9B4..A9B5 ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9B6..A9B9 ; Vowel_Dependent # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BA..A9BB ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN 
TALING..JAVANESE VOWEL SIGN DIRGA MURE +A9BC ; Vowel_Dependent # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Vowel_Dependent # Mn MYANMAR SIGN SHAN SAW +AA29..AA2E ; Vowel_Dependent # Mn [6] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN OE +AA2F..AA30 ; Vowel_Dependent # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA31..AA32 ; Vowel_Dependent # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE +AAB0 ; Vowel_Dependent # Mn TAI VIET MAI KANG +AAB1 ; Vowel_Dependent # Lo TAI VIET VOWEL AA +AAB2..AAB4 ; Vowel_Dependent # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U +AAB5..AAB6 ; Vowel_Dependent # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB7..AAB8 ; Vowel_Dependent # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AAB9..AABD ; Vowel_Dependent # Lo [5] TAI VIET VOWEL UEA..TAI VIET VOWEL AN +AABE ; Vowel_Dependent # Mn TAI VIET VOWEL AM +AAEB ; Vowel_Dependent # Mc MEETEI MAYEK VOWEL SIGN II +AAEC..AAED ; Vowel_Dependent # Mn [2] MEETEI MAYEK VOWEL SIGN UU..MEETEI MAYEK VOWEL SIGN AAI +AAEE..AAEF ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN AU..MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE5 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN ANAP +ABE6..ABE7 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE8 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +10A01..10A03 ; Vowel_Dependent # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R +10A05..10A06 ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O +10A0C..10A0D ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN DOUBLE RING BELOW +11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +11073..11074 ; Vowel_Dependent # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +110B0..110B2 ; 
Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II +110B3..110B6 ; Vowel_Dependent # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI +110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +110C2 ; Vowel_Dependent # Mn KAITHI VOWEL SIGN VOCALIC R +11127..1112B ; Vowel_Dependent # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU +1112C ; Vowel_Dependent # Mc CHAKMA VOWEL SIGN E +1112D..11132 ; Vowel_Dependent # Mn [6] CHAKMA VOWEL SIGN AI..CHAKMA AU MARK +11145..11146 ; Vowel_Dependent # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +111B3..111B5 ; Vowel_Dependent # Mc [3] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN II +111B6..111BE ; Vowel_Dependent # Mn [9] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN O +111BF ; Vowel_Dependent # Mc SHARADA VOWEL SIGN AU +111CB..111CC ; Vowel_Dependent # Mn [2] SHARADA VOWEL MODIFIER MARK..SHARADA EXTRA SHORT VOWEL MARK +111CE ; Vowel_Dependent # Mc SHARADA VOWEL SIGN PRISHTHAMATRA E +1122C..1122E ; Vowel_Dependent # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +1122F..11231 ; Vowel_Dependent # Mn [3] KHOJKI VOWEL SIGN U..KHOJKI VOWEL SIGN AI +11232..11233 ; Vowel_Dependent # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU +11241 ; Vowel_Dependent # Mn KHOJKI VOWEL SIGN VOCALIC R +112E0..112E2 ; Vowel_Dependent # Mc [3] KHUDAWADI VOWEL SIGN AA..KHUDAWADI VOWEL SIGN II +112E3..112E8 ; Vowel_Dependent # Mn [6] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN AU +1133E..1133F ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11340 ; Vowel_Dependent # Mn GRANTHA VOWEL SIGN II +11341..11344 ; Vowel_Dependent # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +11347..11348 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +1134B..1134C ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +11357 ; Vowel_Dependent # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA 
VOWEL SIGN VOCALIC LL +113B8..113BA ; Vowel_Dependent # Mc [3] TULU-TIGALARI VOWEL SIGN AA..TULU-TIGALARI VOWEL SIGN II +113BB..113C0 ; Vowel_Dependent # Mn [6] TULU-TIGALARI VOWEL SIGN U..TULU-TIGALARI VOWEL SIGN VOCALIC LL +113C2 ; Vowel_Dependent # Mc TULU-TIGALARI VOWEL SIGN EE +113C5 ; Vowel_Dependent # Mc TULU-TIGALARI VOWEL SIGN AI +113C7..113C9 ; Vowel_Dependent # Mc [3] TULU-TIGALARI VOWEL SIGN OO..TULU-TIGALARI AU LENGTH MARK +11435..11437 ; Vowel_Dependent # Mc [3] NEWA VOWEL SIGN AA..NEWA VOWEL SIGN II +11438..1143F ; Vowel_Dependent # Mn [8] NEWA VOWEL SIGN U..NEWA VOWEL SIGN AI +11440..11441 ; Vowel_Dependent # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +114B0..114B2 ; Vowel_Dependent # Mc [3] TIRHUTA VOWEL SIGN AA..TIRHUTA VOWEL SIGN II +114B3..114B8 ; Vowel_Dependent # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114B9 ; Vowel_Dependent # Mc TIRHUTA VOWEL SIGN E +114BA ; Vowel_Dependent # Mn TIRHUTA VOWEL SIGN SHORT E +114BB..114BE ; Vowel_Dependent # Mc [4] TIRHUTA VOWEL SIGN AI..TIRHUTA VOWEL SIGN AU +115AF..115B1 ; Vowel_Dependent # Mc [3] SIDDHAM VOWEL SIGN AA..SIDDHAM VOWEL SIGN II +115B2..115B5 ; Vowel_Dependent # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115B8..115BB ; Vowel_Dependent # Mc [4] SIDDHAM VOWEL SIGN E..SIDDHAM VOWEL SIGN AU +115DC..115DD ; Vowel_Dependent # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11630..11632 ; Vowel_Dependent # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +11633..1163A ; Vowel_Dependent # Mn [8] MODI VOWEL SIGN U..MODI VOWEL SIGN AI +1163B..1163C ; Vowel_Dependent # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +11640 ; Vowel_Dependent # Mn MODI SIGN ARDHACANDRA +116AD ; Vowel_Dependent # Mn TAKRI VOWEL SIGN AA +116AE..116AF ; Vowel_Dependent # Mc [2] TAKRI VOWEL SIGN I..TAKRI VOWEL SIGN II +116B0..116B5 ; Vowel_Dependent # Mn [6] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN AU +11720..11721 ; Vowel_Dependent # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN 
AA +11722..11725 ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN I..AHOM VOWEL SIGN UU +11726 ; Vowel_Dependent # Mc AHOM VOWEL SIGN E +11727..1172A ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN AW..AHOM VOWEL SIGN AM +1182C..1182E ; Vowel_Dependent # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II +1182F..11836 ; Vowel_Dependent # Mn [8] DOGRA VOWEL SIGN U..DOGRA VOWEL SIGN AU +11930..11935 ; Vowel_Dependent # Mc [6] DIVES AKURU VOWEL SIGN AA..DIVES AKURU VOWEL SIGN E +11937..11938 ; Vowel_Dependent # Mc [2] DIVES AKURU VOWEL SIGN AI..DIVES AKURU VOWEL SIGN O +119D1..119D3 ; Vowel_Dependent # Mc [3] NANDINAGARI VOWEL SIGN AA..NANDINAGARI VOWEL SIGN II +119D4..119D7 ; Vowel_Dependent # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR +119DA..119DB ; Vowel_Dependent # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI +119DC..119DD ; Vowel_Dependent # Mc [2] NANDINAGARI VOWEL SIGN O..NANDINAGARI VOWEL SIGN AU +119E4 ; Vowel_Dependent # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E +11A01..11A0A ; Vowel_Dependent # Mn [10] ZANABAZAR SQUARE VOWEL SIGN I..ZANABAZAR SQUARE VOWEL LENGTH MARK +11A51..11A56 ; Vowel_Dependent # Mn [6] SOYOMBO VOWEL SIGN I..SOYOMBO VOWEL SIGN OE +11A57..11A58 ; Vowel_Dependent # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A59..11A5B ; Vowel_Dependent # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11C2F ; Vowel_Dependent # Mc BHAIKSUKI VOWEL SIGN AA +11C30..11C36 ; Vowel_Dependent # Mn [7] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN VOCALIC L +11C38..11C3B ; Vowel_Dependent # Mn [4] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI VOWEL SIGN AU +11CB0 ; Vowel_Dependent # Mn MARCHEN VOWEL SIGN AA +11CB1 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN I +11CB2..11CB3 ; Vowel_Dependent # Mn [2] MARCHEN VOWEL SIGN U..MARCHEN VOWEL SIGN E +11CB4 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN O +11D31..11D36 ; Vowel_Dependent # Mn [6] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN VOCALIC R +11D3A ; Vowel_Dependent # Mn 
MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Vowel_Dependent # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN AU +11D43 ; Vowel_Dependent # Mn MASARAM GONDI SIGN CANDRA +11D8A..11D8E ; Vowel_Dependent # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D90..11D91 ; Vowel_Dependent # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI +11D93..11D94 ; Vowel_Dependent # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11EF3..11EF4 ; Vowel_Dependent # Mn [2] MAKASAR VOWEL SIGN I..MAKASAR VOWEL SIGN U +11EF5..11EF6 ; Vowel_Dependent # Mc [2] MAKASAR VOWEL SIGN E..MAKASAR VOWEL SIGN O +11F34..11F35 ; Vowel_Dependent # Mc [2] KAWI VOWEL SIGN AA..KAWI VOWEL SIGN ALTERNATE AA +11F36..11F3A ; Vowel_Dependent # Mn [5] KAWI VOWEL SIGN I..KAWI VOWEL SIGN VOCALIC R +11F3E..11F3F ; Vowel_Dependent # Mc [2] KAWI VOWEL SIGN E..KAWI VOWEL SIGN AI +11F40 ; Vowel_Dependent # Mn KAWI VOWEL SIGN EU +1611E..16129 ; Vowel_Dependent # Mn [12] GURUNG KHEMA VOWEL SIGN AA..GURUNG KHEMA VOWEL LENGTH MARK +16D63..16D6A ; Vowel_Dependent # Lo [8] KIRAT RAI VOWEL SIGN AA..KIRAT RAI VOWEL SIGN AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel + +# (Other) Vowels (reanalyzed as ordinary alphabetic letters or marks) + +# [Not derivable] + +1963..196D ; Vowel # Lo [11] TAI LE LETTER A..TAI LE LETTER AI +A85E..A861 ; Vowel # Lo [4] PHAGS-PA LETTER I..PHAGS-PA LETTER O +A866 ; Vowel # Lo PHAGS-PA LETTER EE +A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO +A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O +11150..11154 ; Vowel # Lo [5] MAHAJANI LETTER A..MAHAJANI LETTER O + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Placeholder + +# Consonant Placeholder +# This includes generic placeholders used for +# Indic script layout (NBSP and dotted circle), as well as a few 
script- +# specific vowel-holder characters which are not technically +# consonants, but serve instead as bases for placement of vowel marks. + +# [Not derivable] + +002D ; Consonant_Placeholder # Pd HYPHEN-MINUS +00A0 ; Consonant_Placeholder # Zs NO-BREAK SPACE +00D7 ; Consonant_Placeholder # Sm MULTIPLICATION SIGN +0980 ; Consonant_Placeholder # Lo BENGALI ANJI +0A72..0A73 ; Consonant_Placeholder # Lo [2] GURMUKHI IRI..GURMUKHI URA +104B ; Consonant_Placeholder # Po MYANMAR SIGN SECTION +104E ; Consonant_Placeholder # Po MYANMAR SYMBOL AFOREMENTIONED +1900 ; Consonant_Placeholder # Lo LIMBU VOWEL-CARRIER LETTER +1CFA ; Consonant_Placeholder # Lo VEDIC SIGN DOUBLE ANUSVARA ANTARGOMUKHA +2010..2014 ; Consonant_Placeholder # Pd [5] HYPHEN..EM DASH +25CC ; Consonant_Placeholder # So DOTTED CIRCLE +AA74..AA76 ; Consonant_Placeholder # Lo [3] MYANMAR LOGOGRAM KHAMTI OAY..MYANMAR LOGOGRAM KHAMTI HM +11A3F ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL HEAD MARK +11A45 ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL DOUBLE-LINED HEAD MARK +11EF2 ; Consonant_Placeholder # Lo MAKASAR ANGKA + +# ================================================ + +# Indic_Syllabic_Category=Consonant + +# Consonant (ordinary abugida consonants, with inherent vowels) + +# [Not derivable] + +0915..0939 ; Consonant # Lo [37] DEVANAGARI LETTER KA..DEVANAGARI LETTER HA +0958..095F ; Consonant # Lo [8] DEVANAGARI LETTER QA..DEVANAGARI LETTER YYA +0978..097F ; Consonant # Lo [8] DEVANAGARI LETTER MARWARI DDA..DEVANAGARI LETTER BBA +0995..09A8 ; Consonant # Lo [20] BENGALI LETTER KA..BENGALI LETTER NA +09AA..09B0 ; Consonant # Lo [7] BENGALI LETTER PA..BENGALI LETTER RA +09B2 ; Consonant # Lo BENGALI LETTER LA +09B6..09B9 ; Consonant # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA +09DC..09DD ; Consonant # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA +09DF ; Consonant # Lo BENGALI LETTER YYA +09F0..09F1 ; Consonant # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH 
LOWER DIAGONAL +0A15..0A28 ; Consonant # Lo [20] GURMUKHI LETTER KA..GURMUKHI LETTER NA +0A2A..0A30 ; Consonant # Lo [7] GURMUKHI LETTER PA..GURMUKHI LETTER RA +0A32..0A33 ; Consonant # Lo [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA +0A35..0A36 ; Consonant # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA +0A38..0A39 ; Consonant # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA +0A59..0A5C ; Consonant # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA +0A5E ; Consonant # Lo GURMUKHI LETTER FA +0A95..0AA8 ; Consonant # Lo [20] GUJARATI LETTER KA..GUJARATI LETTER NA +0AAA..0AB0 ; Consonant # Lo [7] GUJARATI LETTER PA..GUJARATI LETTER RA +0AB2..0AB3 ; Consonant # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA +0AB5..0AB9 ; Consonant # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA +0AF9 ; Consonant # Lo GUJARATI LETTER ZHA +0B15..0B28 ; Consonant # Lo [20] ORIYA LETTER KA..ORIYA LETTER NA +0B2A..0B30 ; Consonant # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA +0B32..0B33 ; Consonant # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA +0B35..0B39 ; Consonant # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA +0B5C..0B5D ; Consonant # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA +0B5F ; Consonant # Lo ORIYA LETTER YYA +0B71 ; Consonant # Lo ORIYA LETTER WA +0B95 ; Consonant # Lo TAMIL LETTER KA +0B99..0B9A ; Consonant # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA +0B9C ; Consonant # Lo TAMIL LETTER JA +0B9E..0B9F ; Consonant # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA +0BA3..0BA4 ; Consonant # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA +0BA8..0BAA ; Consonant # Lo [3] TAMIL LETTER NA..TAMIL LETTER PA +0BAE..0BB9 ; Consonant # Lo [12] TAMIL LETTER MA..TAMIL LETTER HA +0C15..0C28 ; Consonant # Lo [20] TELUGU LETTER KA..TELUGU LETTER NA +0C2A..0C39 ; Consonant # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C58..0C5A ; Consonant # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C95..0CA8 ; Consonant # Lo [20] KANNADA LETTER KA..KANNADA LETTER NA +0CAA..0CB3 ; Consonant # Lo [10] KANNADA LETTER PA..KANNADA 
LETTER LLA +0CB5..0CB9 ; Consonant # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA +0CDE ; Consonant # Lo KANNADA LETTER FA +0D15..0D3A ; Consonant # Lo [38] MALAYALAM LETTER KA..MALAYALAM LETTER TTTA +0D9A..0DB1 ; Consonant # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA +0DB3..0DBB ; Consonant # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA +0DBD ; Consonant # Lo SINHALA LETTER DANTAJA LAYANNA +0DC0..0DC6 ; Consonant # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA +0E01..0E2E ; Consonant # Lo [46] THAI CHARACTER KO KAI..THAI CHARACTER HO NOKHUK +0E81..0E82 ; Consonant # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG +0E84 ; Consonant # Lo LAO LETTER KHO TAM +0E86..0E8A ; Consonant # Lo [5] LAO LETTER PALI GHA..LAO LETTER SO TAM +0E8C..0EA3 ; Consonant # Lo [24] LAO LETTER PALI JHA..LAO LETTER LO LING +0EA5 ; Consonant # Lo LAO LETTER LO LOOT +0EA7..0EAE ; Consonant # Lo [8] LAO LETTER WO..LAO LETTER HO TAM +0EDC..0EDF ; Consonant # Lo [4] LAO HO NO..LAO LETTER KHMU NYO +0F40..0F47 ; Consonant # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA +0F49..0F6C ; Consonant # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA +1000..1020 ; Consonant # Lo [33] MYANMAR LETTER KA..MYANMAR LETTER LLA +103F ; Consonant # Lo MYANMAR LETTER GREAT SA +1050..1051 ; Consonant # Lo [2] MYANMAR LETTER SHA..MYANMAR LETTER SSA +105A..105D ; Consonant # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE +1061 ; Consonant # Lo MYANMAR LETTER SGAW KAREN SHA +1065..1066 ; Consonant # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER WESTERN PWO KAREN PWA +106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA +1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA +108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA +1703..1711 ; Consonant # Lo [15] TAGALOG LETTER KA..TAGALOG LETTER HA +171F ; Consonant # Lo TAGALOG LETTER ARCHAIC RA +1723..1731 ; Consonant # Lo 
[15] HANUNOO LETTER KA..HANUNOO LETTER HA +1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA +1763..176C ; Consonant # Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA +176E..1770 ; Consonant # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA +1780..17A2 ; Consonant # Lo [35] KHMER LETTER KA..KHMER LETTER QA +1901..191E ; Consonant # Lo [30] LIMBU LETTER KA..LIMBU LETTER TRA +1950..1962 ; Consonant # Lo [19] TAI LE LETTER KA..TAI LE LETTER NA +1980..19AB ; Consonant # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI LUE LETTER LOW SUA +1A00..1A16 ; Consonant # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA +1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA +1A53..1A54 ; Consonant # Lo [2] TAI THAM LETTER LAE..TAI THAM LETTER GREAT SA +1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA +1B45..1B4C ; Consonant # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA +1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA +1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA +1BBB..1BBD ; Consonant # Lo [3] SUNDANESE LETTER REU..SUNDANESE LETTER BHA +1BC0..1BE3 ; Consonant # Lo [36] BATAK LETTER A..BATAK LETTER MBA +1C00..1C23 ; Consonant # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A +1C4D..1C4F ; Consonant # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA +A807..A80A ; Consonant # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO +A80C..A822 ; Consonant # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO +A840..A85D ; Consonant # Lo [30] PHAGS-PA LETTER KA..PHAGS-PA LETTER A +A862..A865 ; Consonant # Lo [4] PHAGS-PA LETTER QA..PHAGS-PA LETTER GGA +A869..A870 ; Consonant # Lo [8] PHAGS-PA LETTER TTA..PHAGS-PA LETTER ASPIRATED FA +A872 ; Consonant # Lo PHAGS-PA SUPERFIXED LETTER RA +A892..A8B3 ; Consonant # Lo [34] SAURASHTRA LETTER KA..SAURASHTRA LETTER LLA +A90A..A921 ; Consonant # Lo [24] KAYAH LI LETTER KA..KAYAH LI LETTER CA +A930..A946 ; Consonant # Lo 
[23] REJANG LETTER KA..REJANG LETTER A +A989..A98B ; Consonant # Lo [3] JAVANESE LETTER PA CEREK..JAVANESE LETTER NGA LELET RASWADI +A98F..A9B2 ; Consonant # Lo [36] JAVANESE LETTER KA..JAVANESE LETTER HA +A9E0..A9E4 ; Consonant # Lo [5] MYANMAR LETTER SHAN GHA..MYANMAR LETTER SHAN BHA +A9E7..A9EF ; Consonant # Lo [9] MYANMAR LETTER TAI LAING NYA..MYANMAR LETTER TAI LAING NNA +A9FA..A9FE ; Consonant # Lo [5] MYANMAR LETTER TAI LAING LLA..MYANMAR LETTER TAI LAING BHA +AA06..AA28 ; Consonant # Lo [35] CHAM LETTER KA..CHAM LETTER HA +AA60..AA6F ; Consonant # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA +AA71..AA73 ; Consonant # Lo [3] MYANMAR LETTER KHAMTI XA..MYANMAR LETTER KHAMTI RA +AA7A ; Consonant # Lo MYANMAR LETTER AITON RA +AA7E..AA7F ; Consonant # Lo [2] MYANMAR LETTER SHWE PALAUNG CHA..MYANMAR LETTER SHWE PALAUNG SHA +AA80..AAAF ; Consonant # Lo [48] TAI VIET LETTER LOW KO..TAI VIET LETTER HIGH O +AAE2..AAEA ; Consonant # Lo [9] MEETEI MAYEK LETTER CHA..MEETEI MAYEK LETTER SSA +ABC0..ABCD ; Consonant # Lo [14] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER HUK +ABD0 ; Consonant # Lo MEETEI MAYEK LETTER PHAM +ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTER BHAM +10A00 ; Consonant # Lo KHAROSHTHI LETTER A +10A10..10A13 ; Consonant # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA +10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA +10A19..10A35 ; Consonant # Lo [29] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER VHA +11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER OLD TAMIL NNNA +11075 ; Consonant # Lo BRAHMI LETTER OLD TAMIL LLA +1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA +11107..11126 ; Consonant # Lo [32] CHAKMA LETTER KAA..CHAKMA LETTER HAA +11144 ; Consonant # Lo CHAKMA LETTER LHAA +11147 ; Consonant # Lo CHAKMA LETTER VAA +11155..11172 ; Consonant # Lo [30] MAHAJANI LETTER KA..MAHAJANI LETTER RRA +11191..111B2 ; Consonant # Lo [34] SHARADA LETTER 
KA..SHARADA LETTER HA +11208..11211 ; Consonant # Lo [10] KHOJKI LETTER KA..KHOJKI LETTER JJA +11213..1122B ; Consonant # Lo [25] KHOJKI LETTER NYA..KHOJKI LETTER LLA +1123F ; Consonant # Lo KHOJKI LETTER QA +11284..11286 ; Consonant # Lo [3] MULTANI LETTER KA..MULTANI LETTER GA +11288 ; Consonant # Lo MULTANI LETTER GHA +1128A..1128D ; Consonant # Lo [4] MULTANI LETTER CA..MULTANI LETTER JJA +1128F..1129D ; Consonant # Lo [15] MULTANI LETTER NYA..MULTANI LETTER BA +1129F..112A8 ; Consonant # Lo [10] MULTANI LETTER BHA..MULTANI LETTER RHA +112BA..112DE ; Consonant # Lo [37] KHUDAWADI LETTER KA..KHUDAWADI LETTER HA +11315..11328 ; Consonant # Lo [20] GRANTHA LETTER KA..GRANTHA LETTER NA +1132A..11330 ; Consonant # Lo [7] GRANTHA LETTER PA..GRANTHA LETTER RA +11332..11333 ; Consonant # Lo [2] GRANTHA LETTER LA..GRANTHA LETTER LLA +11335..11339 ; Consonant # Lo [5] GRANTHA LETTER VA..GRANTHA LETTER HA +11392..113B5 ; Consonant # Lo [36] TULU-TIGALARI LETTER KA..TULU-TIGALARI LETTER LLLA +1140E..11434 ; Consonant # Lo [39] NEWA LETTER KA..NEWA LETTER HA +1148F..114AF ; Consonant # Lo [33] TIRHUTA LETTER KA..TIRHUTA LETTER HA +1158E..115AE ; Consonant # Lo [33] SIDDHAM LETTER KA..SIDDHAM LETTER HA +1160E..1162F ; Consonant # Lo [34] MODI LETTER KA..MODI LETTER LLA +1168A..116AA ; Consonant # Lo [33] TAKRI LETTER KA..TAKRI LETTER RRA +116B8 ; Consonant # Lo TAKRI LETTER ARCHAIC KHA +11700..1171A ; Consonant # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA +11740..11746 ; Consonant # Lo [7] AHOM LETTER CA..AHOM LETTER LLA +1180A..1182B ; Consonant # Lo [34] DOGRA LETTER KA..DOGRA LETTER RRA +1190C..11913 ; Consonant # Lo [8] DIVES AKURU LETTER KA..DIVES AKURU LETTER JA +11915..11916 ; Consonant # Lo [2] DIVES AKURU LETTER NYA..DIVES AKURU LETTER TTA +11918..1192F ; Consonant # Lo [24] DIVES AKURU LETTER DDA..DIVES AKURU LETTER ZA +119AE..119D0 ; Consonant # Lo [35] NANDINAGARI LETTER KA..NANDINAGARI LETTER RRA +11A0B..11A32 ; Consonant # Lo [40] ZANABAZAR SQUARE LETTER 
KA..ZANABAZAR SQUARE LETTER KSSA +11A5C..11A83 ; Consonant # Lo [40] SOYOMBO LETTER KA..SOYOMBO LETTER KSSA +11C0E..11C2E ; Consonant # Lo [33] BHAIKSUKI LETTER KA..BHAIKSUKI LETTER HA +11C72..11C8F ; Consonant # Lo [30] MARCHEN LETTER KA..MARCHEN LETTER A +11D0C..11D30 ; Consonant # Lo [37] MASARAM GONDI LETTER KA..MASARAM GONDI LETTER TRA +11D6C..11D89 ; Consonant # Lo [30] GUNJALA GONDI LETTER YA..GUNJALA GONDI LETTER SA +11EE0..11EF1 ; Consonant # Lo [18] MAKASAR LETTER KA..MAKASAR LETTER A +11F12..11F33 ; Consonant # Lo [34] KAWI LETTER KA..KAWI LETTER JNYA +16101..1611D ; Consonant # Lo [29] GURUNG KHEMA LETTER KA..GURUNG KHEMA LETTER SA +16D43..16D62 ; Consonant # Lo [32] KIRAT RAI LETTER A..KIRAT RAI LETTER HA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Dead + +# Dead Consonant (special consonant with killed vowel) + +# [Not derivable] + +09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0C5D ; Consonant_Dead # Lo TELUGU LETTER NAKAARA POLLU +0CDD ; Consonant_Dead # Lo KANNADA LETTER NAKAARA POLLU +0D54..0D56 ; Consonant_Dead # Lo [3] MALAYALAM LETTER CHILLU M..MALAYALAM LETTER CHILLU LLL +0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K +1CF2..1CF3 ; Consonant_Dead # Lo [2] VEDIC SIGN ARDHAVISARGA..VEDIC SIGN ROTATED ARDHAVISARGA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_With_Stacker + +# Consonants that may make stacked ligatures with the next consonant +# without the use of a virama + +# [Not derivable] + +0CF1..0CF2 ; Consonant_With_Stacker # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA +1CF5..1CF6 ; Consonant_With_Stacker # Lo [2] VEDIC SIGN JIHVAMULIYA..VEDIC SIGN UPADHMANIYA +11003..11004 ; Consonant_With_Stacker # Lo [2] BRAHMI SIGN JIHVAMULIYA..BRAHMI SIGN UPADHMANIYA +11460..11461 ; Consonant_With_Stacker # Lo [2] NEWA SIGN JIHVAMULIYA..NEWA SIGN UPADHMANIYA + +# 
================================================ + +# Indic_Syllabic_Category=Consonant_Prefixed + +# Cluster-initial consonants + +# [Not derivable] + +111C2..111C3 ; Consonant_Prefixed # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA +1193F ; Consonant_Prefixed # Lo DIVES AKURU PREFIXED NASAL SIGN +11A3A ; Consonant_Prefixed # Lo ZANABAZAR SQUARE CLUSTER-INITIAL LETTER RA +11A84..11A89 ; Consonant_Prefixed # Lo [6] SOYOMBO SIGN JIHVAMULIYA..SOYOMBO CLUSTER-INITIAL LETTER SA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Preceding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when preceding the main +# consonant. + +# [Not derivable] + +0D4E ; Consonant_Preceding_Repha # Lo MALAYALAM LETTER DOT REPH +113D1 ; Consonant_Preceding_Repha # Lo TULU-TIGALARI REPHA +11941 ; Consonant_Preceding_Repha # Lo DIVES AKURU INITIAL RA +11D46 ; Consonant_Preceding_Repha # Lo MASARAM GONDI REPHA +11F02 ; Consonant_Preceding_Repha # Lo KAWI SIGN REPHA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Initial_Postfixed + +# Consonants that succeed the main consonant in character sequences, but are +# pronounced before it. + +# [Not derivable] + +1A5A ; Consonant_Initial_Postfixed # Mn TAI THAM CONSONANT SIGN LOW PA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Succeeding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when succeeding the main +# consonant. + +# [Not derivable] + +17CC ; Consonant_Succeeding_Repha # Mn KHMER SIGN ROBAT + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Subjoined + +# Subjoined Consonant (C2 form subtending a base consonant in Tibetan, etc.) 
+ +# [Not derivable] + +0F8D..0F97 ; Consonant_Subjoined # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Consonant_Subjoined # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +1929..192B ; Consonant_Subjoined # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1A57 ; Consonant_Subjoined # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A5B..1A5E ; Consonant_Subjoined # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1BA1 ; Consonant_Subjoined # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA2..1BA3 ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BAC..1BAD ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C24..1C25 ; Consonant_Subjoined # Mc [2] LEPCHA SUBJOINED LETTER YA..LEPCHA SUBJOINED LETTER RA +A867..A868 ; Consonant_Subjoined # Lo [2] PHAGS-PA SUBJOINED LETTER WA..PHAGS-PA SUBJOINED LETTER YA +A871 ; Consonant_Subjoined # Lo PHAGS-PA SUBJOINED LETTER RA +11C92..11CA7 ; Consonant_Subjoined # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CA9 ; Consonant_Subjoined # Mc MARCHEN SUBJOINED LETTER YA +11CAA..11CAF ; Consonant_Subjoined # Mn [6] MARCHEN SUBJOINED LETTER RA..MARCHEN SUBJOINED LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Medial + +# Medial Consonant (medial liquid, occurring in clusters) + +# [Not derivable] + +0A75 ; Consonant_Medial # Mn GURMUKHI SIGN YAKASH +0EBC ; Consonant_Medial # Mn LAO SEMIVOWEL SIGN LO +0EBD ; Consonant_Medial # Lo LAO SEMIVOWEL SIGN NYO +103B..103C ; Consonant_Medial # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA +103D..103E ; Consonant_Medial # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +105E..1060 ; Consonant_Medial # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT 
SIGN MON MEDIAL LA +1082 ; Consonant_Medial # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +1A55 ; Consonant_Medial # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A56 ; Consonant_Medial # Mn TAI THAM CONSONANT SIGN MEDIAL LA +A8B4 ; Consonant_Medial # Mc SAURASHTRA CONSONANT SIGN HAARU +A9BD ; Consonant_Medial # Mn JAVANESE CONSONANT SIGN KERET +A9BE..A9BF ; Consonant_Medial # Mc [2] JAVANESE CONSONANT SIGN PENGKAL..JAVANESE CONSONANT SIGN CAKRA +AA33..AA34 ; Consonant_Medial # Mc [2] CHAM CONSONANT SIGN YA..CHAM CONSONANT SIGN RA +AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +1171D ; Consonant_Medial # Mn AHOM CONSONANT SIGN MEDIAL LA +1171E ; Consonant_Medial # Mc AHOM CONSONANT SIGN MEDIAL RA +1171F ; Consonant_Medial # Mn AHOM CONSONANT SIGN MEDIAL LIGATING RA +11940 ; Consonant_Medial # Mc DIVES AKURU MEDIAL YA +11942 ; Consonant_Medial # Mc DIVES AKURU MEDIAL RA +11A3B..11A3E ; Consonant_Medial # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11D47 ; Consonant_Medial # Mn MASARAM GONDI RA-KARA +1612A..1612C ; Consonant_Medial # Mc [3] GURUNG KHEMA CONSONANT SIGN MEDIAL YA..GURUNG KHEMA CONSONANT SIGN MEDIAL HA +1612E ; Consonant_Medial # Mn GURUNG KHEMA CONSONANT SIGN MEDIAL RA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Final + +# Final Consonant (special final forms which do not take vowels) + +# [Not derivable] + +1930..1931 ; Consonant_Final # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Consonant_Final # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +1939 ; Consonant_Final # Mn LIMBU SIGN MUKPHRENG +19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B +1A58..1A59 ; Consonant_Final # Mn [2] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN FINAL NGA +1B03 ; Consonant_Final # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Final # Mn SUNDANESE SIGN PANGLAYAR +1BBE..1BBF ; 
Consonant_Final # Lo [2] SUNDANESE LETTER FINAL K..SUNDANESE LETTER FINAL M +1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H +1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +A94F..A951 ; Consonant_Final # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A952 ; Consonant_Final # Mc REJANG CONSONANT SIGN H +A982 ; Consonant_Final # Mn JAVANESE SIGN LAYAR +AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG +AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG +AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS +AA4C ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL M +AA4D ; Consonant_Final # Mc CHAM CONSONANT SIGN FINAL H +ABDB..ABE2 ; Consonant_Final # Lo [8] MEETEI MAYEK LETTER KOK LONSUM..MEETEI MAYEK LETTER I LONSUM +11A8A..11A95 ; Consonant_Final # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Head_Letter + +# Head Letter (Tibetan) + +# [Not derivable] + +0F88..0F8C ; Consonant_Head_Letter # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN + +# ================================================ + +# Indic_Syllabic_Category=Modifying_Letter + +# Reanalyzed letters not participating in the abugida structure, but +# serving to modify the sound of an adjacent vowel or consonant. +# Note that this is not the same as General_Category=Modifier_Letter. 
+ +# [Not derivable] + +0B83 ; Modifying_Letter # Lo TAMIL SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Tone_Letter + +# Tone Letter (spacing lexical tone mark with status as a letter) + +# [Not derivable] + +1970..1974 ; Tone_Letter # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6 +AAC0 ; Tone_Letter # Lo TAI VIET TONE MAI NUENG +AAC2 ; Tone_Letter # Lo TAI VIET TONE MAI SONG + +# ================================================ + +# Indic_Syllabic_Category=Tone_Mark + +# Tone Mark (nonspacing or spacing lexical tone mark) + +# [Not derivable] + +0E48..0E4B ; Tone_Mark # Mn [4] THAI CHARACTER MAI EK..THAI CHARACTER MAI CHATTAWA +0EC8..0ECB ; Tone_Mark # Mn [4] LAO TONE MAI EK..LAO TONE MAI CATAWA +1037 ; Tone_Mark # Mn MYANMAR SIGN DOT BELOW +1063..1064 ; Tone_Mark # Mc [2] MYANMAR TONE MARK SGAW KAREN HATHI..MYANMAR TONE MARK SGAW KAREN KE PHO +1069..106D ; Tone_Mark # Mc [5] MYANMAR SIGN WESTERN PWO KAREN TONE-1..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1087..108C ; Tone_Mark # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108D ; Tone_Mark # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +108F ; Tone_Mark # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109B ; Tone_Mark # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 +19C8..19C9 ; Tone_Mark # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A75..1A79 ; Tone_Mark # Mn [5] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN TONE-5 +A92B..A92D ; Tone_Mark # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +AA7B ; Tone_Mark # Mc MYANMAR SIGN PAO KAREN TONE +AA7C ; Tone_Mark # Mn MYANMAR SIGN TAI LAING TONE-2 +AA7D ; Tone_Mark # Mc MYANMAR SIGN TAI LAING TONE-5 +AABF ; Tone_Mark # Mn TAI VIET TONE MAI EK +AAC1 ; Tone_Mark # Mn TAI VIET TONE MAI THO +ABEC ; Tone_Mark # Mc MEETEI MAYEK LUM IYEK + +# ================================================ + +# Indic_Syllabic_Category=Gemination_Mark + +# Gemination Mark (doubling of the 
preceding or following consonant) +# +# U+0A71 GURMUKHI ADDAK precedes the consonant it geminates, while the +# others follow the consonant they geminate. + +# [Not derivable] + +0A71 ; Gemination_Mark # Mn GURMUKHI ADDAK +0AFB ; Gemination_Mark # Mn GUJARATI SIGN SHADDA +11237 ; Gemination_Mark # Mn KHOJKI SIGN SHADDA +113D2 ; Gemination_Mark # Mn TULU-TIGALARI GEMINATION MARK +11A98 ; Gemination_Mark # Mn SOYOMBO GEMINATION MARK + +# ================================================ + +# Indic_Syllabic_Category=Cantillation_Mark + +# Cantillation Mark (recitation marks, such as svara markers for the Samaveda) + +# [Not derivable] + +0951..0952 ; Cantillation_Mark # Mn [2] DEVANAGARI STRESS SIGN UDATTA..DEVANAGARI STRESS SIGN ANUDATTA +0A51 ; Cantillation_Mark # Mn GURMUKHI SIGN UDAAT +0AFA ; Cantillation_Mark # Mn GUJARATI SIGN SUKUN +0AFC ; Cantillation_Mark # Mn GUJARATI SIGN MADDAH +1CD0..1CD2 ; Cantillation_Mark # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CD4..1CE0 ; Cantillation_Mark # Mn [13] VEDIC SIGN YAJURVEDIC MIDLINE SVARITA..VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CE1 ; Cantillation_Mark # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF4 ; Cantillation_Mark # Mn VEDIC TONE CANDRA ABOVE +1CF7 ; Cantillation_Mark # Mc VEDIC SIGN ATIKRAMA +1CF8..1CF9 ; Cantillation_Mark # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE +20F0 ; Cantillation_Mark # Mn COMBINING ASTERISK ABOVE +A8E0..A8F1 ; Cantillation_Mark # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +1123E ; Cantillation_Mark # Mn KHOJKI SIGN SUKUN +11366..1136C ; Cantillation_Mark # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Cantillation_Mark # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA +113E1..113E2 ; Cantillation_Mark # Mn [2] TULU-TIGALARI VEDIC TONE SVARITA..TULU-TIGALARI VEDIC TONE ANUDATTA + +# ================================================ + +# 
Indic_Syllabic_Category=Register_Shifter + +# Register Shifter (shifts register for consonants, akin to a tone mark) + +# [Not derivable] + +17C9..17CA ; Register_Shifter # Mn [2] KHMER SIGN MUUSIKATOAN..KHMER SIGN TRIISAP + +# ================================================ + +# Indic_Syllabic_Category=Syllable_Modifier + +# Syllable Modifier (miscellaneous combining characters that modify +# something in the orthographic syllable they succeed or appear in) + +# [Not derivable] + +00B2..00B3 ; Syllable_Modifier # No [2] SUPERSCRIPT TWO..SUPERSCRIPT THREE +09FE ; Syllable_Modifier # Mn BENGALI SANDHI MARK +0ECE ; Syllable_Modifier # Mn LAO YAMAKKAN +0F35 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0FC6 ; Syllable_Modifier # Mn TIBETAN SYMBOL PADMA GDAN +17CB ; Syllable_Modifier # Mn KHMER SIGN BANTOC +17CE..17D0 ; Syllable_Modifier # Mn [3] KHMER SIGN KAKABAT..KHMER SIGN SAMYOK SANNYA +17D3 ; Syllable_Modifier # Mn KHMER SIGN BATHAMASAT +17DD ; Syllable_Modifier # Mn KHMER SIGN ATTHACAN +193B ; Syllable_Modifier # Mn LIMBU SIGN SA-I +1A7B..1A7C ; Syllable_Modifier # Mn [2] TAI THAM SIGN MAI SAM..TAI THAM SIGN KHUEN-LUE KARAN +1A7F ; Syllable_Modifier # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1C36 ; Syllable_Modifier # Mn LEPCHA SIGN RAN +1DFB ; Syllable_Modifier # Mn COMBINING DELETION MARK +2074 ; Syllable_Modifier # No SUPERSCRIPT FOUR +2082..2084 ; Syllable_Modifier # No [3] SUBSCRIPT TWO..SUBSCRIPT FOUR +111C9 ; Syllable_Modifier # Mn SHARADA SANDHI MARK +1145E ; Syllable_Modifier # Mn NEWA SANDHI MARK +11A33 ; Syllable_Modifier # Mn ZANABAZAR SQUARE FINAL CONSONANT MARK + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Killer + +# Consonant Killer (signifies that the previous consonant or consonants are +# not pronounced) + +# [Not derivable] + +0E4C ; Consonant_Killer # Mn THAI CHARACTER THANTHAKHAT +17CD ; Consonant_Killer # Mn KHMER 
SIGN TOANDAKHIAT + +# ================================================ + +# Indic_Syllabic_Category=Non_Joiner + +# Non_Joiner (Zero Width Non-Joiner) + +# [Not derivable] + +200C ; Non_Joiner # Cf ZERO WIDTH NON-JOINER + +# ================================================ + +# Indic_Syllabic_Category=Joiner + +# Joiner (Zero Width Joiner) + +# [Not derivable] + +200D ; Joiner # Cf ZERO WIDTH JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number_Joiner + +# Number_Joiner (forms ligatures between numbers for multiplication) + +# [Not derivable] + +1107F ; Number_Joiner # Mn BRAHMI NUMBER JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number + +# Number (can be used as vowel-holders like consonant placeholders) +# Note: A number may even hold subjoined consonants which may in turn +# have been formed using a virama or a stacker, e.g. the sequence +# where THAI THAM LETTER LOW TA is subjoined to +# TAI THAM THAM DIGIT THREE using an invisible stacker. 
+ +# [Not derivable] + +0030..0039 ; Number # Nd [10] DIGIT ZERO..DIGIT NINE +0966..096F ; Number # Nd [10] DEVANAGARI DIGIT ZERO..DEVANAGARI DIGIT NINE +09E6..09EF ; Number # Nd [10] BENGALI DIGIT ZERO..BENGALI DIGIT NINE +0A66..0A6F ; Number # Nd [10] GURMUKHI DIGIT ZERO..GURMUKHI DIGIT NINE +0AE6..0AEF ; Number # Nd [10] GUJARATI DIGIT ZERO..GUJARATI DIGIT NINE +0B66..0B6F ; Number # Nd [10] ORIYA DIGIT ZERO..ORIYA DIGIT NINE +0BE6..0BEF ; Number # Nd [10] TAMIL DIGIT ZERO..TAMIL DIGIT NINE +0C66..0C6F ; Number # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE +0CE6..0CEF ; Number # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE +0D66..0D6F ; Number # Nd [10] MALAYALAM DIGIT ZERO..MALAYALAM DIGIT NINE +0DE6..0DEF ; Number # Nd [10] SINHALA LITH DIGIT ZERO..SINHALA LITH DIGIT NINE +0E50..0E59 ; Number # Nd [10] THAI DIGIT ZERO..THAI DIGIT NINE +0ED0..0ED9 ; Number # Nd [10] LAO DIGIT ZERO..LAO DIGIT NINE +0F20..0F29 ; Number # Nd [10] TIBETAN DIGIT ZERO..TIBETAN DIGIT NINE +0F2A..0F33 ; Number # No [10] TIBETAN DIGIT HALF ONE..TIBETAN DIGIT HALF ZERO +1040..1049 ; Number # Nd [10] MYANMAR DIGIT ZERO..MYANMAR DIGIT NINE +1090..1099 ; Number # Nd [10] MYANMAR SHAN DIGIT ZERO..MYANMAR SHAN DIGIT NINE +17E0..17E9 ; Number # Nd [10] KHMER DIGIT ZERO..KHMER DIGIT NINE +1946..194F ; Number # Nd [10] LIMBU DIGIT ZERO..LIMBU DIGIT NINE +19D0..19D9 ; Number # Nd [10] NEW TAI LUE DIGIT ZERO..NEW TAI LUE DIGIT NINE +19DA ; Number # No NEW TAI LUE THAM DIGIT ONE +1A80..1A89 ; Number # Nd [10] TAI THAM HORA DIGIT ZERO..TAI THAM HORA DIGIT NINE +1A90..1A99 ; Number # Nd [10] TAI THAM THAM DIGIT ZERO..TAI THAM THAM DIGIT NINE +1B50..1B59 ; Number # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE +1BB0..1BB9 ; Number # Nd [10] SUNDANESE DIGIT ZERO..SUNDANESE DIGIT NINE +1C40..1C49 ; Number # Nd [10] LEPCHA DIGIT ZERO..LEPCHA DIGIT NINE +A8D0..A8D9 ; Number # Nd [10] SAURASHTRA DIGIT ZERO..SAURASHTRA DIGIT NINE +A900..A909 ; Number # Nd [10] KAYAH LI DIGIT ZERO..KAYAH LI DIGIT NINE 
+A9D0..A9D9 ; Number # Nd [10] JAVANESE DIGIT ZERO..JAVANESE DIGIT NINE +A9F0..A9F9 ; Number # Nd [10] MYANMAR TAI LAING DIGIT ZERO..MYANMAR TAI LAING DIGIT NINE +AA50..AA59 ; Number # Nd [10] CHAM DIGIT ZERO..CHAM DIGIT NINE +ABF0..ABF9 ; Number # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE +10A40..10A48 ; Number # No [9] KHAROSHTHI DIGIT ONE..KHAROSHTHI FRACTION ONE HALF +11066..1106F ; Number # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11136..1113F ; Number # Nd [10] CHAKMA DIGIT ZERO..CHAKMA DIGIT NINE +111D0..111D9 ; Number # Nd [10] SHARADA DIGIT ZERO..SHARADA DIGIT NINE +111E1..111F4 ; Number # No [20] SINHALA ARCHAIC DIGIT ONE..SINHALA ARCHAIC NUMBER ONE THOUSAND +112F0..112F9 ; Number # Nd [10] KHUDAWADI DIGIT ZERO..KHUDAWADI DIGIT NINE +11450..11459 ; Number # Nd [10] NEWA DIGIT ZERO..NEWA DIGIT NINE +114D0..114D9 ; Number # Nd [10] TIRHUTA DIGIT ZERO..TIRHUTA DIGIT NINE +11650..11659 ; Number # Nd [10] MODI DIGIT ZERO..MODI DIGIT NINE +116C0..116C9 ; Number # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE +116D0..116E3 ; Number # Nd [20] MYANMAR PAO DIGIT ZERO..MYANMAR EASTERN PWO KAREN DIGIT NINE +11730..11739 ; Number # Nd [10] AHOM DIGIT ZERO..AHOM DIGIT NINE +1173A..1173B ; Number # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY +11950..11959 ; Number # Nd [10] DIVES AKURU DIGIT ZERO..DIVES AKURU DIGIT NINE +11C50..11C59 ; Number # Nd [10] BHAIKSUKI DIGIT ZERO..BHAIKSUKI DIGIT NINE +11C5A..11C6C ; Number # No [19] BHAIKSUKI NUMBER ONE..BHAIKSUKI HUNDREDS UNIT MARK +11D50..11D59 ; Number # Nd [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE +11DA0..11DA9 ; Number # Nd [10] GUNJALA GONDI DIGIT ZERO..GUNJALA GONDI DIGIT NINE +11F50..11F59 ; Number # Nd [10] KAWI DIGIT ZERO..KAWI DIGIT NINE +16130..16139 ; Number # Nd [10] GURUNG KHEMA DIGIT ZERO..GURUNG KHEMA DIGIT NINE +16D70..16D79 ; Number # Nd [10] KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE + +# ================================================ + +# 
Indic_Syllabic_Category=Brahmi_Joining_Number + +# Brahmi Joining Number (may be joined by a Number_Joiner of the same +# script, e.g. in Brahmi) +# +# Note: These are different from Numbers, in the way that there is no known +# evidence of Brahmi Joining Numbers taking vowels or subjoined consonants. +# Until such evidence is found, implementations may assume that Brahmi +# Joining Numbers only participate in shaping with other Brahmi Joining +# Numbers. + +# [Not derivable] + +11052..11065 ; Brahmi_Joining_Number # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND + +# EOF diff --git a/data/17.0.0-indic-positional-category.txt b/data/17.0.0-indic-positional-category.txt new file mode 100644 index 0000000..2dd7448 --- /dev/null +++ b/data/17.0.0-indic-positional-category.txt @@ -0,0 +1,842 @@ +# IndicPositionalCategory-17.0.0.txt +# Date: 2025-07-29, 13:35:52 GMT +# © 2025 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use and license, see https://www.unicode.org/terms_of_use.html +# +# Unicode Character Database +# For documentation, see https://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Positional_Category enumerated property +# +# Scope: This property is aimed at the problem of +# the specification of syllabic structure for Indic scripts. +# Because dependent vowels (matras), visible viramas, and other +# characters are placed in notional slots around the consonant (or +# consonant cluster) core of an Indic syllable, there may be +# cooccurrence constraints or other interactions. Also, it may be +# desirable, in cases where more than one such character may occur in +# sequence, as for example, in a top slot and a bottom slot, to +# specify preferred orders for spelling. As such, this property +# is designed primarily to supplement the Indic_Syllabic_Category +# property. 
+# +# In addition to combining marks associated with Indic scripts, the +# Indic_Positional_Category has non-trivial values for special signs +# associated with Indic_Syllabic_Category=Consonant_Prefixed +# or Indic_Syllabic_Category=Consonant_Preceding_Repha. Those signs +# have General_Category=Lo, rather than being combining marks. +# They occur in initial position in syllabic structure. However, when +# rendered, they appear as marks positioned with respect to another +# base letter (usually above it). Hence, having an explicit value for +# Indic_Positional_Category for those signs can be helpful. +# +# Note that this property is *not* intended as +# a prescriptive property regarding display or font design, +# for a number of reasons. Good font design requires information +# that is outside the context of a character encoding standard, +# and is best handled in other venues. For Indic dependent +# vowels and similar characters, in particular: +# +# 1. Matra placement may vary somewhat based on typeface design. +# 2. Matra placement, even within a single script, may vary +# somewhat according to historic period or local conventions. +# 3. Matra placement may be changed by explicit orthographic reform +# decisions. +# 4. Matras may ligate in various ways with a consonant (or even +# other elements of a syllable) instead of occurring in a +# discrete location. +# 5. Matra display may be contextually determined. This is +# notable, for example, in the Tamil script, where the shape +# and placement of -u and -uu vowels depends strongly on +# which consonant they adjoin. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Positional_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. 
+# +# The scripts assessed as containing dependent vowels or similar characters +# in the structural sense used for the Indic_Positional_Category are the +# following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dives Akuru, Dogra, Grantha, Gujarati, +# Gunjala Gondi, Gurmukhi, Gurung Khema, Hanunoo, Javanese, Kaithi, +# Kannada, Kawi, Kayah Li, Kharoshthi, Khmer, Khojki, Khudawadi, +# Kirat Rai, Lao, Lepcha, Limbu, Makasar, Malayalam, Marchen, +# Masaram Gondi, Meetei Mayek, Modi, Myanmar, Nandinagari, Newa, +# New Tai Lue, Oriya, Rejang, Saurashtra, Sharada, Siddham, Sinhala, +# Soyombo, Sundanese, Syloti Nagri, Tagalog, Tagbanwa, Tai Tham, +# Tai Viet, Takri, Tamil, Telugu, Thai, Tibetan, Tirhuta, +# Tulu-Tigalari, and Zanabazar Square. +# +# All characters for all other scripts not in that list +# take the default value for this property. +# +# See IndicSyllabicCategory.txt for a slightly more extended +# list of Indic scripts, including those which do not have +# positional characters. Currently, those additional +# Indic scripts without positional characters are +# Multani, Phags-pa, and Tai Le. +# +# Notes: +# +# 1. The following characters are all assigned the positional category Right, +# but may have different positions in some cases: +# * U+0BC1 TAMIL VOWEL SIGN U and U+0BC2 TAMIL VOWEL SIGN UU have +# contextually variable placement in Tamil. +# * U+11341 GRANTHA VOWEL SIGN U and U+11342 GRANTHA VOWEL SIGN UU have +# contextually variable placement in Grantha. +# * U+11440 NEWA VOWEL SIGN O and U+11441 NEWA VOWEL SIGN AU have contextually +# variable placement in Newa. +# +# 2. The following characters are all assigned the positional category Top, +# but may have different positions in some cases: +# * U+1143E NEWA VOWEL SIGN E and U+1143F NEWA VOWEL SIGN AI have contextually +# variable placement in Newa. +# +# 3. 
The following characters are all assigned the positional category Bottom, +# but may have different positions in some cases: +# * U+0D41 MALAYALAM VOWEL SIGN U and U+0D42 MALAYALAM VOWEL SIGN UU form +# complex ligatures with consonants in older Malayalam orthography, and +# are spacing marks to the right of the base in reformed Malayalam +# orthography. +# * U+102F MYANMAR VOWEL SIGN U and U+1030 MYANMAR VOWEL SIGN UU have +# contextually variable placement in Myanmar. +# * U+1A69 TAI THAM VOWEL SIGN U and U+1A6A TAI THAM VOWEL SIGN UU have +# contextually variable placement in Tai Tham. +# * U+113BB TULU-TIGALARI VOWEL SIGN U and +# U+113BC TULU-TIGALARI VOWEL SIGN UU form complex ligatures with +# consonants. +# +# 4. The following character is assigned the positional category Left, but +# may have different positions in different styles: +# * U+119D2 NANDINAGARI VOWEL SIGN I has stylistically variable placement +# in Nandinagari. + + +# ================================================ + +# Property: Indic_Positional_Category +# +# All code points not explicitly listed for Indic_Positional_Category +# have the value Not_Applicable (NA). 
+# +# @missing: 0000..10FFFF; Not_Applicable + +# ------------------------------------------------ + +# Indic_Positional_Category=Right + +0903 ; Right # Mc DEVANAGARI SIGN VISARGA +093B ; Right # Mc DEVANAGARI VOWEL SIGN OOE +093E ; Right # Mc DEVANAGARI VOWEL SIGN AA +0940 ; Right # Mc DEVANAGARI VOWEL SIGN II +0949..094C ; Right # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094F ; Right # Mc DEVANAGARI VOWEL SIGN AW +0982..0983 ; Right # Mc [2] BENGALI SIGN ANUSVARA..BENGALI SIGN VISARGA +09BE ; Right # Mc BENGALI VOWEL SIGN AA +09C0 ; Right # Mc BENGALI VOWEL SIGN II +09D7 ; Right # Mc BENGALI AU LENGTH MARK +0A03 ; Right # Mc GURMUKHI SIGN VISARGA +0A3E ; Right # Mc GURMUKHI VOWEL SIGN AA +0A40 ; Right # Mc GURMUKHI VOWEL SIGN II +0A83 ; Right # Mc GUJARATI SIGN VISARGA +0ABE ; Right # Mc GUJARATI VOWEL SIGN AA +0AC0 ; Right # Mc GUJARATI VOWEL SIGN II +0ACB..0ACC ; Right # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0B02..0B03 ; Right # Mc [2] ORIYA SIGN ANUSVARA..ORIYA SIGN VISARGA +0B3E ; Right # Mc ORIYA VOWEL SIGN AA +0B40 ; Right # Mc ORIYA VOWEL SIGN II +0BBE..0BBF ; Right # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC1..0BC2 ; Right # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BD7 ; Right # Mc TAMIL AU LENGTH MARK +0C01..0C03 ; Right # Mc [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN VISARGA +0C41..0C44 ; Right # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C82..0C83 ; Right # Mc [2] KANNADA SIGN ANUSVARA..KANNADA SIGN VISARGA +0CBE ; Right # Mc KANNADA VOWEL SIGN AA +0CC1..0CC4 ; Right # Mc [4] KANNADA VOWEL SIGN U..KANNADA VOWEL SIGN VOCALIC RR +0CD5..0CD6 ; Right # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CF3 ; Right # Mc KANNADA SIGN COMBINING ANUSVARA ABOVE RIGHT +0D02..0D03 ; Right # Mc [2] MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA +0D3E..0D40 ; Right # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D57 ; Right # Mc MALAYALAM AU LENGTH MARK +0D82..0D83 ; Right # Mc 
[2] SINHALA SIGN ANUSVARAYA..SINHALA SIGN VISARGAYA +0DCF..0DD1 ; Right # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD8 ; Right # Mc SINHALA VOWEL SIGN GAETTA-PILLA +0DDF ; Right # Mc SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Right # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Right # Lo THAI CHARACTER SARA A +0E32..0E33 ; Right # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E45 ; Right # Lo THAI CHARACTER LAKKHANGYAO +0EB0 ; Right # Lo LAO VOWEL SIGN A +0EB2..0EB3 ; Right # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0F3E ; Right # Mc TIBETAN SIGN YAR TSHES +0F7F ; Right # Mc TIBETAN SIGN RNAM BCAD +102B..102C ; Right # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +1038 ; Right # Mc MYANMAR SIGN VISARGA +103B ; Right # Mc MYANMAR CONSONANT SIGN MEDIAL YA +1056..1057 ; Right # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1062..1064 ; Right # Mc [3] MYANMAR VOWEL SIGN SGAW KAREN EU..MYANMAR TONE MARK SGAW KAREN KE PHO +1067..106D ; Right # Mc [7] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1083 ; Right # Mc MYANMAR VOWEL SIGN SHAN AA +1087..108C ; Right # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108F ; Right # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109C ; Right # Mc [3] MYANMAR SIGN KHAMTI TONE-1..MYANMAR VOWEL SIGN AITON A +1715 ; Right # Mc TAGALOG SIGN PAMUDPOD +1734 ; Right # Mc HANUNOO SIGN PAMUDPOD +17B6 ; Right # Mc KHMER VOWEL SIGN AA +17C7..17C8 ; Right # Mc [2] KHMER SIGN REAHMUK..KHMER SIGN YUUKALEAPINTU +1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI +1929..192B ; Right # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1930..1931 ; Right # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Right # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +19B0..19B4 ; Right # Lo [5] NEW TAI LUE VOWEL SIGN VOWEL 
SHORTENER..NEW TAI LUE VOWEL SIGN UU +19B8..19B9 ; Right # Lo [2] NEW TAI LUE VOWEL SIGN OA..NEW TAI LUE VOWEL SIGN UE +19BB..19C0 ; Right # Lo [6] NEW TAI LUE VOWEL SIGN AAY..NEW TAI LUE VOWEL SIGN IY +19C8..19C9 ; Right # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A1A ; Right # Mc BUGINESE VOWEL SIGN O +1A57 ; Right # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A61 ; Right # Mc TAI THAM VOWEL SIGN A +1A63..1A64 ; Right # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A6D ; Right # Mc TAI THAM VOWEL SIGN OY +1B04 ; Right # Mc BALINESE SIGN BISAH +1B35 ; Right # Mc BALINESE VOWEL SIGN TEDUNG +1B44 ; Right # Mc BALINESE ADEG ADEG +1B82 ; Right # Mc SUNDANESE SIGN PANGWISAD +1BA1 ; Right # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA7 ; Right # Mc SUNDANESE VOWEL SIGN PANOLONG +1BAA ; Right # Mc SUNDANESE SIGN PAMAAEH +1BE7 ; Right # Mc BATAK VOWEL SIGN E +1BEA..1BEC ; Right # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BEE ; Right # Mc BATAK VOWEL SIGN U +1BF2..1BF3 ; Right # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +1C24..1C26 ; Right # Mc [3] LEPCHA SUBJOINED LETTER YA..LEPCHA VOWEL SIGN AA +1C2A..1C2B ; Right # Mc [2] LEPCHA VOWEL SIGN U..LEPCHA VOWEL SIGN UU +1CE1 ; Right # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF7 ; Right # Mc VEDIC SIGN ATIKRAMA +A823..A824 ; Right # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A827 ; Right # Mc SYLOTI NAGRI VOWEL SIGN OO +A880..A881 ; Right # Mc [2] SAURASHTRA SIGN ANUSVARA..SAURASHTRA SIGN VISARGA +A8B4..A8C3 ; Right # Mc [16] SAURASHTRA CONSONANT SIGN HAARU..SAURASHTRA VOWEL SIGN AU +A952..A953 ; Right # Mc [2] REJANG CONSONANT SIGN H..REJANG VIRAMA +A983 ; Right # Mc JAVANESE SIGN WIGNYAN +A9B4..A9B5 ; Right # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +AA33 ; Right # Mc CHAM CONSONANT SIGN YA +AA4D ; Right # Mc CHAM CONSONANT SIGN FINAL H +AA7B ; Right # Mc MYANMAR SIGN PAO KAREN TONE +AA7D ; Right # Mc MYANMAR SIGN TAI LAING TONE-5 +AAB1 ; Right # 
Lo TAI VIET VOWEL AA +AABA ; Right # Lo TAI VIET VOWEL UA +AABD ; Right # Lo TAI VIET VOWEL AN +AAEF ; Right # Mc MEETEI MAYEK VOWEL SIGN AAU +AAF5 ; Right # Mc MEETEI MAYEK VOWEL SIGN VISARGA +ABE3..ABE4 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE6..ABE7 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE9..ABEA ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +ABEC ; Right # Mc MEETEI MAYEK LUM IYEK +11000 ; Right # Mc BRAHMI SIGN CANDRABINDU +11002 ; Right # Mc BRAHMI SIGN VISARGA +11082 ; Right # Mc KAITHI SIGN VISARGA +110B0 ; Right # Mc KAITHI VOWEL SIGN AA +110B2 ; Right # Mc KAITHI VOWEL SIGN II +110B7..110B8 ; Right # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11145..11146 ; Right # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +11182 ; Right # Mc SHARADA SIGN VISARGA +111B3 ; Right # Mc SHARADA VOWEL SIGN AA +111B5 ; Right # Mc SHARADA VOWEL SIGN II +111C0 ; Right # Mc SHARADA SIGN VIRAMA +1122C..1122E ; Right # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +11235 ; Right # Mc KHOJKI SIGN VIRAMA +112E0 ; Right # Mc KHUDAWADI VOWEL SIGN AA +112E2 ; Right # Mc KHUDAWADI VOWEL SIGN II +11302..11303 ; Right # Mc [2] GRANTHA SIGN ANUSVARA..GRANTHA SIGN VISARGA +1133E..1133F ; Right # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11341..11344 ; Right # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +1134D ; Right # Mc GRANTHA SIGN VIRAMA +11357 ; Right # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Right # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +113B8 ; Right # Mc TULU-TIGALARI VOWEL SIGN AA +113C9..113CA ; Right # Mc [2] TULU-TIGALARI AU LENGTH MARK..TULU-TIGALARI SIGN CANDRA ANUNASIKA +113CC..113CD ; Right # Mc [2] TULU-TIGALARI SIGN ANUSVARA..TULU-TIGALARI SIGN VISARGA +113CF ; Right # Mc TULU-TIGALARI SIGN LOOPED VIRAMA +11435 ; Right # Mc NEWA VOWEL SIGN AA +11437 ; Right # Mc NEWA VOWEL SIGN II 
+11440..11441 ; Right # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +11445 ; Right # Mc NEWA SIGN VISARGA +114B0 ; Right # Mc TIRHUTA VOWEL SIGN AA +114B2 ; Right # Mc TIRHUTA VOWEL SIGN II +114BD ; Right # Mc TIRHUTA VOWEL SIGN SHORT O +114C1 ; Right # Mc TIRHUTA SIGN VISARGA +115AF ; Right # Mc SIDDHAM VOWEL SIGN AA +115B1 ; Right # Mc SIDDHAM VOWEL SIGN II +115BE ; Right # Mc SIDDHAM SIGN VISARGA +11630..11632 ; Right # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +1163B..1163C ; Right # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +1163E ; Right # Mc MODI SIGN VISARGA +116AC ; Right # Mc TAKRI SIGN VISARGA +116AF ; Right # Mc TAKRI VOWEL SIGN II +116B6 ; Right # Mc TAKRI SIGN VIRAMA +11720..11721 ; Right # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +1182C ; Right # Mc DOGRA VOWEL SIGN AA +1182E ; Right # Mc DOGRA VOWEL SIGN II +11838 ; Right # Mc DOGRA SIGN VISARGA +11930..11934 ; Right # Mc [5] DIVES AKURU VOWEL SIGN AA..DIVES AKURU VOWEL SIGN UU +1193D ; Right # Mc DIVES AKURU SIGN HALANTA +11940 ; Right # Mc DIVES AKURU MEDIAL YA +119D1 ; Right # Mc NANDINAGARI VOWEL SIGN AA +119D3 ; Right # Mc NANDINAGARI VOWEL SIGN II +119DC..119DF ; Right # Mc [4] NANDINAGARI VOWEL SIGN O..NANDINAGARI SIGN VISARGA +11A39 ; Right # Mc ZANABAZAR SQUARE SIGN VISARGA +11A57..11A58 ; Right # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A97 ; Right # Mc SOYOMBO SIGN VISARGA +11B61 ; Right # Mc SHARADA VOWEL SIGN OOE +11B65 ; Right # Mc SHARADA VOWEL SIGN SHORT O +11B67 ; Right # Mc SHARADA VOWEL SIGN CANDRA O +11C2F ; Right # Mc BHAIKSUKI VOWEL SIGN AA +11C3E ; Right # Mc BHAIKSUKI SIGN VISARGA +11CA9 ; Right # Mc MARCHEN SUBJOINED LETTER YA +11CB4 ; Right # Mc MARCHEN VOWEL SIGN O +11D46 ; Right # Lo MASARAM GONDI REPHA +11D8A..11D8E ; Right # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D93..11D94 ; Right # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11D96 ; Right # Mc GUNJALA GONDI SIGN VISARGA +11EF6 ; Right # Mc 
MAKASAR VOWEL SIGN O +11F03 ; Right # Mc KAWI SIGN VISARGA +11F34..11F35 ; Right # Mc [2] KAWI VOWEL SIGN AA..KAWI VOWEL SIGN ALTERNATE AA +11F41 ; Right # Mc KAWI SIGN KILLER +1612C ; Right # Mc GURUNG KHEMA CONSONANT SIGN MEDIAL HA +16D40..16D42 ; Right # Lm [3] KIRAT RAI SIGN ANUSVARA..KIRAT RAI SIGN VISARGA +16D63..16D6A ; Right # Lo [8] KIRAT RAI VOWEL SIGN AA..KIRAT RAI VOWEL SIGN AU +16D6B..16D6C ; Right # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT + +# Indic_Positional_Category=Left + +093F ; Left # Mc DEVANAGARI VOWEL SIGN I +094E ; Left # Mc DEVANAGARI VOWEL SIGN PRISHTHAMATRA E +09BF ; Left # Mc BENGALI VOWEL SIGN I +09C7..09C8 ; Left # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +0A3F ; Left # Mc GURMUKHI VOWEL SIGN I +0ABF ; Left # Mc GUJARATI VOWEL SIGN I +0B47 ; Left # Mc ORIYA VOWEL SIGN E +0BC6..0BC8 ; Left # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0D46..0D48 ; Left # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0DD9 ; Left # Mc SINHALA VOWEL SIGN KOMBUVA +0DDB ; Left # Mc SINHALA VOWEL SIGN KOMBU DEKA +0F3F ; Left # Mc TIBETAN SIGN MAR TSHES +1031 ; Left # Mc MYANMAR VOWEL SIGN E +1084 ; Left # Mc MYANMAR VOWEL SIGN SHAN E +17C1..17C3 ; Left # Mc [3] KHMER VOWEL SIGN E..KHMER VOWEL SIGN AI +1A19 ; Left # Mc BUGINESE VOWEL SIGN E +1A55 ; Left # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A6E..1A72 ; Left # Mc [5] TAI THAM VOWEL SIGN E..TAI THAM VOWEL SIGN THAM AI +1B3E..1B3F ; Left # Mc [2] BALINESE VOWEL SIGN TALING..BALINESE VOWEL SIGN TALING REPA +1BA6 ; Left # Mc SUNDANESE VOWEL SIGN PANAELAENG +1C27..1C28 ; Left # Mc [2] LEPCHA VOWEL SIGN I..LEPCHA VOWEL SIGN O +1C34..1C35 ; Left # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A9BA..A9BB ; Left # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +AA2F..AA30 ; Left # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA34 ; Left # Mc CHAM CONSONANT SIGN RA +AAEB ; Left # Mc MEETEI MAYEK VOWEL SIGN II +AAEE ; Left # Mc MEETEI MAYEK VOWEL 
SIGN AU +110B1 ; Left # Mc KAITHI VOWEL SIGN I +1112C ; Left # Mc CHAKMA VOWEL SIGN E +111B4 ; Left # Mc SHARADA VOWEL SIGN I +111CE ; Left # Mc SHARADA VOWEL SIGN PRISHTHAMATRA E +112E1 ; Left # Mc KHUDAWADI VOWEL SIGN I +11347..11348 ; Left # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +113C2 ; Left # Mc TULU-TIGALARI VOWEL SIGN EE +113C5 ; Left # Mc TULU-TIGALARI VOWEL SIGN AI +11436 ; Left # Mc NEWA VOWEL SIGN I +114B1 ; Left # Mc TIRHUTA VOWEL SIGN I +114B9 ; Left # Mc TIRHUTA VOWEL SIGN E +115B0 ; Left # Mc SIDDHAM VOWEL SIGN I +115B8 ; Left # Mc SIDDHAM VOWEL SIGN E +116AE ; Left # Mc TAKRI VOWEL SIGN I +11726 ; Left # Mc AHOM VOWEL SIGN E +1182D ; Left # Mc DOGRA VOWEL SIGN I +11935 ; Left # Mc DIVES AKURU VOWEL SIGN E +11937 ; Left # Mc DIVES AKURU VOWEL SIGN AI +119D2 ; Left # Mc NANDINAGARI VOWEL SIGN I +119E4 ; Left # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E +11CB1 ; Left # Mc MARCHEN VOWEL SIGN I +11EF5 ; Left # Mc MAKASAR VOWEL SIGN E +11F3E..11F3F ; Left # Mc [2] KAWI VOWEL SIGN E..KAWI VOWEL SIGN AI +1612A..1612B ; Left # Mc [2] GURUNG KHEMA CONSONANT SIGN MEDIAL YA..GURUNG KHEMA CONSONANT SIGN MEDIAL VA + +# Indic_Positional_Category=Visual_Order_Left + +# These are dependent vowels that occur to the left of the consonant +# letter in a syllable, but which occur in scripts using the visual order +# model, instead of the logical order model. Because of the different +# model, these left-side vowels occur first in the backing store (before +# the consonant letter) and are not reordered during text rendering. 
+# +# [Derivation: Logical_Order_Exception=Yes] + +0E40..0E44 ; Visual_Order_Left # Lo [5] THAI CHARACTER SARA E..THAI CHARACTER SARA AI MAIMALAI +0EC0..0EC4 ; Visual_Order_Left # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +19B5..19B7 ; Visual_Order_Left # Lo [3] NEW TAI LUE VOWEL SIGN E..NEW TAI LUE VOWEL SIGN O +19BA ; Visual_Order_Left # Lo NEW TAI LUE VOWEL SIGN AY +AAB5..AAB6 ; Visual_Order_Left # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB9 ; Visual_Order_Left # Lo TAI VIET VOWEL UEA +AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL AY + +# Indic_Positional_Category=Left_And_Right + +09CB..09CC ; Left_And_Right # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +0B4B ; Left_And_Right # Mc ORIYA VOWEL SIGN O +0BCA..0BCC ; Left_And_Right # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0D4A..0D4C ; Left_And_Right # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0DDC ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA +0DDE ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA +17C0 ; Left_And_Right # Mc KHMER VOWEL SIGN IE +17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU +1B40..1B41 ; Left_And_Right # Mc [2] BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1134B..1134C ; Left_And_Right # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +113C7..113C8 ; Left_And_Right # Mc [2] TULU-TIGALARI VOWEL SIGN OO..TULU-TIGALARI VOWEL SIGN AU +114BC ; Left_And_Right # Mc TIRHUTA VOWEL SIGN O +114BE ; Left_And_Right # Mc TIRHUTA VOWEL SIGN AU +115BA ; Left_And_Right # Mc SIDDHAM VOWEL SIGN O +11938 ; Left_And_Right # Mc DIVES AKURU VOWEL SIGN O + +# Indic_Positional_Category=Top + +0900..0902 ; Top # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +093A ; Top # Mn DEVANAGARI VOWEL SIGN OE +0945..0948 ; Top # Mn [4] DEVANAGARI VOWEL SIGN CANDRA E..DEVANAGARI VOWEL SIGN AI +0951 ; Top # Mn DEVANAGARI STRESS SIGN UDATTA +0955 ; Top # 
Mn DEVANAGARI VOWEL SIGN CANDRA LONG E +0981 ; Top # Mn BENGALI SIGN CANDRABINDU +09FE ; Top # Mn BENGALI SANDHI MARK +0A01..0A02 ; Top # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A47..0A48 ; Top # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Top # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0A70..0A71 ; Top # Mn [2] GURMUKHI TIPPI..GURMUKHI ADDAK +0A81..0A82 ; Top # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0AC5 ; Top # Mn GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Top # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AFA..0AFF ; Top # Mn [6] GUJARATI SIGN SUKUN..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B01 ; Top # Mn ORIYA SIGN CANDRABINDU +0B3F ; Top # Mn ORIYA VOWEL SIGN I +0B55..0B56 ; Top # Mn [2] ORIYA SIGN OVERLINE..ORIYA AI LENGTH MARK +0B82 ; Top # Mn TAMIL SIGN ANUSVARA +0BC0 ; Top # Mn TAMIL VOWEL SIGN II +0BCD ; Top # Mn TAMIL SIGN VIRAMA +0C00 ; Top # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C04 ; Top # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C3E..0C40 ; Top # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C46..0C47 ; Top # Mn [2] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN EE +0C4A..0C4D ; Top # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA +0C55 ; Top # Mn TELUGU LENGTH MARK +0C81 ; Top # Mn KANNADA SIGN CANDRABINDU +0CBF ; Top # Mn KANNADA VOWEL SIGN I +0CC6 ; Top # Mn KANNADA VOWEL SIGN E +0CCC..0CCD ; Top # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA +0D00..0D01 ; Top # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D3B..0D3C ; Top # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0D4D ; Top # Mn MALAYALAM SIGN VIRAMA +0D4E ; Top # Lo MALAYALAM LETTER DOT REPH +0D81 ; Top # Mn SINHALA SIGN CANDRABINDU +0DCA ; Top # Mn SINHALA SIGN AL-LAKUNA +0DD2..0DD3 ; Top # Mn [2] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN DIGA IS-PILLA +0E31 ; Top # Mn THAI CHARACTER MAI HAN-AKAT +0E34..0E37 ; Top # Mn [4] THAI 
CHARACTER SARA I..THAI CHARACTER SARA UEE +0E47..0E4E ; Top # Mn [8] THAI CHARACTER MAITAIKHU..THAI CHARACTER YAMAKKAN +0EB1 ; Top # Mn LAO VOWEL SIGN MAI KAN +0EB4..0EB7 ; Top # Mn [4] LAO VOWEL SIGN I..LAO VOWEL SIGN YY +0EBB ; Top # Mn LAO VOWEL SIGN MAI KON +0EC8..0ECE ; Top # Mn [7] LAO TONE MAI EK..LAO YAMAKKAN +0F39 ; Top # Mn TIBETAN MARK TSA -PHRU +0F72 ; Top # Mn TIBETAN VOWEL SIGN I +0F7A..0F7E ; Top # Mn [5] TIBETAN VOWEL SIGN E..TIBETAN SIGN RJES SU NGA RO +0F80 ; Top # Mn TIBETAN VOWEL SIGN REVERSED I +0F82..0F83 ; Top # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +0F86..0F87 ; Top # Mn [2] TIBETAN SIGN LCI RTAGS..TIBETAN SIGN YANG RTAGS +102D..102E ; Top # Mn [2] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN II +1032..1036 ; Top # Mn [5] MYANMAR VOWEL SIGN AI..MYANMAR SIGN ANUSVARA +103A ; Top # Mn MYANMAR SIGN ASAT +1071..1074 ; Top # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1085..1086 ; Top # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109D ; Top # Mn MYANMAR VOWEL SIGN AITON AI +1712 ; Top # Mn TAGALOG VOWEL SIGN I +1732 ; Top # Mn HANUNOO VOWEL SIGN I +1752 ; Top # Mn BUHID VOWEL SIGN I +1772 ; Top # Mn TAGBANWA VOWEL SIGN I +17B7..17BA ; Top # Mn [4] KHMER VOWEL SIGN I..KHMER VOWEL SIGN YY +17C6 ; Top # Mn KHMER SIGN NIKAHIT +17C9..17D1 ; Top # Mn [9] KHMER SIGN MUUSIKATOAN..KHMER SIGN VIRIAM +17D3 ; Top # Mn KHMER SIGN BATHAMASAT +17DD ; Top # Mn KHMER SIGN ATTHACAN +1920..1921 ; Top # Mn [2] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN I +1927..1928 ; Top # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Top # Mn LIMBU SIGN KEMPHRENG +1A17 ; Top # Mn BUGINESE VOWEL SIGN I +1A1B ; Top # Mn BUGINESE VOWEL SIGN AE +1A58..1A5A ; Top # Mn [3] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN LOW PA +1A62 ; Top # Mn TAI THAM VOWEL SIGN MAI SAT +1A65..1A68 ; Top # Mn [4] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN UUE +1A6B ; Top # Mn TAI THAM VOWEL SIGN O +1A73..1A7C ; Top # Mn [10] 
TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN KHUEN-LUE KARAN +1B00..1B03 ; Top # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG +1B34 ; Top # Mn BALINESE SIGN REREKAN +1B36..1B37 ; Top # Mn [2] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN ULU SARI +1B42 ; Top # Mn BALINESE VOWEL SIGN PEPET +1B6B ; Top # Mn BALINESE MUSICAL SYMBOL COMBINING TEGEH +1B6D..1B73 ; Top # Mn [7] BALINESE MUSICAL SYMBOL COMBINING KEMPUL..BALINESE MUSICAL SYMBOL COMBINING GONG +1B80..1B81 ; Top # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR +1BA4 ; Top # Mn SUNDANESE VOWEL SIGN PANGHULU +1BA8..1BA9 ; Top # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE6 ; Top # Mn BATAK SIGN TOMPI +1BE8..1BE9 ; Top # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BED ; Top # Mn BATAK VOWEL SIGN KARO O +1BEF..1BF1 ; Top # Mn [3] BATAK VOWEL SIGN U FOR SIMALUNGUN SA..BATAK CONSONANT SIGN H +1C2D..1C33 ; Top # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +1C36 ; Top # Mn LEPCHA SIGN RAN +1CD0..1CD2 ; Top # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CDA..1CDB ; Top # Mn [2] VEDIC TONE DOUBLE SVARITA..VEDIC TONE TRIPLE SVARITA +1CE0 ; Top # Mn VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CF4 ; Top # Mn VEDIC TONE CANDRA ABOVE +1DFB ; Top # Mn COMBINING DELETION MARK +20F0 ; Top # Mn COMBINING ASTERISK ABOVE +A802 ; Top # Mn SYLOTI NAGRI SIGN DVISVARA +A806 ; Top # Mn SYLOTI NAGRI SIGN HASANTA +A80B ; Top # Mn SYLOTI NAGRI SIGN ANUSVARA +A826 ; Top # Mn SYLOTI NAGRI VOWEL SIGN E +A8C5 ; Top # Mn SAURASHTRA SIGN CANDRABINDU +A8E0..A8F1 ; Top # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +A8FF ; Top # Mn DEVANAGARI VOWEL SIGN AY +A926..A92A ; Top # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O +A94A ; Top # Mn REJANG VOWEL SIGN AI +A94F..A951 ; Top # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A980..A982 ; Top # Mn [3] JAVANESE SIGN PANYANGGA..JAVANESE SIGN LAYAR +A9B3 ; Top # Mn JAVANESE SIGN 
CECAK TELU +A9B6..A9B7 ; Top # Mn [2] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN WULU MELIK +A9BC ; Top # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Top # Mn MYANMAR SIGN SHAN SAW +AA29..AA2C ; Top # Mn [4] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN EI +AA2E ; Top # Mn CHAM VOWEL SIGN OE +AA31 ; Top # Mn CHAM VOWEL SIGN AU +AA43 ; Top # Mn CHAM CONSONANT SIGN FINAL NG +AA4C ; Top # Mn CHAM CONSONANT SIGN FINAL M +AA7C ; Top # Mn MYANMAR SIGN TAI LAING TONE-2 +AAB0 ; Top # Mn TAI VIET MAI KANG +AAB2..AAB3 ; Top # Mn [2] TAI VIET VOWEL I..TAI VIET VOWEL UE +AAB7..AAB8 ; Top # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AABE..AABF ; Top # Mn [2] TAI VIET VOWEL AM..TAI VIET TONE MAI EK +AAC1 ; Top # Mn TAI VIET TONE MAI THO +AAED ; Top # Mn MEETEI MAYEK VOWEL SIGN AAI +ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP +10A05 ; Top # Mn KHAROSHTHI VOWEL SIGN E +10A0F ; Top # Mn KHAROSHTHI SIGN VISARGA +10A38 ; Top # Mn KHAROSHTHI SIGN BAR ABOVE +11001 ; Top # Mn BRAHMI SIGN ANUSVARA +11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II +11042..11046 ; Top # Mn [5] BRAHMI VOWEL SIGN E..BRAHMI VIRAMA +11070 ; Top # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11073..11074 ; Top # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +11080..11081 ; Top # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI VOWEL SIGN AI +11100..11102 ; Top # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA +11127..11129 ; Top # Mn [3] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN II +1112D ; Top # Mn CHAKMA VOWEL SIGN AI +11130 ; Top # Mn CHAKMA VOWEL SIGN OI +11134 ; Top # Mn CHAKMA MAAYYAA +11180..11181 ; Top # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +111BC..111BE ; Top # Mn [3] SHARADA VOWEL SIGN E..SHARADA VOWEL SIGN O +111C2..111C3 ; Top # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA +111CB ; Top # Mn SHARADA VOWEL MODIFIER MARK +111CF ; Top # Mn SHARADA SIGN INVERTED CANDRABINDU 
+11230..11231 ; Top # Mn [2] KHOJKI VOWEL SIGN E..KHOJKI VOWEL SIGN AI +11234 ; Top # Mn KHOJKI SIGN ANUSVARA +11236..11237 ; Top # Mn [2] KHOJKI SIGN NUKTA..KHOJKI SIGN SHADDA +1123E ; Top # Mn KHOJKI SIGN SUKUN +112DF ; Top # Mn KHUDAWADI SIGN ANUSVARA +112E5..112E8 ; Top # Mn [4] KHUDAWADI VOWEL SIGN E..KHUDAWADI VOWEL SIGN AU +11300..11301 ; Top # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11340 ; Top # Mn GRANTHA VOWEL SIGN II +11366..1136C ; Top # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Top # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA +113CE ; Top # Mn TULU-TIGALARI SIGN VIRAMA +113D1 ; Top # Lo TULU-TIGALARI REPHA +113E1 ; Top # Mn TULU-TIGALARI VEDIC TONE SVARITA +1143E..1143F ; Top # Mn [2] NEWA VOWEL SIGN E..NEWA VOWEL SIGN AI +11443..11444 ; Top # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +1145E ; Top # Mn NEWA SANDHI MARK +114BA ; Top # Mn TIRHUTA VOWEL SIGN SHORT E +114BF..114C0 ; Top # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Top # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +11639..1163A ; Top # Mn [2] MODI VOWEL SIGN E..MODI VOWEL SIGN AI +1163D ; Top # Mn MODI SIGN ANUSVARA +11640 ; Top # Mn MODI SIGN ARDHACANDRA +116AB ; Top # Mn TAKRI SIGN ANUSVARA +116AD ; Top # Mn TAKRI VOWEL SIGN AA +116B2..116B5 ; Top # Mn [4] TAKRI VOWEL SIGN E..TAKRI VOWEL SIGN AU +1171F ; Top # Mn AHOM CONSONANT SIGN MEDIAL LIGATING RA +11722..11723 ; Top # Mn [2] AHOM VOWEL SIGN I..AHOM VOWEL SIGN II +11727 ; Top # Mn AHOM VOWEL SIGN AW +11729..1172B ; Top # Mn [3] AHOM VOWEL SIGN AI..AHOM SIGN KILLER +11833..11837 ; Top # Mn [5] DOGRA VOWEL SIGN E..DOGRA SIGN ANUSVARA +1193B..1193C ; Top # Mn [2] DIVES AKURU SIGN ANUSVARA..DIVES AKURU SIGN CANDRABINDU +1193F ; Top # Lo DIVES AKURU PREFIXED NASAL SIGN +11941 ; Top # Lo DIVES AKURU INITIAL RA +119DA..119DB ; Top # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI +11A01 ; Top # 
Mn ZANABAZAR SQUARE VOWEL SIGN I +11A04..11A09 ; Top # Mn [6] ZANABAZAR SQUARE VOWEL SIGN E..ZANABAZAR SQUARE VOWEL SIGN REVERSED I +11A35..11A38 ; Top # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A51 ; Top # Mn SOYOMBO VOWEL SIGN I +11A54..11A56 ; Top # Mn [3] SOYOMBO VOWEL SIGN E..SOYOMBO VOWEL SIGN OE +11A84..11A89 ; Top # Lo [6] SOYOMBO SIGN JIHVAMULIYA..SOYOMBO CLUSTER-INITIAL LETTER SA +11A96 ; Top # Mn SOYOMBO SIGN ANUSVARA +11A98 ; Top # Mn SOYOMBO GEMINATION MARK +11B60 ; Top # Mn SHARADA VOWEL SIGN OE +11B64 ; Top # Mn SHARADA VOWEL SIGN SHORT E +11B66 ; Top # Mn SHARADA VOWEL SIGN CANDRA E +11C30..11C31 ; Top # Mn [2] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN II +11C38..11C3D ; Top # Mn [6] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI SIGN ANUSVARA +11CB3 ; Top # Mn MARCHEN VOWEL SIGN E +11CB5..11CB6 ; Top # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU +11D31..11D35 ; Top # Mn [5] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN UU +11D3A ; Top # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Top # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F..11D41 ; Top # Mn [3] MASARAM GONDI VOWEL SIGN AU..MASARAM GONDI SIGN VISARGA +11D43 ; Top # Mn MASARAM GONDI SIGN CANDRA +11D90..11D91 ; Top # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI +11D95 ; Top # Mn GUNJALA GONDI SIGN ANUSVARA +11EF3 ; Top # Mn MAKASAR VOWEL SIGN I +11F00..11F01 ; Top # Mn [2] KAWI SIGN CANDRABINDU..KAWI SIGN ANUSVARA +11F02 ; Top # Lo KAWI SIGN REPHA +11F36..11F37 ; Top # Mn [2] KAWI VOWEL SIGN I..KAWI VOWEL SIGN II +11F40 ; Top # Mn KAWI VOWEL SIGN EU +11F5A ; Top # Mn KAWI SIGN NUKTA +1611E..16129 ; Top # Mn [12] GURUNG KHEMA VOWEL SIGN AA..GURUNG KHEMA VOWEL LENGTH MARK +1612D ; Top # Mn GURUNG KHEMA SIGN ANUSVARA + +# Indic_Positional_Category=Bottom + +093C ; Bottom # Mn DEVANAGARI SIGN NUKTA +0941..0944 ; Bottom # Mn [4] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN VOCALIC RR +094D ; Bottom # Mn 
DEVANAGARI SIGN VIRAMA +0952 ; Bottom # Mn DEVANAGARI STRESS SIGN ANUDATTA +0956..0957 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN UE..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BC ; Bottom # Mn BENGALI SIGN NUKTA +09C1..09C4 ; Bottom # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09CD ; Bottom # Mn BENGALI SIGN VIRAMA +09E2..09E3 ; Bottom # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3C ; Bottom # Mn GURMUKHI SIGN NUKTA +0A41..0A42 ; Bottom # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A4D ; Bottom # Mn GURMUKHI SIGN VIRAMA +0A51 ; Bottom # Mn GURMUKHI SIGN UDAAT +0A75 ; Bottom # Mn GURMUKHI SIGN YAKASH +0ABC ; Bottom # Mn GUJARATI SIGN NUKTA +0AC1..0AC4 ; Bottom # Mn [4] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN VOCALIC RR +0ACD ; Bottom # Mn GUJARATI SIGN VIRAMA +0AE2..0AE3 ; Bottom # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3C ; Bottom # Mn ORIYA SIGN NUKTA +0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B4D ; Bottom # Mn ORIYA SIGN VIRAMA +0B62..0B63 ; Bottom # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0C3C ; Bottom # Mn TELUGU SIGN NUKTA +0C56 ; Bottom # Mn TELUGU AI LENGTH MARK +0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBC ; Bottom # Mn KANNADA SIGN NUKTA +0CE2..0CE3 ; Bottom # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D41..0D44 ; Bottom # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D62..0D63 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DD4 ; Bottom # Mn SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Bottom # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0E38..0E3A ; Bottom # Mn [3] THAI CHARACTER SARA U..THAI CHARACTER PHINTHU +0EB8..0EBA ; Bottom # Mn [3] LAO VOWEL SIGN U..LAO SIGN PALI VIRAMA +0EBC ; Bottom # Mn LAO 
SEMIVOWEL SIGN LO +0F18..0F19 ; Bottom # Mn [2] TIBETAN ASTROLOGICAL SIGN -KHYUD PA..TIBETAN ASTROLOGICAL SIGN SDONG TSHUGS +0F35 ; Bottom # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Bottom # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0F71 ; Bottom # Mn TIBETAN VOWEL SIGN AA +0F74..0F75 ; Bottom # Mn [2] TIBETAN VOWEL SIGN U..TIBETAN VOWEL SIGN UU +0F84 ; Bottom # Mn TIBETAN MARK HALANTA +0F8D..0F97 ; Bottom # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Bottom # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +0FC6 ; Bottom # Mn TIBETAN SYMBOL PADMA GDAN +102F..1030 ; Bottom # Mn [2] MYANMAR VOWEL SIGN U..MYANMAR VOWEL SIGN UU +1037 ; Bottom # Mn MYANMAR SIGN DOT BELOW +103D..103E ; Bottom # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +1058..1059 ; Bottom # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +105E..1060 ; Bottom # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Bottom # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +108D ; Bottom # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +1713..1714 ; Bottom # Mn [2] TAGALOG VOWEL SIGN U..TAGALOG SIGN VIRAMA +1733 ; Bottom # Mn HANUNOO VOWEL SIGN U +1753 ; Bottom # Mn BUHID VOWEL SIGN U +1773 ; Bottom # Mn TAGBANWA VOWEL SIGN U +17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA +1922 ; Bottom # Mn LIMBU VOWEL SIGN U +1932 ; Bottom # Mn LIMBU SMALL LETTER ANUSVARA +1939 ; Bottom # Mn LIMBU SIGN MUKPHRENG +193B ; Bottom # Mn LIMBU SIGN SA-I +1A18 ; Bottom # Mn BUGINESE VOWEL SIGN U +1A56 ; Bottom # Mn TAI THAM CONSONANT SIGN MEDIAL LA +1A5B..1A5E ; Bottom # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1A69..1A6A ; Bottom # Mn [2] TAI THAM VOWEL SIGN U..TAI THAM VOWEL SIGN UU +1A6C ; Bottom # Mn TAI THAM VOWEL SIGN OA BELOW +1A7F ; Bottom # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1B38..1B3A ; Bottom # Mn [3] 
BALINESE VOWEL SIGN SUKU..BALINESE VOWEL SIGN RA REPA +1B6C ; Bottom # Mn BALINESE MUSICAL SYMBOL COMBINING ENDEP +1BA2..1BA3 ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BA5 ; Bottom # Mn SUNDANESE VOWEL SIGN PANYUKU +1BAC..1BAD ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C2C ; Bottom # Mn LEPCHA VOWEL SIGN E +1C37 ; Bottom # Mn LEPCHA SIGN NUKTA +1CD5..1CD9 ; Bottom # Mn [5] VEDIC TONE YAJURVEDIC AGGRAVATED INDEPENDENT SVARITA..VEDIC TONE YAJURVEDIC KATHAKA INDEPENDENT SVARITA SCHROEDER +1CDC..1CDF ; Bottom # Mn [4] VEDIC TONE KATHAKA ANUDATTA..VEDIC TONE THREE DOTS BELOW +1CED ; Bottom # Mn VEDIC SIGN TIRYAK +A825 ; Bottom # Mn SYLOTI NAGRI VOWEL SIGN U +A82C ; Bottom # Mn SYLOTI NAGRI SIGN ALTERNATE HASANTA +A8C4 ; Bottom # Mn SAURASHTRA SIGN VIRAMA +A92B..A92D ; Bottom # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +A947..A949 ; Bottom # Mn [3] REJANG VOWEL SIGN I..REJANG VOWEL SIGN E +A94B..A94E ; Bottom # Mn [4] REJANG VOWEL SIGN O..REJANG VOWEL SIGN EA +A9B8..A9B9 ; Bottom # Mn [2] JAVANESE VOWEL SIGN SUKU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BD ; Bottom # Mn JAVANESE CONSONANT SIGN KERET +AA2D ; Bottom # Mn CHAM VOWEL SIGN U +AA32 ; Bottom # Mn CHAM VOWEL SIGN UE +AA35..AA36 ; Bottom # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +AAB4 ; Bottom # Mn TAI VIET VOWEL U +AAEC ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UU +ABE8 ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK +10A02..10A03 ; Bottom # Mn [2] KHAROSHTHI VOWEL SIGN U..KHAROSHTHI VOWEL SIGN VOCALIC R +10A0C..10A0E ; Bottom # Mn [3] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN ANUSVARA +10A39..10A3A ; Bottom # Mn [2] KHAROSHTHI SIGN CAUDA..KHAROSHTHI SIGN DOT BELOW +1103C..11041 ; Bottom # Mn [6] BRAHMI VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL +110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU +110B9..110BA ; Bottom # Mn [2] KAITHI 
SIGN VIRAMA..KAITHI SIGN NUKTA +110C2 ; Bottom # Mn KAITHI VOWEL SIGN VOCALIC R +1112A..1112B ; Bottom # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU +11131..11132 ; Bottom # Mn [2] CHAKMA O MARK..CHAKMA AU MARK +11173 ; Bottom # Mn MAHAJANI SIGN NUKTA +111B6..111BB ; Bottom # Mn [6] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN VOCALIC LL +111C9..111CA ; Bottom # Mn [2] SHARADA SANDHI MARK..SHARADA SIGN NUKTA +111CC ; Bottom # Mn SHARADA EXTRA SHORT VOWEL MARK +1122F ; Bottom # Mn KHOJKI VOWEL SIGN U +11241 ; Bottom # Mn KHOJKI VOWEL SIGN VOCALIC R +112E3..112E4 ; Bottom # Mn [2] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN UU +112E9..112EA ; Bottom # Mn [2] KHUDAWADI SIGN NUKTA..KHUDAWADI SIGN VIRAMA +1133B..1133C ; Bottom # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +113BB..113C0 ; Bottom # Mn [6] TULU-TIGALARI VOWEL SIGN U..TULU-TIGALARI VOWEL SIGN VOCALIC LL +113D2 ; Bottom # Mn TULU-TIGALARI GEMINATION MARK +113E2 ; Bottom # Mn TULU-TIGALARI VEDIC TONE ANUDATTA +11438..1143D ; Bottom # Mn [6] NEWA VOWEL SIGN U..NEWA VOWEL SIGN VOCALIC LL +11442 ; Bottom # Mn NEWA SIGN VIRAMA +11446 ; Bottom # Mn NEWA SIGN NUKTA +114B3..114B8 ; Bottom # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114C2..114C3 ; Bottom # Mn [2] TIRHUTA SIGN VIRAMA..TIRHUTA SIGN NUKTA +115B2..115B5 ; Bottom # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115BF..115C0 ; Bottom # Mn [2] SIDDHAM SIGN VIRAMA..SIDDHAM SIGN NUKTA +115DC..115DD ; Bottom # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11633..11638 ; Bottom # Mn [6] MODI VOWEL SIGN U..MODI VOWEL SIGN VOCALIC LL +1163F ; Bottom # Mn MODI SIGN VIRAMA +116B0..116B1 ; Bottom # Mn [2] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN UU +116B7 ; Bottom # Mn TAKRI SIGN NUKTA +1171D ; Bottom # Mn AHOM CONSONANT SIGN MEDIAL LA +11724..11725 ; Bottom # Mn [2] AHOM VOWEL SIGN U..AHOM VOWEL SIGN UU +11728 ; Bottom # Mn AHOM VOWEL SIGN O +1182F..11832 ; Bottom # Mn [4] DOGRA VOWEL SIGN U..DOGRA VOWEL 
SIGN VOCALIC RR +11839..1183A ; Bottom # Mn [2] DOGRA SIGN VIRAMA..DOGRA SIGN NUKTA +11943 ; Bottom # Mn DIVES AKURU SIGN NUKTA +119D4..119D7 ; Bottom # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR +119E0 ; Bottom # Mn NANDINAGARI SIGN VIRAMA +11A02..11A03 ; Bottom # Mn [2] ZANABAZAR SQUARE VOWEL SIGN UE..ZANABAZAR SQUARE VOWEL SIGN U +11A0A ; Bottom # Mn ZANABAZAR SQUARE VOWEL LENGTH MARK +11A33..11A34 ; Bottom # Mn [2] ZANABAZAR SQUARE FINAL CONSONANT MARK..ZANABAZAR SQUARE SIGN VIRAMA +11A3B..11A3E ; Bottom # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11A52..11A53 ; Bottom # Mn [2] SOYOMBO VOWEL SIGN UE..SOYOMBO VOWEL SIGN U +11A59..11A5B ; Bottom # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11A8A..11A95 ; Bottom # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A +11B62..11B63 ; Bottom # Mn [2] SHARADA VOWEL SIGN UE..SHARADA VOWEL SIGN UUE +11C32..11C36 ; Bottom # Mn [5] BHAIKSUKI VOWEL SIGN U..BHAIKSUKI VOWEL SIGN VOCALIC L +11C3F ; Bottom # Mn BHAIKSUKI SIGN VIRAMA +11C92..11CA7 ; Bottom # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CAA..11CB0 ; Bottom # Mn [7] MARCHEN SUBJOINED LETTER RA..MARCHEN VOWEL SIGN AA +11CB2 ; Bottom # Mn MARCHEN VOWEL SIGN U +11D36 ; Bottom # Mn MASARAM GONDI VOWEL SIGN VOCALIC R +11D42 ; Bottom # Mn MASARAM GONDI SIGN NUKTA +11D44 ; Bottom # Mn MASARAM GONDI SIGN HALANTA +11D47 ; Bottom # Mn MASARAM GONDI RA-KARA +11EF4 ; Bottom # Mn MAKASAR VOWEL SIGN U +11F38..11F3A ; Bottom # Mn [3] KAWI VOWEL SIGN U..KAWI VOWEL SIGN VOCALIC R +1612E..1612F ; Bottom # Mn [2] GURUNG KHEMA CONSONANT SIGN MEDIAL RA..GURUNG KHEMA SIGN THOLHOMA + +# Indic_Positional_Category=Top_And_Bottom + +0C48 ; Top_And_Bottom # Mn TELUGU VOWEL SIGN AI +0F73 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN II +0F76..0F79 ; Top_And_Bottom # Mn [4] TIBETAN VOWEL SIGN VOCALIC R..TIBETAN VOWEL SIGN VOCALIC LL +0F81 ; Top_And_Bottom # Mn 
TIBETAN VOWEL SIGN REVERSED II +1B3C ; Top_And_Bottom # Mn BALINESE VOWEL SIGN LA LENGA +1112E..1112F ; Top_And_Bottom # Mn [2] CHAKMA VOWEL SIGN O..CHAKMA VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Right + +0AC9 ; Top_And_Right # Mc GUJARATI VOWEL SIGN CANDRA O +0B57 ; Top_And_Right # Mc ORIYA AU LENGTH MARK +0CC0 ; Top_And_Right # Mc KANNADA VOWEL SIGN II +0CC7..0CC8 ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +1925..1926 ; Top_And_Right # Mc [2] LIMBU VOWEL SIGN OO..LIMBU VOWEL SIGN AU +1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG +111BF ; Top_And_Right # Mc SHARADA VOWEL SIGN AU +11232..11233 ; Top_And_Right # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU +113B9..113BA ; Top_And_Right # Mc [2] TULU-TIGALARI VOWEL SIGN I..TULU-TIGALARI VOWEL SIGN II + +# Indic_Positional_Category=Top_And_Left + +0B48 ; Top_And_Left # Mc ORIYA VOWEL SIGN AI +0DDA ; Top_And_Left # Mc SINHALA VOWEL SIGN DIGA KOMBUVA +17BE ; Top_And_Left # Mc KHMER VOWEL SIGN OE +1C29 ; Top_And_Left # Mc LEPCHA VOWEL SIGN OO +114BB ; Top_And_Left # Mc TIRHUTA VOWEL SIGN AI +115B9 ; Top_And_Left # Mc SIDDHAM VOWEL SIGN AI + +# Indic_Positional_Category=Top_And_Left_And_Right + +0B4C ; Top_And_Left_And_Right # Mc ORIYA VOWEL SIGN AU +0DDD ; Top_And_Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA +17BF ; Top_And_Left_And_Right # Mc KHMER VOWEL SIGN YA +115BB ; Top_And_Left_And_Right # Mc SIDDHAM VOWEL SIGN AU + +# Indic_Positional_Category=Bottom_And_Right + +1B3B ; Bottom_And_Right # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +A9BE ; Bottom_And_Right # Mc JAVANESE CONSONANT SIGN PENGKAL +A9C0 ; Bottom_And_Right # Mc JAVANESE PANGKON +11942 ; Bottom_And_Right # Mc DIVES AKURU MEDIAL RA + +# Indic_Positional_Category=Bottom_And_Left + +A9BF ; Bottom_And_Left # Mc JAVANESE CONSONANT SIGN CAKRA + +# Indic_Positional_Category=Top_And_Bottom_And_Right + +1B3D ; 
Top_And_Bottom_And_Right # Mc BALINESE VOWEL SIGN LA LENGA TEDUNG + +# Indic_Positional_Category=Top_And_Bottom_And_Left + +103C ; Top_And_Bottom_And_Left # Mc MYANMAR CONSONANT SIGN MEDIAL RA +1171E ; Top_And_Bottom_And_Left # Mc AHOM CONSONANT SIGN MEDIAL RA + +# Indic_Positional_Category=Overstruck + +1CD4 ; Overstruck # Mn VEDIC SIGN YAJURVEDIC MIDLINE SVARITA +1CE2..1CE8 ; Overstruck # Mn [7] VEDIC SIGN VISARGA SVARITA..VEDIC SIGN VISARGA ANUDATTA WITH TAIL +10A01 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN I +10A06 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN O + +# EOF diff --git a/data/17.0.0-indic-syllabic-category.txt b/data/17.0.0-indic-syllabic-category.txt new file mode 100644 index 0000000..43287cc --- /dev/null +++ b/data/17.0.0-indic-syllabic-category.txt @@ -0,0 +1,1419 @@ +# IndicSyllabicCategory-17.0.0.txt +# Date: 2025-08-01, 04:02:23 GMT +# © 2025 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use and license, see https://www.unicode.org/terms_of_use.html +# +# Unicode Character Database +# For documentation, see https://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Syllabic_Category enumerated property +# +# Scope: This property is aimed at two general problem +# areas involving the analysis and processing of Indic scripts: +# +# 1. Specification of syllabic structure. +# 2. Specification of segmentation rules. +# +# Both of these problem areas may benefit from having defined subtypes +# of Indic script characters which are relevant to how Indic +# syllables (or aksaras) are constructed. Note that rules for +# syllabic structure in Indic scripts may differ significantly +# from how phonological syllables are defined. 
+# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Syllabic_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. +# +# The scripts assessed as Indic in the structural sense used for the +# Indic_Syllabic_Category are the following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Dives Akuru, Dogra, Grantha, Gujarati, +# Gunjala Gondi, Gurmukhi, Gurung Khema, Hanunoo, Javanese, Kaithi, +# Kannada, Kawi, Kayah Li, Kharoshthi, Khmer, Khojki, Khudawadi, +# Kirat Rai, Lao, Lepcha, Limbu, Mahajani, Makasar, Malayalam, +# Marchen, Masaram Gondi, Meetei Mayek, Modi, Multani, Myanmar, +# Nandinagari, Newa, New Tai Lue, Oriya, Phags-pa, Rejang, +# Saurashtra, Sharada, Siddham, Sinhala, Soyombo, Sundanese, +# Syloti Nagri, Tagalog, Tagbanwa, Tai Le, Tai Tham, Tai Viet, Takri, +# Tamil, Telugu, Thai, Tibetan, Tirhuta, Tulu-Tigalari, and +# Zanabazar Square. +# +# All characters for all other scripts not in that list +# take the default value for this property, unless they +# are individually listed in this data file. +# + +# ================================================ + +# Property: Indic_Syllabic_Category +# +# All code points not explicitly listed for Indic_Syllabic_Category +# have the value Other. 
+# +# @missing: 0000..10FFFF; Other + +# ================================================ + +# Indic_Syllabic_Category=Bindu + +# Bindu/Anusvara (nasalization or -n) + +# [Not derivable] + +0900..0902 ; Bindu # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +0981 ; Bindu # Mn BENGALI SIGN CANDRABINDU +0982 ; Bindu # Mc BENGALI SIGN ANUSVARA +09FC ; Bindu # Lo BENGALI LETTER VEDIC ANUSVARA +0A01..0A02 ; Bindu # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A70 ; Bindu # Mn GURMUKHI TIPPI +0A81..0A82 ; Bindu # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0B01 ; Bindu # Mn ORIYA SIGN CANDRABINDU +0B02 ; Bindu # Mc ORIYA SIGN ANUSVARA +0B82 ; Bindu # Mn TAMIL SIGN ANUSVARA +0C00 ; Bindu # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C01..0C02 ; Bindu # Mc [2] TELUGU SIGN CANDRABINDU..TELUGU SIGN ANUSVARA +0C04 ; Bindu # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C80 ; Bindu # Lo KANNADA SIGN SPACING CANDRABINDU +0C81 ; Bindu # Mn KANNADA SIGN CANDRABINDU +0C82 ; Bindu # Mc KANNADA SIGN ANUSVARA +0CF3 ; Bindu # Mc KANNADA SIGN COMBINING ANUSVARA ABOVE RIGHT +0D00..0D01 ; Bindu # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU +0D02 ; Bindu # Mc MALAYALAM SIGN ANUSVARA +0D04 ; Bindu # Lo MALAYALAM LETTER VEDIC ANUSVARA +0D81 ; Bindu # Mn SINHALA SIGN CANDRABINDU +0D82 ; Bindu # Mc SINHALA SIGN ANUSVARAYA +0E4D ; Bindu # Mn THAI CHARACTER NIKHAHIT +0ECD ; Bindu # Mn LAO NIGGAHITA +0F7E ; Bindu # Mn TIBETAN SIGN RJES SU NGA RO +0F82..0F83 ; Bindu # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +1036 ; Bindu # Mn MYANMAR SIGN ANUSVARA +17C6 ; Bindu # Mn KHMER SIGN NIKAHIT +1932 ; Bindu # Mn LIMBU SMALL LETTER ANUSVARA +1A74 ; Bindu # Mn TAI THAM SIGN MAI KANG +1B00..1B02 ; Bindu # Mn [3] BALINESE SIGN ULU RICEM..BALINESE SIGN CECEK +1B80 ; Bindu # Mn SUNDANESE SIGN PANYECEK +1C34..1C35 ; Bindu # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A80B ; Bindu # Mn SYLOTI NAGRI 
SIGN ANUSVARA +A873 ; Bindu # Lo PHAGS-PA LETTER CANDRABINDU +A880 ; Bindu # Mc SAURASHTRA SIGN ANUSVARA +A8C5 ; Bindu # Mn SAURASHTRA SIGN CANDRABINDU +A8F2..A8F3 ; Bindu # Lo [2] DEVANAGARI SIGN SPACING CANDRABINDU..DEVANAGARI SIGN CANDRABINDU VIRAMA +A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK +10A0E ; Bindu # Mn KHAROSHTHI SIGN ANUSVARA +11000 ; Bindu # Mc BRAHMI SIGN CANDRABINDU +11001 ; Bindu # Mn BRAHMI SIGN ANUSVARA +11080..11081 ; Bindu # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +11100..11101 ; Bindu # Mn [2] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN ANUSVARA +11180..11181 ; Bindu # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +111CF ; Bindu # Mn SHARADA SIGN INVERTED CANDRABINDU +11234 ; Bindu # Mn KHOJKI SIGN ANUSVARA +112DF ; Bindu # Mn KHUDAWADI SIGN ANUSVARA +11300..11301 ; Bindu # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11302 ; Bindu # Mc GRANTHA SIGN ANUSVARA +1135E..1135F ; Bindu # Lo [2] GRANTHA LETTER VEDIC ANUSVARA..GRANTHA LETTER VEDIC DOUBLE ANUSVARA +113CA ; Bindu # Mc TULU-TIGALARI SIGN CANDRA ANUNASIKA +113CC ; Bindu # Mc TULU-TIGALARI SIGN ANUSVARA +11443..11444 ; Bindu # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +1145F ; Bindu # Lo NEWA LETTER VEDIC ANUSVARA +114BF..114C0 ; Bindu # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Bindu # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +1163D ; Bindu # Mn MODI SIGN ANUSVARA +116AB ; Bindu # Mn TAKRI SIGN ANUSVARA +11837 ; Bindu # Mn DOGRA SIGN ANUSVARA +1193B..1193C ; Bindu # Mn [2] DIVES AKURU SIGN ANUSVARA..DIVES AKURU SIGN CANDRABINDU +119DE ; Bindu # Mc NANDINAGARI SIGN ANUSVARA +11A35..11A38 ; Bindu # Mn [4] ZANABAZAR SQUARE SIGN CANDRABINDU..ZANABAZAR SQUARE SIGN ANUSVARA +11A96 ; Bindu # Mn SOYOMBO SIGN ANUSVARA +11C3C..11C3D ; Bindu # Mn [2] BHAIKSUKI SIGN CANDRABINDU..BHAIKSUKI SIGN ANUSVARA +11CB5..11CB6 ; Bindu # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU 
+11D40 ; Bindu # Mn MASARAM GONDI SIGN ANUSVARA +11D95 ; Bindu # Mn GUNJALA GONDI SIGN ANUSVARA +11F00..11F01 ; Bindu # Mn [2] KAWI SIGN CANDRABINDU..KAWI SIGN ANUSVARA +1612D ; Bindu # Mn GURUNG KHEMA SIGN ANUSVARA +16D40..16D41 ; Bindu # Lm [2] KIRAT RAI SIGN ANUSVARA..KIRAT RAI SIGN TONPI + +# ================================================ + +# Indic_Syllabic_Category=Visarga + +# Visarga (-h) +# Excludes letters for jihvamuliya and upadhmaniya, which are +# related, but structured somewhat differently. + +# [Not derivable] + +0903 ; Visarga # Mc DEVANAGARI SIGN VISARGA +0983 ; Visarga # Mc BENGALI SIGN VISARGA +0A03 ; Visarga # Mc GURMUKHI SIGN VISARGA +0A83 ; Visarga # Mc GUJARATI SIGN VISARGA +0B03 ; Visarga # Mc ORIYA SIGN VISARGA +0C03 ; Visarga # Mc TELUGU SIGN VISARGA +0C83 ; Visarga # Mc KANNADA SIGN VISARGA +0D03 ; Visarga # Mc MALAYALAM SIGN VISARGA +0D83 ; Visarga # Mc SINHALA SIGN VISARGAYA +0F7F ; Visarga # Mc TIBETAN SIGN RNAM BCAD +1038 ; Visarga # Mc MYANMAR SIGN VISARGA +17C7 ; Visarga # Mc KHMER SIGN REAHMUK +1B04 ; Visarga # Mc BALINESE SIGN BISAH +1B82 ; Visarga # Mc SUNDANESE SIGN PANGWISAD +A881 ; Visarga # Mc SAURASHTRA SIGN VISARGA +A983 ; Visarga # Mc JAVANESE SIGN WIGNYAN +AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA +10A0F ; Visarga # Mn KHAROSHTHI SIGN VISARGA +11002 ; Visarga # Mc BRAHMI SIGN VISARGA +11082 ; Visarga # Mc KAITHI SIGN VISARGA +11102 ; Visarga # Mn CHAKMA SIGN VISARGA +11182 ; Visarga # Mc SHARADA SIGN VISARGA +11303 ; Visarga # Mc GRANTHA SIGN VISARGA +113CD ; Visarga # Mc TULU-TIGALARI SIGN VISARGA +11445 ; Visarga # Mc NEWA SIGN VISARGA +114C1 ; Visarga # Mc TIRHUTA SIGN VISARGA +115BE ; Visarga # Mc SIDDHAM SIGN VISARGA +1163E ; Visarga # Mc MODI SIGN VISARGA +116AC ; Visarga # Mc TAKRI SIGN VISARGA +11838 ; Visarga # Mc DOGRA SIGN VISARGA +119DF ; Visarga # Mc NANDINAGARI SIGN VISARGA +11A39 ; Visarga # Mc ZANABAZAR SQUARE SIGN VISARGA +11A97 ; Visarga # Mc SOYOMBO SIGN VISARGA +11C3E ; Visarga # Mc 
BHAIKSUKI SIGN VISARGA +11D41 ; Visarga # Mn MASARAM GONDI SIGN VISARGA +11D96 ; Visarga # Mc GUNJALA GONDI SIGN VISARGA +11F03 ; Visarga # Mc KAWI SIGN VISARGA +16D42 ; Visarga # Lm KIRAT RAI SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Avagraha + +# Avagraha (elision of initial a- in sandhi) + +# [Not derivable] + +093D ; Avagraha # Lo DEVANAGARI SIGN AVAGRAHA +09BD ; Avagraha # Lo BENGALI SIGN AVAGRAHA +0ABD ; Avagraha # Lo GUJARATI SIGN AVAGRAHA +0B3D ; Avagraha # Lo ORIYA SIGN AVAGRAHA +0C3D ; Avagraha # Lo TELUGU SIGN AVAGRAHA +0CBD ; Avagraha # Lo KANNADA SIGN AVAGRAHA +0D3D ; Avagraha # Lo MALAYALAM SIGN AVAGRAHA +0F85 ; Avagraha # Po TIBETAN MARK PALUTA +17DC ; Avagraha # Lo KHMER SIGN AVAKRAHASANYA +1BBA ; Avagraha # Lo SUNDANESE AVAGRAHA +111C1 ; Avagraha # Lo SHARADA SIGN AVAGRAHA +1133D ; Avagraha # Lo GRANTHA SIGN AVAGRAHA +113B7 ; Avagraha # Lo TULU-TIGALARI SIGN AVAGRAHA +11447 ; Avagraha # Lo NEWA SIGN AVAGRAHA +114C4 ; Avagraha # Lo TIRHUTA SIGN AVAGRAHA +119E1 ; Avagraha # Lo NANDINAGARI SIGN AVAGRAHA +11A9D ; Avagraha # Lo SOYOMBO MARK PLUTA +11C40 ; Avagraha # Lo BHAIKSUKI SIGN AVAGRAHA + +# ================================================ + +# Indic_Syllabic_Category=Nukta + +# Nukta (diacritic for borrowed consonants or other consonant +# modifications). Note that while the resulting sound is typically a +# consonant, the base letter a nukta follows may be an independent +# vowel. For example, is used to transcribe ARABIC LETTER +# AIN. 
+ +# [Not derivable] + +093C ; Nukta # Mn DEVANAGARI SIGN NUKTA +09BC ; Nukta # Mn BENGALI SIGN NUKTA +0A3C ; Nukta # Mn GURMUKHI SIGN NUKTA +0ABC ; Nukta # Mn GUJARATI SIGN NUKTA +0AFD..0AFF ; Nukta # Mn [3] GUJARATI SIGN THREE-DOT NUKTA ABOVE..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE +0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0C3C ; Nukta # Mn TELUGU SIGN NUKTA +0CBC ; Nukta # Mn KANNADA SIGN NUKTA +0F39 ; Nukta # Mn TIBETAN MARK TSA -PHRU +1B34 ; Nukta # Mn BALINESE SIGN REREKAN +1BE6 ; Nukta # Mn BATAK SIGN TOMPI +1C37 ; Nukta # Mn LEPCHA SIGN NUKTA +A9B3 ; Nukta # Mn JAVANESE SIGN CECAK TELU +10A38..10A3A ; Nukta # Mn [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW +110BA ; Nukta # Mn KAITHI SIGN NUKTA +11173 ; Nukta # Mn MAHAJANI SIGN NUKTA +111CA ; Nukta # Mn SHARADA SIGN NUKTA +11236 ; Nukta # Mn KHOJKI SIGN NUKTA +112E9 ; Nukta # Mn KHUDAWADI SIGN NUKTA +1133B..1133C ; Nukta # Mn [2] COMBINING BINDU BELOW..GRANTHA SIGN NUKTA +11446 ; Nukta # Mn NEWA SIGN NUKTA +114C3 ; Nukta # Mn TIRHUTA SIGN NUKTA +115C0 ; Nukta # Mn SIDDHAM SIGN NUKTA +116B7 ; Nukta # Mn TAKRI SIGN NUKTA +1183A ; Nukta # Mn DOGRA SIGN NUKTA +11943 ; Nukta # Mn DIVES AKURU SIGN NUKTA +11D42 ; Nukta # Mn MASARAM GONDI SIGN NUKTA +11F5A ; Nukta # Mn KAWI SIGN NUKTA + +# ================================================ + +# Indic_Syllabic_Category=Virama + +# Virama (kills inherent vowel of consonant; may act as a Pure_Killer +# or Invisible_Stacker depending on context) +# Only includes characters that can act both as visible killer viramas +# and consonant stackers. Separate property values exist for characters +# that can only act as pure killers, only as reordering killers, or only +# as consonant stackers. 
+ +# [Derivation: (ccc=9) - (InSC=Pure_Killer) - (InSC=Invisible_Stacker) +# - (InSC=Reordering_Killer) - (InSC=Number_Joiner) - 2D7F] + +094D ; Virama # Mn DEVANAGARI SIGN VIRAMA +09CD ; Virama # Mn BENGALI SIGN VIRAMA +0A4D ; Virama # Mn GURMUKHI SIGN VIRAMA +0ACD ; Virama # Mn GUJARATI SIGN VIRAMA +0B4D ; Virama # Mn ORIYA SIGN VIRAMA +0BCD ; Virama # Mn TAMIL SIGN VIRAMA +0C4D ; Virama # Mn TELUGU SIGN VIRAMA +0CCD ; Virama # Mn KANNADA SIGN VIRAMA +0D4D ; Virama # Mn MALAYALAM SIGN VIRAMA +0DCA ; Virama # Mn SINHALA SIGN AL-LAKUNA +1B44 ; Virama # Mc BALINESE ADEG ADEG +A806 ; Virama # Mn SYLOTI NAGRI SIGN HASANTA +A8C4 ; Virama # Mn SAURASHTRA SIGN VIRAMA +A9C0 ; Virama # Mc JAVANESE PANGKON +11046 ; Virama # Mn BRAHMI VIRAMA +110B9 ; Virama # Mn KAITHI SIGN VIRAMA +111C0 ; Virama # Mc SHARADA SIGN VIRAMA +11235 ; Virama # Mc KHOJKI SIGN VIRAMA +1134D ; Virama # Mc GRANTHA SIGN VIRAMA +11442 ; Virama # Mn NEWA SIGN VIRAMA +114C2 ; Virama # Mn TIRHUTA SIGN VIRAMA +115BF ; Virama # Mn SIDDHAM SIGN VIRAMA +1163F ; Virama # Mn MODI SIGN VIRAMA +116B6 ; Virama # Mc TAKRI SIGN VIRAMA +11839 ; Virama # Mn DOGRA SIGN VIRAMA +119E0 ; Virama # Mn NANDINAGARI SIGN VIRAMA +11C3F ; Virama # Mn BHAIKSUKI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Pure_Killer + +# Pure killer (kills inherent vowel of consonant; always visible; +# has no conjuct formation, consonant stacking, or reordering +# behavior) + +# [Not derivable] + +0D3B..0D3C ; Pure_Killer # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA +0E3A ; Pure_Killer # Mn THAI CHARACTER PHINTHU +0E4E ; Pure_Killer # Mn THAI CHARACTER YAMAKKAN +0EBA ; Pure_Killer # Mn LAO SIGN PALI VIRAMA +0F84 ; Pure_Killer # Mn TIBETAN MARK HALANTA +103A ; Pure_Killer # Mn MYANMAR SIGN ASAT +1714 ; Pure_Killer # Mn TAGALOG SIGN VIRAMA +1715 ; Pure_Killer # Mc TAGALOG SIGN PAMUDPOD +1734 ; Pure_Killer # Mc HANUNOO SIGN PAMUDPOD +17D1 ; Pure_Killer # Mn KHMER SIGN 
VIRIAM +1A7A ; Pure_Killer # Mn TAI THAM SIGN RA HAAM +1BAA ; Pure_Killer # Mc SUNDANESE SIGN PAMAAEH +A82C ; Pure_Killer # Mn SYLOTI NAGRI SIGN ALTERNATE HASANTA +A953 ; Pure_Killer # Mc REJANG VIRAMA +ABED ; Pure_Killer # Mn MEETEI MAYEK APUN IYEK +11070 ; Pure_Killer # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11134 ; Pure_Killer # Mn CHAKMA MAAYYAA +112EA ; Pure_Killer # Mn KHUDAWADI SIGN VIRAMA +113CE ; Pure_Killer # Mn TULU-TIGALARI SIGN VIRAMA +113CF ; Pure_Killer # Mc TULU-TIGALARI SIGN LOOPED VIRAMA +1172B ; Pure_Killer # Mn AHOM SIGN KILLER +1193D ; Pure_Killer # Mc DIVES AKURU SIGN HALANTA +11A34 ; Pure_Killer # Mn ZANABAZAR SQUARE SIGN VIRAMA +11D44 ; Pure_Killer # Mn MASARAM GONDI SIGN HALANTA +11F41 ; Pure_Killer # Mc KAWI SIGN KILLER +1612F ; Pure_Killer # Mn GURUNG KHEMA SIGN THOLHOMA +16D6B..16D6C ; Pure_Killer # Lm [2] KIRAT RAI SIGN VIRAMA..KIRAT RAI SIGN SAAT + +# ================================================ + +# Indic_Syllabic_Category=Reordering_Killer + +# Reordering killer (kills inherent vowel of consonant; always visible; +# may cause consonant reordering) + +# [Not derivable] + +1BF2..1BF3 ; Reordering_Killer # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN + +# ================================================ + +# Indic_Syllabic_Category=Invisible_Stacker + +# Invisible stacker (usually kills inherent vowel of consonant; is not visible +# by itself; causes conjunct formation or consonant +# stacking) +# +# Note that in some scripts, such as Kharoshthi and Masaram Gondi, an invisible +# stacker may have a second function, changing the shape and/or location of the +# consonant preceding it, even when there is no consonant following the +# invisible stacker. 
+ +# [Not derivable] + +1039 ; Invisible_Stacker # Mn MYANMAR SIGN VIRAMA +17D2 ; Invisible_Stacker # Mn KHMER SIGN COENG +1A60 ; Invisible_Stacker # Mn TAI THAM SIGN SAKOT +1BAB ; Invisible_Stacker # Mn SUNDANESE SIGN VIRAMA +AAF6 ; Invisible_Stacker # Mn MEETEI MAYEK VIRAMA +10A3F ; Invisible_Stacker # Mn KHAROSHTHI VIRAMA +11133 ; Invisible_Stacker # Mn CHAKMA VIRAMA +113D0 ; Invisible_Stacker # Mn TULU-TIGALARI CONJOINER +1193E ; Invisible_Stacker # Mn DIVES AKURU VIRAMA +11A47 ; Invisible_Stacker # Mn ZANABAZAR SQUARE SUBJOINER +11A99 ; Invisible_Stacker # Mn SOYOMBO SUBJOINER +11D45 ; Invisible_Stacker # Mn MASARAM GONDI VIRAMA +11D97 ; Invisible_Stacker # Mn GUNJALA GONDI VIRAMA +11F42 ; Invisible_Stacker # Mn KAWI CONJOINER + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Independent + +# Independent Vowels (contrasted with matras) + +# [Not derivable] + +0904..0914 ; Vowel_Independent # Lo [17] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER AU +0960..0961 ; Vowel_Independent # Lo [2] DEVANAGARI LETTER VOCALIC RR..DEVANAGARI LETTER VOCALIC LL +0972..0977 ; Vowel_Independent # Lo [6] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER UUE +0985..098C ; Vowel_Independent # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L +098F..0990 ; Vowel_Independent # Lo [2] BENGALI LETTER E..BENGALI LETTER AI +0993..0994 ; Vowel_Independent # Lo [2] BENGALI LETTER O..BENGALI LETTER AU +09E0..09E1 ; Vowel_Independent # Lo [2] BENGALI LETTER VOCALIC RR..BENGALI LETTER VOCALIC LL +0A05..0A0A ; Vowel_Independent # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU +0A0F..0A10 ; Vowel_Independent # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI +0A13..0A14 ; Vowel_Independent # Lo [2] GURMUKHI LETTER OO..GURMUKHI LETTER AU +0A85..0A8D ; Vowel_Independent # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E +0A8F..0A91 ; Vowel_Independent # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O +0A93..0A94 ; Vowel_Independent # Lo [2] GUJARATI LETTER 
O..GUJARATI LETTER AU +0AE0..0AE1 ; Vowel_Independent # Lo [2] GUJARATI LETTER VOCALIC RR..GUJARATI LETTER VOCALIC LL +0B05..0B0C ; Vowel_Independent # Lo [8] ORIYA LETTER A..ORIYA LETTER VOCALIC L +0B0F..0B10 ; Vowel_Independent # Lo [2] ORIYA LETTER E..ORIYA LETTER AI +0B13..0B14 ; Vowel_Independent # Lo [2] ORIYA LETTER O..ORIYA LETTER AU +0B60..0B61 ; Vowel_Independent # Lo [2] ORIYA LETTER VOCALIC RR..ORIYA LETTER VOCALIC LL +0B85..0B8A ; Vowel_Independent # Lo [6] TAMIL LETTER A..TAMIL LETTER UU +0B8E..0B90 ; Vowel_Independent # Lo [3] TAMIL LETTER E..TAMIL LETTER AI +0B92..0B94 ; Vowel_Independent # Lo [3] TAMIL LETTER O..TAMIL LETTER AU +0C05..0C0C ; Vowel_Independent # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L +0C0E..0C10 ; Vowel_Independent # Lo [3] TELUGU LETTER E..TELUGU LETTER AI +0C12..0C14 ; Vowel_Independent # Lo [3] TELUGU LETTER O..TELUGU LETTER AU +0C60..0C61 ; Vowel_Independent # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL +0C85..0C8C ; Vowel_Independent # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L +0C8E..0C90 ; Vowel_Independent # Lo [3] KANNADA LETTER E..KANNADA LETTER AI +0C92..0C94 ; Vowel_Independent # Lo [3] KANNADA LETTER O..KANNADA LETTER AU +0CE0..0CE1 ; Vowel_Independent # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL +0D05..0D0C ; Vowel_Independent # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L +0D0E..0D10 ; Vowel_Independent # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI +0D12..0D14 ; Vowel_Independent # Lo [3] MALAYALAM LETTER O..MALAYALAM LETTER AU +0D5F..0D61 ; Vowel_Independent # Lo [3] MALAYALAM LETTER ARCHAIC II..MALAYALAM LETTER VOCALIC LL +0D85..0D96 ; Vowel_Independent # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA +1021..102A ; Vowel_Independent # Lo [10] MYANMAR LETTER A..MYANMAR LETTER AU +1052..1055 ; Vowel_Independent # Lo [4] MYANMAR LETTER VOCALIC R..MYANMAR LETTER VOCALIC LL +1700..1702 ; Vowel_Independent # Lo [3] TAGALOG LETTER A..TAGALOG LETTER U 
+1720..1722 ; Vowel_Independent # Lo [3] HANUNOO LETTER A..HANUNOO LETTER U +1740..1742 ; Vowel_Independent # Lo [3] BUHID LETTER A..BUHID LETTER U +1760..1762 ; Vowel_Independent # Lo [3] TAGBANWA LETTER A..TAGBANWA LETTER U +17A3..17B3 ; Vowel_Independent # Lo [17] KHMER INDEPENDENT VOWEL QAQ..KHMER INDEPENDENT VOWEL QAU +1A4D..1A52 ; Vowel_Independent # Lo [6] TAI THAM LETTER I..TAI THAM LETTER OO +1B05..1B12 ; Vowel_Independent # Lo [14] BALINESE LETTER AKARA..BALINESE LETTER OKARA TEDUNG +1B83..1B89 ; Vowel_Independent # Lo [7] SUNDANESE LETTER A..SUNDANESE LETTER EU +1BE4..1BE5 ; Vowel_Independent # Lo [2] BATAK LETTER I..BATAK LETTER U +A800..A801 ; Vowel_Independent # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I +A803..A805 ; Vowel_Independent # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O +A882..A891 ; Vowel_Independent # Lo [16] SAURASHTRA LETTER A..SAURASHTRA LETTER AU +A8FE ; Vowel_Independent # Lo DEVANAGARI LETTER AY +A984..A988 ; Vowel_Independent # Lo [5] JAVANESE LETTER A..JAVANESE LETTER U +A98C..A98E ; Vowel_Independent # Lo [3] JAVANESE LETTER E..JAVANESE LETTER O +AA00..AA05 ; Vowel_Independent # Lo [6] CHAM LETTER A..CHAM LETTER O +AAE0..AAE1 ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER E..MEETEI MAYEK LETTER O +ABCE..ABCF ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER UN..MEETEI MAYEK LETTER I +ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA +11005..11012 ; Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU +11071..11072 ; Vowel_Independent # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER A..KAITHI LETTER AU +11103..11106 ; Vowel_Independent # Lo [4] CHAKMA LETTER AA..CHAKMA LETTER E +11183..11190 ; Vowel_Independent # Lo [14] SHARADA LETTER A..SHARADA LETTER AU +11200..11207 ; Vowel_Independent # Lo [8] KHOJKI LETTER A..KHOJKI LETTER AU +11240 ; Vowel_Independent # Lo KHOJKI LETTER SHORT I +11280..11283 ; 
Vowel_Independent # Lo [4] MULTANI LETTER A..MULTANI LETTER E +112B0..112B9 ; Vowel_Independent # Lo [10] KHUDAWADI LETTER A..KHUDAWADI LETTER AU +11305..1130C ; Vowel_Independent # Lo [8] GRANTHA LETTER A..GRANTHA LETTER VOCALIC L +1130F..11310 ; Vowel_Independent # Lo [2] GRANTHA LETTER EE..GRANTHA LETTER AI +11313..11314 ; Vowel_Independent # Lo [2] GRANTHA LETTER OO..GRANTHA LETTER AU +11360..11361 ; Vowel_Independent # Lo [2] GRANTHA LETTER VOCALIC RR..GRANTHA LETTER VOCALIC LL +11380..11389 ; Vowel_Independent # Lo [10] TULU-TIGALARI LETTER A..TULU-TIGALARI LETTER VOCALIC LL +1138B ; Vowel_Independent # Lo TULU-TIGALARI LETTER EE +1138E ; Vowel_Independent # Lo TULU-TIGALARI LETTER AI +11390..11391 ; Vowel_Independent # Lo [2] TULU-TIGALARI LETTER OO..TULU-TIGALARI LETTER AU +11400..1140D ; Vowel_Independent # Lo [14] NEWA LETTER A..NEWA LETTER AU +11481..1148E ; Vowel_Independent # Lo [14] TIRHUTA LETTER A..TIRHUTA LETTER AU +11580..1158D ; Vowel_Independent # Lo [14] SIDDHAM LETTER A..SIDDHAM LETTER AU +115D8..115DB ; Vowel_Independent # Lo [4] SIDDHAM LETTER THREE-CIRCLE ALTERNATE I..SIDDHAM LETTER ALTERNATE U +11600..1160D ; Vowel_Independent # Lo [14] MODI LETTER A..MODI LETTER AU +11680..11689 ; Vowel_Independent # Lo [10] TAKRI LETTER A..TAKRI LETTER AU +11800..11809 ; Vowel_Independent # Lo [10] DOGRA LETTER A..DOGRA LETTER AU +11900..11906 ; Vowel_Independent # Lo [7] DIVES AKURU LETTER A..DIVES AKURU LETTER E +11909 ; Vowel_Independent # Lo DIVES AKURU LETTER O +119A0..119A7 ; Vowel_Independent # Lo [8] NANDINAGARI LETTER A..NANDINAGARI LETTER VOCALIC RR +119AA..119AD ; Vowel_Independent # Lo [4] NANDINAGARI LETTER E..NANDINAGARI LETTER AU +11C00..11C08 ; Vowel_Independent # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L +11C0A..11C0D ; Vowel_Independent # Lo [4] BHAIKSUKI LETTER E..BHAIKSUKI LETTER AU +11D00..11D06 ; Vowel_Independent # Lo [7] MASARAM GONDI LETTER A..MASARAM GONDI LETTER E +11D08..11D09 ; Vowel_Independent # Lo [2] MASARAM 
GONDI LETTER AI..MASARAM GONDI LETTER O +11D0B ; Vowel_Independent # Lo MASARAM GONDI LETTER AU +11D60..11D65 ; Vowel_Independent # Lo [6] GUNJALA GONDI LETTER A..GUNJALA GONDI LETTER UU +11D67..11D68 ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER EE..GUNJALA GONDI LETTER AI +11D6A..11D6B ; Vowel_Independent # Lo [2] GUNJALA GONDI LETTER OO..GUNJALA GONDI LETTER AU +11F04..11F10 ; Vowel_Independent # Lo [13] KAWI LETTER A..KAWI LETTER O +16100 ; Vowel_Independent # Lo GURUNG KHEMA LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Dependent + +# Dependent Vowels (contrasted with independent vowels and/or with +# complex placement). Known as matras in Indic scripts. Also +# includes vowel modifiers that follow dependent (and sometimes +# independent) vowels. + +# [Not derivable] + +093A ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN OE +093B ; Vowel_Dependent # Mc DEVANAGARI VOWEL SIGN OOE +093E..0940 ; Vowel_Dependent # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II +0941..0948 ; Vowel_Dependent # Mn [8] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN AI +0949..094C ; Vowel_Dependent # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094E..094F ; Vowel_Dependent # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA E..DEVANAGARI VOWEL SIGN AW +0955..0957 ; Vowel_Dependent # Mn [3] DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Vowel_Dependent # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BE..09C0 ; Vowel_Dependent # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II +09C1..09C4 ; Vowel_Dependent # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09C7..09C8 ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +09CB..09CC ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +09D7 ; Vowel_Dependent # Mc BENGALI AU LENGTH MARK +09E2..09E3 ; Vowel_Dependent # Mn [2] BENGALI VOWEL SIGN VOCALIC 
L..BENGALI VOWEL SIGN VOCALIC LL +0A3E..0A40 ; Vowel_Dependent # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II +0A41..0A42 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A47..0A48 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0ABE..0AC0 ; Vowel_Dependent # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL SIGN II +0AC1..0AC5 ; Vowel_Dependent # Mn [5] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AC9 ; Vowel_Dependent # Mc GUJARATI VOWEL SIGN CANDRA O +0ACB..0ACC ; Vowel_Dependent # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0AE2..0AE3 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3E ; Vowel_Dependent # Mc ORIYA VOWEL SIGN AA +0B3F ; Vowel_Dependent # Mn ORIYA VOWEL SIGN I +0B40 ; Vowel_Dependent # Mc ORIYA VOWEL SIGN II +0B41..0B44 ; Vowel_Dependent # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B47..0B48 ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI +0B4B..0B4C ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU +0B55..0B56 ; Vowel_Dependent # Mn [2] ORIYA SIGN OVERLINE..ORIYA AI LENGTH MARK +0B57 ; Vowel_Dependent # Mc ORIYA AU LENGTH MARK +0B62..0B63 ; Vowel_Dependent # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BBE..0BBF ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC0 ; Vowel_Dependent # Mn TAMIL VOWEL SIGN II +0BC1..0BC2 ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BC6..0BC8 ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0BCA..0BCC ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0BD7 ; Vowel_Dependent # Mc TAMIL AU LENGTH MARK +0C3E..0C40 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II 
+0C41..0C44 ; Vowel_Dependent # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C46..0C48 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI +0C4A..0C4C ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C55..0C56 ; Vowel_Dependent # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK +0C62..0C63 ; Vowel_Dependent # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBE ; Vowel_Dependent # Mc KANNADA VOWEL SIGN AA +0CBF ; Vowel_Dependent # Mn KANNADA VOWEL SIGN I +0CC0..0CC4 ; Vowel_Dependent # Mc [5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN VOCALIC RR +0CC6 ; Vowel_Dependent # Mn KANNADA VOWEL SIGN E +0CC7..0CC8 ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +0CCC ; Vowel_Dependent # Mn KANNADA VOWEL SIGN AU +0CD5..0CD6 ; Vowel_Dependent # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CE2..0CE3 ; Vowel_Dependent # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D3E..0D40 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D44 ; Vowel_Dependent # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D46..0D48 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0D4A..0D4C ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0D57 ; Vowel_Dependent # Mc MALAYALAM AU LENGTH MARK +0D62..0D63 ; Vowel_Dependent # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DCF..0DD1 ; Vowel_Dependent # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD2..0DD4 ; Vowel_Dependent # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Vowel_Dependent # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0DD8..0DDF ; Vowel_Dependent # Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Vowel_Dependent # 
Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Vowel_Dependent # Lo THAI CHARACTER SARA A +0E31 ; Vowel_Dependent # Mn THAI CHARACTER MAI HAN-AKAT +0E32..0E33 ; Vowel_Dependent # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E34..0E39 ; Vowel_Dependent # Mn [6] THAI CHARACTER SARA I..THAI CHARACTER SARA UU +0E40..0E45 ; Vowel_Dependent # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO +0E47 ; Vowel_Dependent # Mn THAI CHARACTER MAITAIKHU +0EB0 ; Vowel_Dependent # Lo LAO VOWEL SIGN A +0EB1 ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KAN +0EB2..0EB3 ; Vowel_Dependent # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0EB4..0EB9 ; Vowel_Dependent # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU +0EBB ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KON +0EC0..0EC4 ; Vowel_Dependent # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +0F71..0F7D ; Vowel_Dependent # Mn [13] TIBETAN VOWEL SIGN AA..TIBETAN VOWEL SIGN OO +0F80..0F81 ; Vowel_Dependent # Mn [2] TIBETAN VOWEL SIGN REVERSED I..TIBETAN VOWEL SIGN REVERSED II +102B..102C ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +102D..1030 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN UU +1031 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN E +1032..1035 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +1056..1057 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1058..1059 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1062 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1071..1074 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1083..1084 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E +1085..1086 ; Vowel_Dependent # Mn [2] MYANMAR 
VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109C ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN AITON A +109D ; Vowel_Dependent # Mn MYANMAR VOWEL SIGN AITON AI +1712..1713 ; Vowel_Dependent # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U +1732..1733 ; Vowel_Dependent # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1752..1753 ; Vowel_Dependent # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U +1772..1773 ; Vowel_Dependent # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U +17B6 ; Vowel_Dependent # Mc KHMER VOWEL SIGN AA +17B7..17BD ; Vowel_Dependent # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL SIGN UA +17BE..17C5 ; Vowel_Dependent # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU +17C8 ; Vowel_Dependent # Mc KHMER SIGN YUUKALEAPINTU +1920..1922 ; Vowel_Dependent # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U +1923..1926 ; Vowel_Dependent # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU +1927..1928 ; Vowel_Dependent # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Vowel_Dependent # Mn LIMBU SIGN KEMPHRENG +19B0..19C0 ; Vowel_Dependent # Lo [17] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN IY +1A17..1A18 ; Vowel_Dependent # Mn [2] BUGINESE VOWEL SIGN I..BUGINESE VOWEL SIGN U +1A19..1A1A ; Vowel_Dependent # Mc [2] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN O +1A1B ; Vowel_Dependent # Mn BUGINESE VOWEL SIGN AE +1A61 ; Vowel_Dependent # Mc TAI THAM VOWEL SIGN A +1A62 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN MAI SAT +1A63..1A64 ; Vowel_Dependent # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A65..1A6C ; Vowel_Dependent # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW +1A6D..1A72 ; Vowel_Dependent # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI +1A73 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN OA ABOVE +1B35 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN TEDUNG +1B36..1B3A ; Vowel_Dependent # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA +1B3B ; Vowel_Dependent # Mc BALINESE 
VOWEL SIGN RA REPA TEDUNG +1B3C ; Vowel_Dependent # Mn BALINESE VOWEL SIGN LA LENGA +1B3D..1B41 ; Vowel_Dependent # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1B42 ; Vowel_Dependent # Mn BALINESE VOWEL SIGN PEPET +1B43 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN PEPET TEDUNG +1BA4..1BA5 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PANGHULU..SUNDANESE VOWEL SIGN PANYUKU +1BA6..1BA7 ; Vowel_Dependent # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL SIGN PANOLONG +1BA8..1BA9 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE7 ; Vowel_Dependent # Mc BATAK VOWEL SIGN E +1BE8..1BE9 ; Vowel_Dependent # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BEA..1BEC ; Vowel_Dependent # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BED ; Vowel_Dependent # Mn BATAK VOWEL SIGN KARO O +1BEE ; Vowel_Dependent # Mc BATAK VOWEL SIGN U +1BEF ; Vowel_Dependent # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +1C26..1C2B ; Vowel_Dependent # Mc [6] LEPCHA VOWEL SIGN AA..LEPCHA VOWEL SIGN UU +1C2C ; Vowel_Dependent # Mn LEPCHA VOWEL SIGN E +A802 ; Vowel_Dependent # Mn SYLOTI NAGRI SIGN DVISVARA +A823..A824 ; Vowel_Dependent # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A825..A826 ; Vowel_Dependent # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E +A827 ; Vowel_Dependent # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Vowel_Dependent # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A8FF ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN AY +A947..A94E ; Vowel_Dependent # Mn [8] REJANG VOWEL SIGN I..REJANG VOWEL SIGN EA +A9B4..A9B5 ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9B6..A9B9 ; Vowel_Dependent # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BA..A9BB ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +A9BC ; Vowel_Dependent # Mn JAVANESE VOWEL SIGN PEPET +A9E5 
; Vowel_Dependent # Mn MYANMAR SIGN SHAN SAW +AA29..AA2E ; Vowel_Dependent # Mn [6] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN OE +AA2F..AA30 ; Vowel_Dependent # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA31..AA32 ; Vowel_Dependent # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE +AAB0 ; Vowel_Dependent # Mn TAI VIET MAI KANG +AAB1 ; Vowel_Dependent # Lo TAI VIET VOWEL AA +AAB2..AAB4 ; Vowel_Dependent # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U +AAB5..AAB6 ; Vowel_Dependent # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB7..AAB8 ; Vowel_Dependent # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AAB9..AABD ; Vowel_Dependent # Lo [5] TAI VIET VOWEL UEA..TAI VIET VOWEL AN +AABE ; Vowel_Dependent # Mn TAI VIET VOWEL AM +AAEB ; Vowel_Dependent # Mc MEETEI MAYEK VOWEL SIGN II +AAEC..AAED ; Vowel_Dependent # Mn [2] MEETEI MAYEK VOWEL SIGN UU..MEETEI MAYEK VOWEL SIGN AAI +AAEE..AAEF ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN AU..MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE5 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN ANAP +ABE6..ABE7 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE8 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +10A01..10A03 ; Vowel_Dependent # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R +10A05..10A06 ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O +10A0C..10A0D ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN DOUBLE RING BELOW +11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +11073..11074 ; Vowel_Dependent # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +110B0..110B2 ; Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II +110B3..110B6 ; Vowel_Dependent # Mn [4] 
KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI +110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +110C2 ; Vowel_Dependent # Mn KAITHI VOWEL SIGN VOCALIC R +11127..1112B ; Vowel_Dependent # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU +1112C ; Vowel_Dependent # Mc CHAKMA VOWEL SIGN E +1112D..11132 ; Vowel_Dependent # Mn [6] CHAKMA VOWEL SIGN AI..CHAKMA AU MARK +11145..11146 ; Vowel_Dependent # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI +111B3..111B5 ; Vowel_Dependent # Mc [3] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN II +111B6..111BE ; Vowel_Dependent # Mn [9] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN O +111BF ; Vowel_Dependent # Mc SHARADA VOWEL SIGN AU +111CB..111CC ; Vowel_Dependent # Mn [2] SHARADA VOWEL MODIFIER MARK..SHARADA EXTRA SHORT VOWEL MARK +111CE ; Vowel_Dependent # Mc SHARADA VOWEL SIGN PRISHTHAMATRA E +1122C..1122E ; Vowel_Dependent # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +1122F..11231 ; Vowel_Dependent # Mn [3] KHOJKI VOWEL SIGN U..KHOJKI VOWEL SIGN AI +11232..11233 ; Vowel_Dependent # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU +11241 ; Vowel_Dependent # Mn KHOJKI VOWEL SIGN VOCALIC R +112E0..112E2 ; Vowel_Dependent # Mc [3] KHUDAWADI VOWEL SIGN AA..KHUDAWADI VOWEL SIGN II +112E3..112E8 ; Vowel_Dependent # Mn [6] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN AU +1133E..1133F ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11340 ; Vowel_Dependent # Mn GRANTHA VOWEL SIGN II +11341..11344 ; Vowel_Dependent # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +11347..11348 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +1134B..1134C ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +11357 ; Vowel_Dependent # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +113B8..113BA ; Vowel_Dependent # Mc [3] TULU-TIGALARI VOWEL SIGN AA..TULU-TIGALARI VOWEL 
SIGN II +113BB..113C0 ; Vowel_Dependent # Mn [6] TULU-TIGALARI VOWEL SIGN U..TULU-TIGALARI VOWEL SIGN VOCALIC LL +113C2 ; Vowel_Dependent # Mc TULU-TIGALARI VOWEL SIGN EE +113C5 ; Vowel_Dependent # Mc TULU-TIGALARI VOWEL SIGN AI +113C7..113C9 ; Vowel_Dependent # Mc [3] TULU-TIGALARI VOWEL SIGN OO..TULU-TIGALARI AU LENGTH MARK +11435..11437 ; Vowel_Dependent # Mc [3] NEWA VOWEL SIGN AA..NEWA VOWEL SIGN II +11438..1143F ; Vowel_Dependent # Mn [8] NEWA VOWEL SIGN U..NEWA VOWEL SIGN AI +11440..11441 ; Vowel_Dependent # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +114B0..114B2 ; Vowel_Dependent # Mc [3] TIRHUTA VOWEL SIGN AA..TIRHUTA VOWEL SIGN II +114B3..114B8 ; Vowel_Dependent # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114B9 ; Vowel_Dependent # Mc TIRHUTA VOWEL SIGN E +114BA ; Vowel_Dependent # Mn TIRHUTA VOWEL SIGN SHORT E +114BB..114BE ; Vowel_Dependent # Mc [4] TIRHUTA VOWEL SIGN AI..TIRHUTA VOWEL SIGN AU +115AF..115B1 ; Vowel_Dependent # Mc [3] SIDDHAM VOWEL SIGN AA..SIDDHAM VOWEL SIGN II +115B2..115B5 ; Vowel_Dependent # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115B8..115BB ; Vowel_Dependent # Mc [4] SIDDHAM VOWEL SIGN E..SIDDHAM VOWEL SIGN AU +115DC..115DD ; Vowel_Dependent # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11630..11632 ; Vowel_Dependent # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +11633..1163A ; Vowel_Dependent # Mn [8] MODI VOWEL SIGN U..MODI VOWEL SIGN AI +1163B..1163C ; Vowel_Dependent # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +11640 ; Vowel_Dependent # Mn MODI SIGN ARDHACANDRA +116AD ; Vowel_Dependent # Mn TAKRI VOWEL SIGN AA +116AE..116AF ; Vowel_Dependent # Mc [2] TAKRI VOWEL SIGN I..TAKRI VOWEL SIGN II +116B0..116B5 ; Vowel_Dependent # Mn [6] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN AU +11720..11721 ; Vowel_Dependent # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +11722..11725 ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN I..AHOM VOWEL SIGN UU +11726 ; Vowel_Dependent # Mc 
AHOM VOWEL SIGN E +11727..1172A ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN AW..AHOM VOWEL SIGN AM +1182C..1182E ; Vowel_Dependent # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II +1182F..11836 ; Vowel_Dependent # Mn [8] DOGRA VOWEL SIGN U..DOGRA VOWEL SIGN AU +11930..11935 ; Vowel_Dependent # Mc [6] DIVES AKURU VOWEL SIGN AA..DIVES AKURU VOWEL SIGN E +11937..11938 ; Vowel_Dependent # Mc [2] DIVES AKURU VOWEL SIGN AI..DIVES AKURU VOWEL SIGN O +119D1..119D3 ; Vowel_Dependent # Mc [3] NANDINAGARI VOWEL SIGN AA..NANDINAGARI VOWEL SIGN II +119D4..119D7 ; Vowel_Dependent # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR +119DA..119DB ; Vowel_Dependent # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI +119DC..119DD ; Vowel_Dependent # Mc [2] NANDINAGARI VOWEL SIGN O..NANDINAGARI VOWEL SIGN AU +119E4 ; Vowel_Dependent # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E +11A01..11A0A ; Vowel_Dependent # Mn [10] ZANABAZAR SQUARE VOWEL SIGN I..ZANABAZAR SQUARE VOWEL LENGTH MARK +11A51..11A56 ; Vowel_Dependent # Mn [6] SOYOMBO VOWEL SIGN I..SOYOMBO VOWEL SIGN OE +11A57..11A58 ; Vowel_Dependent # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU +11A59..11A5B ; Vowel_Dependent # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK +11B60 ; Vowel_Dependent # Mn SHARADA VOWEL SIGN OE +11B61 ; Vowel_Dependent # Mc SHARADA VOWEL SIGN OOE +11B62..11B64 ; Vowel_Dependent # Mn [3] SHARADA VOWEL SIGN UE..SHARADA VOWEL SIGN SHORT E +11B65 ; Vowel_Dependent # Mc SHARADA VOWEL SIGN SHORT O +11B66 ; Vowel_Dependent # Mn SHARADA VOWEL SIGN CANDRA E +11B67 ; Vowel_Dependent # Mc SHARADA VOWEL SIGN CANDRA O +11C2F ; Vowel_Dependent # Mc BHAIKSUKI VOWEL SIGN AA +11C30..11C36 ; Vowel_Dependent # Mn [7] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN VOCALIC L +11C38..11C3B ; Vowel_Dependent # Mn [4] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI VOWEL SIGN AU +11CB0 ; Vowel_Dependent # Mn MARCHEN VOWEL SIGN AA +11CB1 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN I +11CB2..11CB3 ; 
Vowel_Dependent # Mn [2] MARCHEN VOWEL SIGN U..MARCHEN VOWEL SIGN E +11CB4 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN O +11D31..11D36 ; Vowel_Dependent # Mn [6] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN VOCALIC R +11D3A ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN E +11D3C..11D3D ; Vowel_Dependent # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O +11D3F ; Vowel_Dependent # Mn MASARAM GONDI VOWEL SIGN AU +11D43 ; Vowel_Dependent # Mn MASARAM GONDI SIGN CANDRA +11D8A..11D8E ; Vowel_Dependent # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU +11D90..11D91 ; Vowel_Dependent # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI +11D93..11D94 ; Vowel_Dependent # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU +11EF3..11EF4 ; Vowel_Dependent # Mn [2] MAKASAR VOWEL SIGN I..MAKASAR VOWEL SIGN U +11EF5..11EF6 ; Vowel_Dependent # Mc [2] MAKASAR VOWEL SIGN E..MAKASAR VOWEL SIGN O +11F34..11F35 ; Vowel_Dependent # Mc [2] KAWI VOWEL SIGN AA..KAWI VOWEL SIGN ALTERNATE AA +11F36..11F3A ; Vowel_Dependent # Mn [5] KAWI VOWEL SIGN I..KAWI VOWEL SIGN VOCALIC R +11F3E..11F3F ; Vowel_Dependent # Mc [2] KAWI VOWEL SIGN E..KAWI VOWEL SIGN AI +11F40 ; Vowel_Dependent # Mn KAWI VOWEL SIGN EU +1611E..16129 ; Vowel_Dependent # Mn [12] GURUNG KHEMA VOWEL SIGN AA..GURUNG KHEMA VOWEL LENGTH MARK +16D63..16D6A ; Vowel_Dependent # Lo [8] KIRAT RAI VOWEL SIGN AA..KIRAT RAI VOWEL SIGN AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel + +# (Other) Vowels (reanalyzed as ordinary alphabetic letters or marks) + +# [Not derivable] + +1963..196D ; Vowel # Lo [11] TAI LE LETTER A..TAI LE LETTER AI +A85E..A861 ; Vowel # Lo [4] PHAGS-PA LETTER I..PHAGS-PA LETTER O +A866 ; Vowel # Lo PHAGS-PA LETTER EE +A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO +A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O +11150..11154 ; Vowel # Lo [5] MAHAJANI LETTER A..MAHAJANI LETTER 
O + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Placeholder + +# Consonant Placeholder +# This includes generic placeholders used for +# Indic script layout (NBSP and dotted circle), as well as a few script- +# specific vowel-holder characters which are not technically +# consonants, but serve instead as bases for placement of vowel marks. +# Vowel carriers that are null consonants instead have the +# Indic_Syllabic_Category Consonant. + +# [Not derivable] + +002D ; Consonant_Placeholder # Pd HYPHEN-MINUS +00A0 ; Consonant_Placeholder # Zs NO-BREAK SPACE +00D7 ; Consonant_Placeholder # Sm MULTIPLICATION SIGN +0980 ; Consonant_Placeholder # Lo BENGALI ANJI +0A72..0A73 ; Consonant_Placeholder # Lo [2] GURMUKHI IRI..GURMUKHI URA +104B ; Consonant_Placeholder # Po MYANMAR SIGN SECTION +104E ; Consonant_Placeholder # Po MYANMAR SYMBOL AFOREMENTIONED +1CFA ; Consonant_Placeholder # Lo VEDIC SIGN DOUBLE ANUSVARA ANTARGOMUKHA +2010..2014 ; Consonant_Placeholder # Pd [5] HYPHEN..EM DASH +25CC ; Consonant_Placeholder # So DOTTED CIRCLE +AA74..AA76 ; Consonant_Placeholder # Lo [3] MYANMAR LOGOGRAM KHAMTI OAY..MYANMAR LOGOGRAM KHAMTI HM +11A3F ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL HEAD MARK +11A45 ; Consonant_Placeholder # Po ZANABAZAR SQUARE INITIAL DOUBLE-LINED HEAD MARK +11EF2 ; Consonant_Placeholder # Lo MAKASAR ANGKA + +# ================================================ + +# Indic_Syllabic_Category=Consonant + +# Consonant +# This includes ordinary abugida consonants with inherent vowels. +# In scripts that do not have distinct independent vowel characters, but instead +# form independent vowels by adding dependent vowels to a vowel carrier which +# otherwise represents the inherent vowel, that vowel carrier has the +# Indic_Syllabic_Category Consonant, as a null consonant. Such vowel carriers +# can often also be analyzed as glottal stops with inherent vowels. +# An example is U+0F68 TIBETAN LETTER A. 
+ +# [Not derivable] + +0915..0939 ; Consonant # Lo [37] DEVANAGARI LETTER KA..DEVANAGARI LETTER HA +0958..095F ; Consonant # Lo [8] DEVANAGARI LETTER QA..DEVANAGARI LETTER YYA +0978..097F ; Consonant # Lo [8] DEVANAGARI LETTER MARWARI DDA..DEVANAGARI LETTER BBA +0995..09A8 ; Consonant # Lo [20] BENGALI LETTER KA..BENGALI LETTER NA +09AA..09B0 ; Consonant # Lo [7] BENGALI LETTER PA..BENGALI LETTER RA +09B2 ; Consonant # Lo BENGALI LETTER LA +09B6..09B9 ; Consonant # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA +09DC..09DD ; Consonant # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA +09DF ; Consonant # Lo BENGALI LETTER YYA +09F0..09F1 ; Consonant # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH LOWER DIAGONAL +0A15..0A28 ; Consonant # Lo [20] GURMUKHI LETTER KA..GURMUKHI LETTER NA +0A2A..0A30 ; Consonant # Lo [7] GURMUKHI LETTER PA..GURMUKHI LETTER RA +0A32..0A33 ; Consonant # Lo [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA +0A35..0A36 ; Consonant # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA +0A38..0A39 ; Consonant # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA +0A59..0A5C ; Consonant # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA +0A5E ; Consonant # Lo GURMUKHI LETTER FA +0A95..0AA8 ; Consonant # Lo [20] GUJARATI LETTER KA..GUJARATI LETTER NA +0AAA..0AB0 ; Consonant # Lo [7] GUJARATI LETTER PA..GUJARATI LETTER RA +0AB2..0AB3 ; Consonant # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA +0AB5..0AB9 ; Consonant # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA +0AF9 ; Consonant # Lo GUJARATI LETTER ZHA +0B15..0B28 ; Consonant # Lo [20] ORIYA LETTER KA..ORIYA LETTER NA +0B2A..0B30 ; Consonant # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA +0B32..0B33 ; Consonant # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA +0B35..0B39 ; Consonant # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA +0B5C..0B5D ; Consonant # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA +0B5F ; Consonant # Lo ORIYA LETTER YYA +0B71 ; Consonant # Lo ORIYA LETTER WA +0B95 ; Consonant # Lo TAMIL 
LETTER KA +0B99..0B9A ; Consonant # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA +0B9C ; Consonant # Lo TAMIL LETTER JA +0B9E..0B9F ; Consonant # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA +0BA3..0BA4 ; Consonant # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA +0BA8..0BAA ; Consonant # Lo [3] TAMIL LETTER NA..TAMIL LETTER PA +0BAE..0BB9 ; Consonant # Lo [12] TAMIL LETTER MA..TAMIL LETTER HA +0C15..0C28 ; Consonant # Lo [20] TELUGU LETTER KA..TELUGU LETTER NA +0C2A..0C39 ; Consonant # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C58..0C5A ; Consonant # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C95..0CA8 ; Consonant # Lo [20] KANNADA LETTER KA..KANNADA LETTER NA +0CAA..0CB3 ; Consonant # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA +0CB5..0CB9 ; Consonant # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA +0CDE ; Consonant # Lo KANNADA LETTER FA +0D15..0D3A ; Consonant # Lo [38] MALAYALAM LETTER KA..MALAYALAM LETTER TTTA +0D9A..0DB1 ; Consonant # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA +0DB3..0DBB ; Consonant # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA +0DBD ; Consonant # Lo SINHALA LETTER DANTAJA LAYANNA +0DC0..0DC6 ; Consonant # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA +0E01..0E2E ; Consonant # Lo [46] THAI CHARACTER KO KAI..THAI CHARACTER HO NOKHUK +0E81..0E82 ; Consonant # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG +0E84 ; Consonant # Lo LAO LETTER KHO TAM +0E86..0E8A ; Consonant # Lo [5] LAO LETTER PALI GHA..LAO LETTER SO TAM +0E8C..0EA3 ; Consonant # Lo [24] LAO LETTER PALI JHA..LAO LETTER LO LING +0EA5 ; Consonant # Lo LAO LETTER LO LOOT +0EA7..0EAE ; Consonant # Lo [8] LAO LETTER WO..LAO LETTER HO TAM +0EDC..0EDF ; Consonant # Lo [4] LAO HO NO..LAO LETTER KHMU NYO +0F40..0F47 ; Consonant # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA +0F49..0F6C ; Consonant # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA +1000..1020 ; Consonant # Lo [33] MYANMAR LETTER KA..MYANMAR LETTER LLA +103F ; Consonant # Lo 
MYANMAR LETTER GREAT SA +1050..1051 ; Consonant # Lo [2] MYANMAR LETTER SHA..MYANMAR LETTER SSA +105A..105D ; Consonant # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE +1061 ; Consonant # Lo MYANMAR LETTER SGAW KAREN SHA +1065..1066 ; Consonant # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER WESTERN PWO KAREN PWA +106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA +1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA +108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA +1703..1711 ; Consonant # Lo [15] TAGALOG LETTER KA..TAGALOG LETTER HA +171F ; Consonant # Lo TAGALOG LETTER ARCHAIC RA +1723..1731 ; Consonant # Lo [15] HANUNOO LETTER KA..HANUNOO LETTER HA +1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA +1763..176C ; Consonant # Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA +176E..1770 ; Consonant # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA +1780..17A2 ; Consonant # Lo [35] KHMER LETTER KA..KHMER LETTER QA +1900..191E ; Consonant # Lo [31] LIMBU VOWEL-CARRIER LETTER..LIMBU LETTER TRA +1950..1962 ; Consonant # Lo [19] TAI LE LETTER KA..TAI LE LETTER NA +1980..19AB ; Consonant # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI LUE LETTER LOW SUA +1A00..1A16 ; Consonant # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA +1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA +1A53..1A54 ; Consonant # Lo [2] TAI THAM LETTER LAE..TAI THAM LETTER GREAT SA +1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA +1B45..1B4C ; Consonant # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA +1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA +1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA +1BBB..1BBD ; Consonant # Lo [3] SUNDANESE LETTER REU..SUNDANESE LETTER BHA +1BC0..1BE3 ; Consonant # Lo [36] BATAK LETTER A..BATAK LETTER MBA +1C00..1C23 ; 
Consonant # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A +1C4D..1C4F ; Consonant # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA +A807..A80A ; Consonant # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO +A80C..A822 ; Consonant # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO +A840..A85D ; Consonant # Lo [30] PHAGS-PA LETTER KA..PHAGS-PA LETTER A +A862..A865 ; Consonant # Lo [4] PHAGS-PA LETTER QA..PHAGS-PA LETTER GGA +A869..A870 ; Consonant # Lo [8] PHAGS-PA LETTER TTA..PHAGS-PA LETTER ASPIRATED FA +A872 ; Consonant # Lo PHAGS-PA SUPERFIXED LETTER RA +A892..A8B3 ; Consonant # Lo [34] SAURASHTRA LETTER KA..SAURASHTRA LETTER LLA +A90A..A921 ; Consonant # Lo [24] KAYAH LI LETTER KA..KAYAH LI LETTER CA +A930..A946 ; Consonant # Lo [23] REJANG LETTER KA..REJANG LETTER A +A989..A98B ; Consonant # Lo [3] JAVANESE LETTER PA CEREK..JAVANESE LETTER NGA LELET RASWADI +A98F..A9B2 ; Consonant # Lo [36] JAVANESE LETTER KA..JAVANESE LETTER HA +A9E0..A9E4 ; Consonant # Lo [5] MYANMAR LETTER SHAN GHA..MYANMAR LETTER SHAN BHA +A9E7..A9EF ; Consonant # Lo [9] MYANMAR LETTER TAI LAING NYA..MYANMAR LETTER TAI LAING NNA +A9FA..A9FE ; Consonant # Lo [5] MYANMAR LETTER TAI LAING LLA..MYANMAR LETTER TAI LAING BHA +AA06..AA28 ; Consonant # Lo [35] CHAM LETTER KA..CHAM LETTER HA +AA60..AA6F ; Consonant # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA +AA71..AA73 ; Consonant # Lo [3] MYANMAR LETTER KHAMTI XA..MYANMAR LETTER KHAMTI RA +AA7A ; Consonant # Lo MYANMAR LETTER AITON RA +AA7E..AA7F ; Consonant # Lo [2] MYANMAR LETTER SHWE PALAUNG CHA..MYANMAR LETTER SHWE PALAUNG SHA +AA80..AAAF ; Consonant # Lo [48] TAI VIET LETTER LOW KO..TAI VIET LETTER HIGH O +AAE2..AAEA ; Consonant # Lo [9] MEETEI MAYEK LETTER CHA..MEETEI MAYEK LETTER SSA +ABC0..ABCD ; Consonant # Lo [14] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER HUK +ABD0 ; Consonant # Lo MEETEI MAYEK LETTER PHAM +ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTER BHAM +10A00 ; Consonant # Lo 
KHAROSHTHI LETTER A +10A10..10A13 ; Consonant # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA +10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA +10A19..10A35 ; Consonant # Lo [29] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER VHA +11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER OLD TAMIL NNNA +11075 ; Consonant # Lo BRAHMI LETTER OLD TAMIL LLA +1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA +11107..11126 ; Consonant # Lo [32] CHAKMA LETTER KAA..CHAKMA LETTER HAA +11144 ; Consonant # Lo CHAKMA LETTER LHAA +11147 ; Consonant # Lo CHAKMA LETTER VAA +11155..11172 ; Consonant # Lo [30] MAHAJANI LETTER KA..MAHAJANI LETTER RRA +11191..111B2 ; Consonant # Lo [34] SHARADA LETTER KA..SHARADA LETTER HA +11208..11211 ; Consonant # Lo [10] KHOJKI LETTER KA..KHOJKI LETTER JJA +11213..1122B ; Consonant # Lo [25] KHOJKI LETTER NYA..KHOJKI LETTER LLA +1123F ; Consonant # Lo KHOJKI LETTER QA +11284..11286 ; Consonant # Lo [3] MULTANI LETTER KA..MULTANI LETTER GA +11288 ; Consonant # Lo MULTANI LETTER GHA +1128A..1128D ; Consonant # Lo [4] MULTANI LETTER CA..MULTANI LETTER JJA +1128F..1129D ; Consonant # Lo [15] MULTANI LETTER NYA..MULTANI LETTER BA +1129F..112A8 ; Consonant # Lo [10] MULTANI LETTER BHA..MULTANI LETTER RHA +112BA..112DE ; Consonant # Lo [37] KHUDAWADI LETTER KA..KHUDAWADI LETTER HA +11315..11328 ; Consonant # Lo [20] GRANTHA LETTER KA..GRANTHA LETTER NA +1132A..11330 ; Consonant # Lo [7] GRANTHA LETTER PA..GRANTHA LETTER RA +11332..11333 ; Consonant # Lo [2] GRANTHA LETTER LA..GRANTHA LETTER LLA +11335..11339 ; Consonant # Lo [5] GRANTHA LETTER VA..GRANTHA LETTER HA +11392..113B5 ; Consonant # Lo [36] TULU-TIGALARI LETTER KA..TULU-TIGALARI LETTER LLLA +1140E..11434 ; Consonant # Lo [39] NEWA LETTER KA..NEWA LETTER HA +1148F..114AF ; Consonant # Lo [33] TIRHUTA LETTER KA..TIRHUTA LETTER HA +1158E..115AE ; Consonant # Lo [33] SIDDHAM LETTER KA..SIDDHAM LETTER HA +1160E..1162F ; Consonant # Lo [34] 
MODI LETTER KA..MODI LETTER LLA +1168A..116AA ; Consonant # Lo [33] TAKRI LETTER KA..TAKRI LETTER RRA +116B8 ; Consonant # Lo TAKRI LETTER ARCHAIC KHA +11700..1171A ; Consonant # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA +11740..11746 ; Consonant # Lo [7] AHOM LETTER CA..AHOM LETTER LLA +1180A..1182B ; Consonant # Lo [34] DOGRA LETTER KA..DOGRA LETTER RRA +1190C..11913 ; Consonant # Lo [8] DIVES AKURU LETTER KA..DIVES AKURU LETTER JA +11915..11916 ; Consonant # Lo [2] DIVES AKURU LETTER NYA..DIVES AKURU LETTER TTA +11918..1192F ; Consonant # Lo [24] DIVES AKURU LETTER DDA..DIVES AKURU LETTER ZA +119AE..119D0 ; Consonant # Lo [35] NANDINAGARI LETTER KA..NANDINAGARI LETTER RRA +11A00 ; Consonant # Lo ZANABAZAR SQUARE LETTER A +11A0B..11A32 ; Consonant # Lo [40] ZANABAZAR SQUARE LETTER KA..ZANABAZAR SQUARE LETTER KSSA +11A50 ; Consonant # Lo SOYOMBO LETTER A +11A5C..11A83 ; Consonant # Lo [40] SOYOMBO LETTER KA..SOYOMBO LETTER KSSA +11C0E..11C2E ; Consonant # Lo [33] BHAIKSUKI LETTER KA..BHAIKSUKI LETTER HA +11C72..11C8F ; Consonant # Lo [30] MARCHEN LETTER KA..MARCHEN LETTER A +11D0C..11D30 ; Consonant # Lo [37] MASARAM GONDI LETTER KA..MASARAM GONDI LETTER TRA +11D6C..11D89 ; Consonant # Lo [30] GUNJALA GONDI LETTER YA..GUNJALA GONDI LETTER SA +11EE0..11EF1 ; Consonant # Lo [18] MAKASAR LETTER KA..MAKASAR LETTER A +11F12..11F33 ; Consonant # Lo [34] KAWI LETTER KA..KAWI LETTER JNYA +16101..1611D ; Consonant # Lo [29] GURUNG KHEMA LETTER KA..GURUNG KHEMA LETTER SA +16D43..16D62 ; Consonant # Lo [32] KIRAT RAI LETTER A..KIRAT RAI LETTER HA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Dead + +# Dead Consonant (special consonant with killed vowel) + +# [Not derivable] + +09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0C5D ; Consonant_Dead # Lo TELUGU LETTER NAKAARA POLLU +0CDD ; Consonant_Dead # Lo KANNADA LETTER NAKAARA POLLU +0D54..0D56 ; Consonant_Dead # Lo [3] MALAYALAM LETTER CHILLU M..MALAYALAM LETTER 
CHILLU LLL +0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K +1CF2..1CF3 ; Consonant_Dead # Lo [2] VEDIC SIGN ARDHAVISARGA..VEDIC SIGN ROTATED ARDHAVISARGA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_With_Stacker + +# Consonants that may cause conjunct formation or consonant stacking with the +# next consonant, without the use of a stacker + +# [Not derivable] + +0CF1..0CF2 ; Consonant_With_Stacker # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA +1CF5..1CF6 ; Consonant_With_Stacker # Lo [2] VEDIC SIGN JIHVAMULIYA..VEDIC SIGN UPADHMANIYA +11003..11004 ; Consonant_With_Stacker # Lo [2] BRAHMI SIGN JIHVAMULIYA..BRAHMI SIGN UPADHMANIYA +11460..11461 ; Consonant_With_Stacker # Lo [2] NEWA SIGN JIHVAMULIYA..NEWA SIGN UPADHMANIYA +11A3A ; Consonant_With_Stacker # Lo ZANABAZAR SQUARE CLUSTER-INITIAL LETTER RA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Prefixed + +# Other consonants that behave like a Consonant_Preceding_Repha + +# [Not derivable] + +111C2..111C3 ; Consonant_Prefixed # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA +1193F ; Consonant_Prefixed # Lo DIVES AKURU PREFIXED NASAL SIGN +11A84..11A85 ; Consonant_Prefixed # Lo [2] SOYOMBO SIGN JIHVAMULIYA..SOYOMBO SIGN UPADHMANIYA +11A87..11A89 ; Consonant_Prefixed # Lo [3] SOYOMBO CLUSTER-INITIAL LETTER LA..SOYOMBO CLUSTER-INITIAL LETTER SA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Preceding_Repha + +# Cluster-initial "r" consonants in the form of a dependent sign (also known as +# "repha") that precede the base character in the encoding order, but are +# reordered in text rendering to be somewhere after the base. Reanalyzed in +# some orthographies to be a final consonant. 
+ +# [Not derivable] + +0D4E ; Consonant_Preceding_Repha # Lo MALAYALAM LETTER DOT REPH +113D1 ; Consonant_Preceding_Repha # Lo TULU-TIGALARI REPHA +11941 ; Consonant_Preceding_Repha # Lo DIVES AKURU INITIAL RA +11A86 ; Consonant_Preceding_Repha # Lo SOYOMBO CLUSTER-INITIAL LETTER RA +11D46 ; Consonant_Preceding_Repha # Lo MASARAM GONDI REPHA +11F02 ; Consonant_Preceding_Repha # Lo KAWI SIGN REPHA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Initial_Postfixed + +# Other consonants that behave like a Consonant_Succeeding_Repha + +# [Not derivable] + +1A5A ; Consonant_Initial_Postfixed # Mn TAI THAM CONSONANT SIGN LOW PA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Succeeding_Repha + +# Cluster-initial "r" consonants that behave like a Consonant_Preceding_Repha +# but succeed the base character in the encoding order, and are thus not +# reordered in text rendering. Reanalyzed in some orthographies to be a final +# consonant. + +# [Not derivable] + +17CC ; Consonant_Succeeding_Repha # Mn KHMER SIGN ROBAT + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Subjoined + +# Subjoined Consonant (C2 form subtending a base consonant in Tibetan, etc.) 
+ +# [Not derivable] + +0F8D..0F97 ; Consonant_Subjoined # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Consonant_Subjoined # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +1929..192B ; Consonant_Subjoined # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1A57 ; Consonant_Subjoined # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A5B..1A5E ; Consonant_Subjoined # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1BA1 ; Consonant_Subjoined # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA2..1BA3 ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BAC..1BAD ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C24..1C25 ; Consonant_Subjoined # Mc [2] LEPCHA SUBJOINED LETTER YA..LEPCHA SUBJOINED LETTER RA +A867..A868 ; Consonant_Subjoined # Lo [2] PHAGS-PA SUBJOINED LETTER WA..PHAGS-PA SUBJOINED LETTER YA +A871 ; Consonant_Subjoined # Lo PHAGS-PA SUBJOINED LETTER RA +11C92..11CA7 ; Consonant_Subjoined # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CA9 ; Consonant_Subjoined # Mc MARCHEN SUBJOINED LETTER YA +11CAA..11CAF ; Consonant_Subjoined # Mn [6] MARCHEN SUBJOINED LETTER RA..MARCHEN SUBJOINED LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Medial + +# Medial Consonant (medial liquid, occurring in clusters) + +# [Not derivable] + +0A75 ; Consonant_Medial # Mn GURMUKHI SIGN YAKASH +0EBC ; Consonant_Medial # Mn LAO SEMIVOWEL SIGN LO +0EBD ; Consonant_Medial # Lo LAO SEMIVOWEL SIGN NYO +103B..103C ; Consonant_Medial # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA +103D..103E ; Consonant_Medial # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +105E..1060 ; Consonant_Medial # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT 
SIGN MON MEDIAL LA +1082 ; Consonant_Medial # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +1A55 ; Consonant_Medial # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A56 ; Consonant_Medial # Mn TAI THAM CONSONANT SIGN MEDIAL LA +A8B4 ; Consonant_Medial # Mc SAURASHTRA CONSONANT SIGN HAARU +A9BD ; Consonant_Medial # Mn JAVANESE CONSONANT SIGN KERET +A9BE..A9BF ; Consonant_Medial # Mc [2] JAVANESE CONSONANT SIGN PENGKAL..JAVANESE CONSONANT SIGN CAKRA +AA33..AA34 ; Consonant_Medial # Mc [2] CHAM CONSONANT SIGN YA..CHAM CONSONANT SIGN RA +AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +1171D ; Consonant_Medial # Mn AHOM CONSONANT SIGN MEDIAL LA +1171E ; Consonant_Medial # Mc AHOM CONSONANT SIGN MEDIAL RA +1171F ; Consonant_Medial # Mn AHOM CONSONANT SIGN MEDIAL LIGATING RA +11940 ; Consonant_Medial # Mc DIVES AKURU MEDIAL YA +11942 ; Consonant_Medial # Mc DIVES AKURU MEDIAL RA +11A3B..11A3E ; Consonant_Medial # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA +11D47 ; Consonant_Medial # Mn MASARAM GONDI RA-KARA +1612A..1612C ; Consonant_Medial # Mc [3] GURUNG KHEMA CONSONANT SIGN MEDIAL YA..GURUNG KHEMA CONSONANT SIGN MEDIAL HA +1612E ; Consonant_Medial # Mn GURUNG KHEMA CONSONANT SIGN MEDIAL RA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Final + +# Final Consonant (special final forms which do not take vowels) + +# [Not derivable] + +1930..1931 ; Consonant_Final # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Consonant_Final # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +1939 ; Consonant_Final # Mn LIMBU SIGN MUKPHRENG +19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B +1A58..1A59 ; Consonant_Final # Mn [2] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN FINAL NGA +1B03 ; Consonant_Final # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Final # Mn SUNDANESE SIGN PANGLAYAR +1BBE..1BBF ; 
Consonant_Final # Lo [2] SUNDANESE LETTER FINAL K..SUNDANESE LETTER FINAL M +1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H +1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +A94F..A951 ; Consonant_Final # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A952 ; Consonant_Final # Mc REJANG CONSONANT SIGN H +A982 ; Consonant_Final # Mn JAVANESE SIGN LAYAR +AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG +AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG +AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS +AA4C ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL M +AA4D ; Consonant_Final # Mc CHAM CONSONANT SIGN FINAL H +ABDB..ABE2 ; Consonant_Final # Lo [8] MEETEI MAYEK LETTER KOK LONSUM..MEETEI MAYEK LETTER I LONSUM +11A8A..11A95 ; Consonant_Final # Mn [12] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO FINAL CONSONANT SIGN -A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Head_Letter + +# Head Letter (Tibetan) + +# [Not derivable] + +0F88..0F8C ; Consonant_Head_Letter # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN + +# ================================================ + +# Indic_Syllabic_Category=Modifying_Letter + +# Reanalyzed letters not participating in the abugida structure, but +# serving to modify the sound of an adjacent vowel or consonant. +# Note that this is not the same as General_Category=Modifier_Letter. 
+ +# [Not derivable] + +0B83 ; Modifying_Letter # Lo TAMIL SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Tone_Letter + +# Tone Letter (spacing lexical tone mark with status as a letter) + +# [Not derivable] + +1970..1974 ; Tone_Letter # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6 +AAC0 ; Tone_Letter # Lo TAI VIET TONE MAI NUENG +AAC2 ; Tone_Letter # Lo TAI VIET TONE MAI SONG + +# ================================================ + +# Indic_Syllabic_Category=Tone_Mark + +# Tone Mark (nonspacing or spacing lexical tone mark) + +# [Not derivable] + +0E48..0E4B ; Tone_Mark # Mn [4] THAI CHARACTER MAI EK..THAI CHARACTER MAI CHATTAWA +0EC8..0ECB ; Tone_Mark # Mn [4] LAO TONE MAI EK..LAO TONE MAI CATAWA +1037 ; Tone_Mark # Mn MYANMAR SIGN DOT BELOW +1063..1064 ; Tone_Mark # Mc [2] MYANMAR TONE MARK SGAW KAREN HATHI..MYANMAR TONE MARK SGAW KAREN KE PHO +1069..106D ; Tone_Mark # Mc [5] MYANMAR SIGN WESTERN PWO KAREN TONE-1..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1087..108C ; Tone_Mark # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108D ; Tone_Mark # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +108F ; Tone_Mark # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109B ; Tone_Mark # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 +19C8..19C9 ; Tone_Mark # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A75..1A79 ; Tone_Mark # Mn [5] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN TONE-5 +A92B..A92D ; Tone_Mark # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +AA7B ; Tone_Mark # Mc MYANMAR SIGN PAO KAREN TONE +AA7C ; Tone_Mark # Mn MYANMAR SIGN TAI LAING TONE-2 +AA7D ; Tone_Mark # Mc MYANMAR SIGN TAI LAING TONE-5 +AABF ; Tone_Mark # Mn TAI VIET TONE MAI EK +AAC1 ; Tone_Mark # Mn TAI VIET TONE MAI THO +ABEC ; Tone_Mark # Mc MEETEI MAYEK LUM IYEK + +# ================================================ + +# Indic_Syllabic_Category=Gemination_Mark + +# Gemination Mark (doubling of the 
preceding or following consonant) +# +# U+0A71 GURMUKHI ADDAK precedes the consonant it geminates, while the +# others follow the consonant they geminate. + +# [Not derivable] + +0A71 ; Gemination_Mark # Mn GURMUKHI ADDAK +0AFB ; Gemination_Mark # Mn GUJARATI SIGN SHADDA +11237 ; Gemination_Mark # Mn KHOJKI SIGN SHADDA +113D2 ; Gemination_Mark # Mn TULU-TIGALARI GEMINATION MARK +11A98 ; Gemination_Mark # Mn SOYOMBO GEMINATION MARK + +# ================================================ + +# Indic_Syllabic_Category=Cantillation_Mark + +# Cantillation Mark (recitation marks, such as svara markers for the Samaveda) + +# [Not derivable] + +0951..0952 ; Cantillation_Mark # Mn [2] DEVANAGARI STRESS SIGN UDATTA..DEVANAGARI STRESS SIGN ANUDATTA +0A51 ; Cantillation_Mark # Mn GURMUKHI SIGN UDAAT +0AFA ; Cantillation_Mark # Mn GUJARATI SIGN SUKUN +0AFC ; Cantillation_Mark # Mn GUJARATI SIGN MADDAH +1CD0..1CD2 ; Cantillation_Mark # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CD4..1CE0 ; Cantillation_Mark # Mn [13] VEDIC SIGN YAJURVEDIC MIDLINE SVARITA..VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CE1 ; Cantillation_Mark # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF4 ; Cantillation_Mark # Mn VEDIC TONE CANDRA ABOVE +1CF7 ; Cantillation_Mark # Mc VEDIC SIGN ATIKRAMA +1CF8..1CF9 ; Cantillation_Mark # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE +20F0 ; Cantillation_Mark # Mn COMBINING ASTERISK ABOVE +A8E0..A8F1 ; Cantillation_Mark # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +1123E ; Cantillation_Mark # Mn KHOJKI SIGN SUKUN +11366..1136C ; Cantillation_Mark # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Cantillation_Mark # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA +113E1..113E2 ; Cantillation_Mark # Mn [2] TULU-TIGALARI VEDIC TONE SVARITA..TULU-TIGALARI VEDIC TONE ANUDATTA + +# ================================================ + +# 
Indic_Syllabic_Category=Register_Shifter + +# Register Shifter (shifts register for consonants, akin to a tone mark) + +# [Not derivable] + +17C9..17CA ; Register_Shifter # Mn [2] KHMER SIGN MUUSIKATOAN..KHMER SIGN TRIISAP + +# ================================================ + +# Indic_Syllabic_Category=Syllable_Modifier + +# Syllable Modifier (miscellaneous combining characters that modify +# something in the orthographic syllable they succeed or appear in) + +# [Not derivable] + +00B2..00B3 ; Syllable_Modifier # No [2] SUPERSCRIPT TWO..SUPERSCRIPT THREE +09FE ; Syllable_Modifier # Mn BENGALI SANDHI MARK +0ECE ; Syllable_Modifier # Mn LAO YAMAKKAN +0F35 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0FC6 ; Syllable_Modifier # Mn TIBETAN SYMBOL PADMA GDAN +17CB ; Syllable_Modifier # Mn KHMER SIGN BANTOC +17CE..17D0 ; Syllable_Modifier # Mn [3] KHMER SIGN KAKABAT..KHMER SIGN SAMYOK SANNYA +17D3 ; Syllable_Modifier # Mn KHMER SIGN BATHAMASAT +17DD ; Syllable_Modifier # Mn KHMER SIGN ATTHACAN +193B ; Syllable_Modifier # Mn LIMBU SIGN SA-I +1A7B..1A7C ; Syllable_Modifier # Mn [2] TAI THAM SIGN MAI SAM..TAI THAM SIGN KHUEN-LUE KARAN +1A7F ; Syllable_Modifier # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1C36 ; Syllable_Modifier # Mn LEPCHA SIGN RAN +1DFB ; Syllable_Modifier # Mn COMBINING DELETION MARK +2074 ; Syllable_Modifier # No SUPERSCRIPT FOUR +2082..2084 ; Syllable_Modifier # No [3] SUBSCRIPT TWO..SUBSCRIPT FOUR +111C9 ; Syllable_Modifier # Mn SHARADA SANDHI MARK +1145E ; Syllable_Modifier # Mn NEWA SANDHI MARK +11A33 ; Syllable_Modifier # Mn ZANABAZAR SQUARE FINAL CONSONANT MARK + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Killer + +# Consonant Killer (signifies that the previous consonant or consonants are +# not pronounced) + +# [Not derivable] + +0E4C ; Consonant_Killer # Mn THAI CHARACTER THANTHAKHAT +17CD ; Consonant_Killer # Mn KHMER 
SIGN TOANDAKHIAT + +# ================================================ + +# Indic_Syllabic_Category=Non_Joiner + +# Non_Joiner (Zero Width Non-Joiner) + +# [Not derivable] + +200C ; Non_Joiner # Cf ZERO WIDTH NON-JOINER + +# ================================================ + +# Indic_Syllabic_Category=Joiner + +# Joiner (Zero Width Joiner) + +# [Not derivable] + +200D ; Joiner # Cf ZERO WIDTH JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number_Joiner + +# Number_Joiner (forms ligatures between numbers for multiplication) + +# [Not derivable] + +1107F ; Number_Joiner # Mn BRAHMI NUMBER JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number + +# Number (can be used as vowel-holders like consonant placeholders) +# Note: A number may even hold subjoined consonants which may in turn +# have been formed using a virama or a stacker, e.g. the sequence +# where THAI THAM LETTER LOW TA is subjoined to +# TAI THAM THAM DIGIT THREE using an invisible stacker. 
+ +# [Not derivable] + +0030..0039 ; Number # Nd [10] DIGIT ZERO..DIGIT NINE +0966..096F ; Number # Nd [10] DEVANAGARI DIGIT ZERO..DEVANAGARI DIGIT NINE +09E6..09EF ; Number # Nd [10] BENGALI DIGIT ZERO..BENGALI DIGIT NINE +0A66..0A6F ; Number # Nd [10] GURMUKHI DIGIT ZERO..GURMUKHI DIGIT NINE +0AE6..0AEF ; Number # Nd [10] GUJARATI DIGIT ZERO..GUJARATI DIGIT NINE +0B66..0B6F ; Number # Nd [10] ORIYA DIGIT ZERO..ORIYA DIGIT NINE +0BE6..0BEF ; Number # Nd [10] TAMIL DIGIT ZERO..TAMIL DIGIT NINE +0C66..0C6F ; Number # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE +0CE6..0CEF ; Number # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE +0D66..0D6F ; Number # Nd [10] MALAYALAM DIGIT ZERO..MALAYALAM DIGIT NINE +0DE6..0DEF ; Number # Nd [10] SINHALA LITH DIGIT ZERO..SINHALA LITH DIGIT NINE +0E50..0E59 ; Number # Nd [10] THAI DIGIT ZERO..THAI DIGIT NINE +0ED0..0ED9 ; Number # Nd [10] LAO DIGIT ZERO..LAO DIGIT NINE +0F20..0F29 ; Number # Nd [10] TIBETAN DIGIT ZERO..TIBETAN DIGIT NINE +0F2A..0F33 ; Number # No [10] TIBETAN DIGIT HALF ONE..TIBETAN DIGIT HALF ZERO +1040..1049 ; Number # Nd [10] MYANMAR DIGIT ZERO..MYANMAR DIGIT NINE +1090..1099 ; Number # Nd [10] MYANMAR SHAN DIGIT ZERO..MYANMAR SHAN DIGIT NINE +17E0..17E9 ; Number # Nd [10] KHMER DIGIT ZERO..KHMER DIGIT NINE +1946..194F ; Number # Nd [10] LIMBU DIGIT ZERO..LIMBU DIGIT NINE +19D0..19D9 ; Number # Nd [10] NEW TAI LUE DIGIT ZERO..NEW TAI LUE DIGIT NINE +19DA ; Number # No NEW TAI LUE THAM DIGIT ONE +1A80..1A89 ; Number # Nd [10] TAI THAM HORA DIGIT ZERO..TAI THAM HORA DIGIT NINE +1A90..1A99 ; Number # Nd [10] TAI THAM THAM DIGIT ZERO..TAI THAM THAM DIGIT NINE +1B50..1B59 ; Number # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE +1BB0..1BB9 ; Number # Nd [10] SUNDANESE DIGIT ZERO..SUNDANESE DIGIT NINE +1C40..1C49 ; Number # Nd [10] LEPCHA DIGIT ZERO..LEPCHA DIGIT NINE +A8D0..A8D9 ; Number # Nd [10] SAURASHTRA DIGIT ZERO..SAURASHTRA DIGIT NINE +A900..A909 ; Number # Nd [10] KAYAH LI DIGIT ZERO..KAYAH LI DIGIT NINE 
+A9D0..A9D9 ; Number # Nd [10] JAVANESE DIGIT ZERO..JAVANESE DIGIT NINE +A9F0..A9F9 ; Number # Nd [10] MYANMAR TAI LAING DIGIT ZERO..MYANMAR TAI LAING DIGIT NINE +AA50..AA59 ; Number # Nd [10] CHAM DIGIT ZERO..CHAM DIGIT NINE +ABF0..ABF9 ; Number # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE +10A40..10A48 ; Number # No [9] KHAROSHTHI DIGIT ONE..KHAROSHTHI FRACTION ONE HALF +11066..1106F ; Number # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11136..1113F ; Number # Nd [10] CHAKMA DIGIT ZERO..CHAKMA DIGIT NINE +111D0..111D9 ; Number # Nd [10] SHARADA DIGIT ZERO..SHARADA DIGIT NINE +111E1..111F4 ; Number # No [20] SINHALA ARCHAIC DIGIT ONE..SINHALA ARCHAIC NUMBER ONE THOUSAND +112F0..112F9 ; Number # Nd [10] KHUDAWADI DIGIT ZERO..KHUDAWADI DIGIT NINE +11450..11459 ; Number # Nd [10] NEWA DIGIT ZERO..NEWA DIGIT NINE +114D0..114D9 ; Number # Nd [10] TIRHUTA DIGIT ZERO..TIRHUTA DIGIT NINE +11650..11659 ; Number # Nd [10] MODI DIGIT ZERO..MODI DIGIT NINE +116C0..116C9 ; Number # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE +116D0..116E3 ; Number # Nd [20] MYANMAR PAO DIGIT ZERO..MYANMAR EASTERN PWO KAREN DIGIT NINE +11730..11739 ; Number # Nd [10] AHOM DIGIT ZERO..AHOM DIGIT NINE +1173A..1173B ; Number # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY +11950..11959 ; Number # Nd [10] DIVES AKURU DIGIT ZERO..DIVES AKURU DIGIT NINE +11C50..11C59 ; Number # Nd [10] BHAIKSUKI DIGIT ZERO..BHAIKSUKI DIGIT NINE +11C5A..11C6C ; Number # No [19] BHAIKSUKI NUMBER ONE..BHAIKSUKI HUNDREDS UNIT MARK +11D50..11D59 ; Number # Nd [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE +11DA0..11DA9 ; Number # Nd [10] GUNJALA GONDI DIGIT ZERO..GUNJALA GONDI DIGIT NINE +11F50..11F59 ; Number # Nd [10] KAWI DIGIT ZERO..KAWI DIGIT NINE +16130..16139 ; Number # Nd [10] GURUNG KHEMA DIGIT ZERO..GURUNG KHEMA DIGIT NINE +16D70..16D79 ; Number # Nd [10] KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE + +# ================================================ + +# 
Indic_Syllabic_Category=Brahmi_Joining_Number + +# Brahmi Joining Number (may be joined by a Number_Joiner of the same +# script, e.g. in Brahmi) +# +# Note: These are different from Numbers, in the way that there is no known +# evidence of Brahmi Joining Numbers taking vowels or subjoined consonants. +# Until such evidence is found, implementations may assume that Brahmi +# Joining Numbers only participate in shaping with other Brahmi Joining +# Numbers. + +# [Not derivable] + +11052..11065 ; Brahmi_Joining_Number # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND + +# EOF diff --git a/data/6.0.0-indic-positional-category.txt b/data/6.0.0-indic-positional-category.txt new file mode 100644 index 0000000..c5f2e11 --- /dev/null +++ b/data/6.0.0-indic-positional-category.txt @@ -0,0 +1,418 @@ +# IndicMatraCategory-6.0.0.txt +# Date: 2010-07-14, 15:03:00 PDT [KW] +# +# Unicode Character Database +# Copyright (c) 1991-2010 Unicode, Inc. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# For documentation, see UAX #44. +# +# This file defines the following provisional property: +# +# Indic_Matra_Category enumerated property +# +# NB: Provisional properties and data files have no associated stability +# guarantees. They are provided in part to determine the possible usefulness +# of a property or other data and to encourage analysis and further investigation +# which may result in their improvement. Provisional properties and +# data files may change arbitrarily, or may even be removed in a future version of the +# Unicode Character Database, if they prove not to be useful. +# +# Scope: This provisional property is aimed at the problem of +# the specification of syllabic structure for Indic scripts. +# Because dependent vowels (and visible viramas, where they occur) +# are placed in notional slots around the consonant (or consonant +# cluster) core of an Indic syllable, there may be cooccurrence +# constraints or other interactions. 
Also, it may be desirable, +# in cases where more than one dependent vowel may occur in +# sequence, as for example, in a top slot and a bottom slot, to +# specify preferred orders for spelling. As such, this property +# is designed primarily to supplement the Indic_Syllabic_Category +# property. +# +# Note that this provisional property is *not* intended as +# a prescriptive property regarding display or font design, +# for a number of reasons. Good font design requires information +# that is outside the context of a character encoding standard, +# and is best handled in other venues. For Indic dependent +# vowels, in particular: +# +# 1. Matra placement may vary somewhat based on typeface design. +# 2. Matra placement, even within a single script, may vary +# somewhat according to historic period or local conventions. +# 3. Matra placement may be changed by explicit orthographic reform +# decisions. +# 4. Matras may ligate in various ways with a consonant (or even +# other elements of a syllable) instead of occurring in a +# discrete location. +# 4. Matra display may be contextually determined. This is +# notable, for example, in the Tamil script, where the shape +# and placement of -u and -uu vowels depends strongly on +# which consonant they adjoin. +# +# Format: +# Field 0 Code Point or Code Point Range +# Field 1 Indic_Matra_Category +# +# A comment field shows General_Category property values and character names. 
+# +# The scripts assessed as containing dependent vowels or viramas in the +# structural sense used for the Indic_Matra_Category are: +# +# Devanagari, Bengali, Gurmukhi, Gujarati, Oriya, Tamil, Telugu, +# Kannada, Malayalam, Sinhala, Thai, Lao, Tibetan, Myanmar, +# Tagalog, Hanunoo, Buhid, Tagbanwa, Khmer, Limbu, New Tai Lue, +# Buginese, Tai Tham, Balinese, Sundanese, Batak, Lepcha, +# Syloti Nagri, Saurashtra, Rejang, Javanese, Cham, Tai Viet, +# Meetei Mayek, Karoshthi, Brahmi, Kaithi +# +# All characters for all other scripts not in that list +# take the default value for this property. +# +# See IndicSyllabicCategory.txt for a slightly more extended +# list of Indic scripts, including those which do not have +# dependent vowel characters. Currently, those additional +# Indic scripts without dependent vowel characters are +# Tai Le, Phags-pa, and Kayah Li. +# + +# ================================================ + +# Property: Indic_Matra_Category +# +# All code points not explicitly listed for Indic_Matra_Category +# have the value NA (Not_Applicable). +# +# @missing: 0000..10FFFF; NA + +# Only Indic dependent vowels (Indic_Syllabic_Category=Vowel_Dependent) +# and viramas (Indic_Syllabic_Category=Virama) +# have a non-default value for this property. 
+ +# ------------------------------------------------ + +# Indic_Matra_Category=Right + +093B ; Right # Mc DEVANAGARI VOWEL SIGN OOE +093E ; Right # Mc DEVANAGARI VOWEL SIGN AA +0940 ; Right # Mc DEVANAGARI VOWEL SIGN II +0949..094C ; Right # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094F ; Right # Mc DEVANAGARI VOWEL SIGN AW +09BE ; Right # Mc BENGALI VOWEL SIGN AA +09C0 ; Right # Mc BENGALI VOWEL SIGN II +09D7 ; Right # Mc BENGALI AU LENGTH MARK +0A3E ; Right # Mc GURMUKHI VOWEL SIGN AA +0A40 ; Right # Mc GURMUKHI VOWEL SIGN II +0ABE ; Right # Mc GUJARATI VOWEL SIGN AA +0AC0 ; Right # Mc GUJARATI VOWEL SIGN II +0ACB..0ACC ; Right # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0B3E ; Right # Mc ORIYA VOWEL SIGN AA +0B40 ; Right # Mc ORIYA VOWEL SIGN II +0BBE..0BBF ; Right # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BD7 ; Right # Mc TAMIL AU LENGTH MARK +0C41..0C44 ; Right # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0CBE ; Right # Mc KANNADA VOWEL SIGN AA +0CC1..0CC4 ; Right # Mc [4] KANNADA VOWEL SIGN U..KANNADA VOWEL SIGN VOCALIC RR +0CD5..0CD6 ; Right # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0D3E..0D40 ; Right # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D42 ; Right # Mn [2] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN UU +# Note: U and UU form complex ligatures with consonants in older Malayalam orthography +0D57 ; Right # Mc MALAYALAM AU LENGTH MARK +0DCF..0DD1 ; Right # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD8 ; Right # Mc SINHALA VOWEL SIGN GAETTA-PILLA +0DDF ; Right # Mc SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Right # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Right # Lo THAI CHARACTER SARA A +0E32..0E33 ; Right # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E45 ; Right # Lo THAI CHARACTER LAKKHANGYAO +0EB0 ; Right # Lo LAO VOWEL SIGN A +0EB2..0EB3 ; Right # Lo [2] LAO 
VOWEL SIGN AA..LAO VOWEL SIGN AM +102B..102C ; Right # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +1056..1057 ; Right # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1062 ; Right # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Right # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1083 ; Right # Mc MYANMAR VOWEL SIGN SHAN AA +109C ; Right # Mc MYANMAR VOWEL SIGN AITON A +17B6 ; Right # Mc KHMER VOWEL SIGN AA +17C8 ; Right # Mc KHMER SIGN YUUKALEAPINTU +1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI +19B0..19B4 ; Right # Mc [5] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN UU +19B8..19B9 ; Right # Mc [2] NEW TAI LUE VOWEL SIGN OA..NEW TAI LUE VOWEL SIGN UE +19BB..19C0 ; Right # Mc [6] NEW TAI LUE VOWEL SIGN AAY..NEW TAI LUE VOWEL SIGN IY +1A1A ; Right # Mc BUGINESE VOWEL SIGN O +1A61 ; Right # Mc TAI THAM VOWEL SIGN A +1A63..1A64 ; Right # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A6D ; Right # Mc TAI THAM VOWEL SIGN OY +1B35 ; Right # Mc BALINESE VOWEL SIGN TEDUNG +1B44 ; Right # Mc BALINESE ADEG ADEG +1BA7 ; Right # Mc SUNDANESE VOWEL SIGN PANOLONG +1BAA ; Right # Mc SUNDANESE SIGN PAMAAEH +1BF2..1BF3 ; Right # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +1C26 ; Right # Mc LEPCHA VOWEL SIGN AA +1C2A..1C2B ; Right # Mc [2] LEPCHA VOWEL SIGN U..LEPCHA VOWEL SIGN UU +A823..A824 ; Right # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A827 ; Right # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Right # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A953 ; Right # Mc REJANG VIRAMA +A9B4..A9B5 ; Right # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +AAB1 ; Right # Lo TAI VIET VOWEL AA +AABA ; Right # Lo TAI VIET VOWEL UA +AABD ; Right # Lo TAI VIET VOWEL AN +ABE3..ABE4 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE6..ABE7 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN 
YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE9..ABEA ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +110B0 ; Right # Mc KAITHI VOWEL SIGN AA +110B2 ; Right # Mc KAITHI VOWEL SIGN II +110B7..110B8 ; Right # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU + +# Indic_Matra_Category=Left + +093F ; Left # Mc DEVANAGARI VOWEL SIGN I +094E ; Left # Mc DEVANAGARI VOWEL SIGN PRISHTHAMATRA E +09BF ; Left # Mc BENGALI VOWEL SIGN I +09C7..09C8 ; Left # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +0A3F ; Left # Mc GURMUKHI VOWEL SIGN I +0ABF ; Left # Mc GUJARATI VOWEL SIGN I +0B47 ; Left # Mc ORIYA VOWEL SIGN E +0BC6..0BC8 ; Left # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0D46..0D48 ; Left # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0DD9 ; Left # Mc SINHALA VOWEL SIGN KOMBUVA +0DDB ; Left # Mc SINHALA VOWEL SIGN KOMBU DEKA +1031 ; Left # Mc MYANMAR VOWEL SIGN E +1084 ; Left # Mc MYANMAR VOWEL SIGN SHAN E +17C1..17C3 ; Left # Mc [3] KHMER VOWEL SIGN E..KHMER VOWEL SIGN AI +19B5..19B7 ; Left # Mc [3] NEW TAI LUE VOWEL SIGN E..NEW TAI LUE VOWEL SIGN O +19BA ; Left # Mc NEW TAI LUE VOWEL SIGN AY +1A19 ; Left # Mc BUGINESE VOWEL SIGN E +1A1B ; Left # Mc BUGINESE VOWEL SIGN AE +1A6E..1A72 ; Left # Mc [5] TAI THAM VOWEL SIGN E..TAI THAM VOWEL SIGN THAM AI +1B3E..1B3F ; Left # Mc [2] BALINESE VOWEL SIGN TALING..BALINESE VOWEL SIGN TALING REPA +1BA6 ; Left # Mc SUNDANESE VOWEL SIGN PANAELAENG +1C27..1C28 ; Left # Mc [2] LEPCHA VOWEL SIGN I..LEPCHA VOWEL SIGN O +A9BA..A9BB ; Left # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +AA2F..AA30 ; Left # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +110B1 ; Left # Mc KAITHI VOWEL SIGN I + +# Indic_Matra_Category=Visual_Order_Left + +# These are dependent vowels that occur to the left of the consonant +# letter in a syllable, but which occur in scripts using the visual order +# model, instead of the logical order model. 
Because of the different +# model, these left-side vowels occur first in the backing store (before +# the consonant letter) and are not reordered during text rendering. +# +# [Derivation: Logical_Order_Exception=True] + +0E40..0E44 ; Visual_Order_Left # Lo [5] THAI CHARACTER SARA E..THAI CHARACTER SARA AI MAIMALAI +0EC0..0EC4 ; Visual_Order_Left # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +AAB5..AAB6 ; Visual_Order_Left # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB9 ; Visual_Order_Left # Lo TAI VIET VOWEL UEA +AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL AY + +# Indic_Matra_Category=Left_And_Right + +09CB..09CC ; Left_And_Right # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +0B4B ; Left_And_Right # Mc ORIYA VOWEL SIGN O +0BCA..0BCC ; Left_And_Right # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0D4A..0D4C ; Left_And_Right # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0DDC..0DDE ; Left_And_Right # Mc [3] SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA..SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA +17C0 ; Left_And_Right # Mc KHMER VOWEL SIGN IE +17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU +1B40..1B41 ; Left_And_Right # Mc [2] BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG + +# Indic_Matra_Category=Top + +093A ; Top # Mn DEVANAGARI VOWEL SIGN OE +0945..0948 ; Top # Mn [4] DEVANAGARI VOWEL SIGN CANDRA E..DEVANAGARI VOWEL SIGN AI +0955 ; Top # Mn DEVANAGARI VOWEL SIGN CANDRA LONG E +0A47..0A48 ; Top # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Top # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0AC5 ; Top # Mn GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Top # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0B3F ; Top # Mn ORIYA VOWEL SIGN I +0B56 ; Top # Mn ORIYA AI LENGTH MARK +0BC0 ; Top # Mn TAMIL VOWEL SIGN II +0BCD ; Top # Mn TAMIL SIGN VIRAMA +0C3E..0C40 ; Top # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II 
+0C46..0C47 ; Top # Mn [2] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN EE +0C4A..0C4C ; Top # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C4D ; Top # Mn TELUGU SIGN VIRAMA +0C55 ; Top # Mn TELUGU LENGTH MARK +0CBF ; Top # Mn KANNADA VOWEL SIGN I +0CC6 ; Top # Mn KANNADA VOWEL SIGN E +0CCC ; Top # Mn KANNADA VOWEL SIGN AU +0CCD ; Top # Mn KANNADA SIGN VIRAMA +0D4D ; Top # Mn MALAYALAM SIGN VIRAMA +0DCA ; Top # Mn SINHALA SIGN AL-LAKUNA +0DD2..0DD3 ; Top # Mn [2] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN DIGA IS-PILLA +0E31 ; Top # Mn THAI CHARACTER MAI HAN-AKAT +0E34..0E37 ; Top # Mn [4] THAI CHARACTER SARA I..THAI CHARACTER SARA UEE +0E47 ; Top # Mn THAI CHARACTER MAITAIKHU +0E4E ; Top # Mn THAI CHARACTER YAMAKKAN +0EB1 ; Top # Mn LAO VOWEL SIGN MAI KAN +0EB4..0EB7 ; Top # Mn [4] LAO VOWEL SIGN I..LAO VOWEL SIGN YY +0EBB ; Top # Mn LAO VOWEL SIGN MAI KON +0F72 ; Top # Mn TIBETAN VOWEL SIGN I +0F7A..0F7D ; Top # Mn [4] TIBETAN VOWEL SIGN E..TIBETAN VOWEL SIGN OO +0F80 ; Top # Mn TIBETAN VOWEL SIGN REVERSED I +102D..102E ; Top # Mn [2] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN II +1032..1035 ; Top # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +103A ; Top # Mn MYANMAR SIGN ASAT +1071..1074 ; Top # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1085..1086 ; Top # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109D ; Top # Mn MYANMAR VOWEL SIGN AITON AI +1712 ; Top # Mn TAGALOG VOWEL SIGN I +1732 ; Top # Mn HANUNOO VOWEL SIGN I +1752 ; Top # Mn BUHID VOWEL SIGN I +1772 ; Top # Mn TAGBANWA VOWEL SIGN I +17B7..17BA ; Top # Mn [4] KHMER VOWEL SIGN I..KHMER VOWEL SIGN YY +17D1 ; Top # Mn KHMER SIGN VIRIAM +1920..1921 ; Top # Mn [2] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN I +1927..1928 ; Top # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +1A17 ; Top # Mn BUGINESE VOWEL SIGN I +1A62 ; Top # Mn TAI THAM VOWEL SIGN MAI SAT +1A65..1A68 ; Top # Mn [4] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN UUE +1A6B ; Top 
# Mn TAI THAM VOWEL SIGN O +1A73..1A74 ; Top # Mn [2] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN MAI KANG +1B36..1B37 ; Top # Mn [2] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN ULU SARI +1B42 ; Top # Mn BALINESE VOWEL SIGN PEPET +1BA4 ; Top # Mn SUNDANESE VOWEL SIGN PANGHULU +1BA8..1BA9 ; Top # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +A806 ; Top # Mn SYLOTI NAGRI SIGN HASANTA +A826 ; Top # Mn SYLOTI NAGRI VOWEL SIGN E +A94A ; Top # Mn REJANG VOWEL SIGN AI +A9B6..A9B7 ; Top # Mn [2] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN WULU MELIK +A9BC ; Top # Mn JAVANESE VOWEL SIGN PEPET +AA29..AA2C ; Top # Mn [4] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN EI +AA2E ; Top # Mn CHAM VOWEL SIGN OE +AA31 ; Top # Mn CHAM VOWEL SIGN AU +AAB0 ; Top # Mn TAI VIET MAI KANG +AAB2..AAB3 ; Top # Mn [2] TAI VIET VOWEL I..TAI VIET VOWEL UE +AAB7..AAB8 ; Top # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AABE ; Top # Mn TAI VIET VOWEL AM +ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP +10A05 ; Top # Mn KHAROSHTHI VOWEL SIGN E +11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II +11042..11045 ; Top # Mn [4] BRAHMI VOWEL SIGN E..BRAHMI VOWEL SIGN AU +11046 ; Top # Mn BRAHMI VIRAMA +110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI VOWEL SIGN AI + +# Indic_Matra_Category=Bottom + +0941..0944 ; Bottom # Mn [4] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN VOCALIC RR +094D ; Bottom # Mn DEVANAGARI SIGN VIRAMA +0956..0957 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN UE..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09C1..09C4 ; Bottom # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09CD ; Bottom # Mn BENGALI SIGN VIRAMA +09E2..09E3 ; Bottom # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A41..0A42 ; Bottom # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A4D ; Bottom # Mn GURMUKHI SIGN VIRAMA +0AC1..0AC4 ; Bottom # Mn [4] GUJARATI 
VOWEL SIGN U..GUJARATI VOWEL SIGN VOCALIC RR +0ACD ; Bottom # Mn GUJARATI SIGN VIRAMA +0AE2..0AE3 ; Bottom # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B4D ; Bottom # Mn ORIYA SIGN VIRAMA +0B62..0B63 ; Bottom # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BC1..0BC2 ; Bottom # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +# Note: U and UU have contextually variable placement in Tamil. +0C56 ; Bottom # Mn TELUGU AI LENGTH MARK +0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CE2..0CE3 ; Bottom # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D43..0D44 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC R..MALAYALAM VOWEL SIGN VOCALIC RR +0D62..0D63 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DD4 ; Bottom # Mn SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Bottom # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0E38..0E39 ; Bottom # Mn [2] THAI CHARACTER SARA U..THAI CHARACTER SARA UU +0E3A ; Bottom # Mn THAI CHARACTER PHINTHU +0EB8..0EB9 ; Bottom # Mn [2] LAO VOWEL SIGN U..LAO VOWEL SIGN UU +0F71 ; Bottom # Mn TIBETAN VOWEL SIGN AA +0F74..0F75 ; Bottom # Mn [2] TIBETAN VOWEL SIGN U..TIBETAN VOWEL SIGN UU +0F84 ; Bottom # Mn TIBETAN MARK HALANTA +102F..1030 ; Bottom # Mn [2] MYANMAR VOWEL SIGN U..MYANMAR VOWEL SIGN UU +1058..1059 ; Bottom # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1713 ; Bottom # Mn TAGALOG VOWEL SIGN U +1714 ; Bottom # Mn TAGALOG SIGN VIRAMA +1733 ; Bottom # Mn HANUNOO VOWEL SIGN U +1734 ; Bottom # Mn HANUNOO SIGN PAMUDPOD +1753 ; Bottom # Mn BUHID VOWEL SIGN U +1773 ; Bottom # Mn TAGBANWA VOWEL SIGN U +17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA +1922 ; Bottom # Mn LIMBU VOWEL SIGN U +1A18 ; Bottom # Mn BUGINESE VOWEL SIGN U +1A69..1A6A ; Bottom # Mn [2] TAI THAM VOWEL SIGN U..TAI THAM 
VOWEL SIGN UU +1A6C ; Bottom # Mn TAI THAM VOWEL SIGN OA BELOW +1B38..1B3A ; Bottom # Mn [3] BALINESE VOWEL SIGN SUKU..BALINESE VOWEL SIGN RA REPA +1BA5 ; Bottom # Mn SUNDANESE VOWEL SIGN PANYUKU +1C2C ; Bottom # Mn LEPCHA VOWEL SIGN E +A825 ; Bottom # Mn SYLOTI NAGRI VOWEL SIGN U +A8C4 ; Bottom # Mn SAURASHTRA SIGN VIRAMA +A947..A949 ; Bottom # Mn [3] REJANG VOWEL SIGN I..REJANG VOWEL SIGN E +A94B..A94E ; Bottom # Mn [4] REJANG VOWEL SIGN O..REJANG VOWEL SIGN EA +A9B8..A9B9 ; Bottom # Mn [2] JAVANESE VOWEL SIGN SUKU..JAVANESE VOWEL SIGN SUKU MENDUT +AA2D ; Bottom # Mn CHAM VOWEL SIGN U +AA32 ; Bottom # Mn CHAM VOWEL SIGN UE +AAB4 ; Bottom # Mn TAI VIET VOWEL U +ABE8 ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK +10A02..10A03 ; Bottom # Mn [2] KHAROSHTHI VOWEL SIGN U..KHAROSHTHI VOWEL SIGN VOCALIC R +10A0C ; Bottom # Mn KHAROSHTHI VOWEL LENGTH MARK +1103C..11041 ; Bottom # Mn [6] BRAHMI VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL +110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU +110B9 ; Bottom # Mn KAITHI SIGN VIRAMA + +# Indic_Matra_Category=Top_And_Bottom + +0C48 ; Top_And_Bottom # Mn TELUGU VOWEL SIGN AI +0F73 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN II +0F76..0F79 ; Top_And_Bottom # Mn [4] TIBETAN VOWEL SIGN VOCALIC R..TIBETAN VOWEL SIGN VOCALIC LL +0F81 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN REVERSED II +1B3C ; Top_And_Bottom # Mn BALINESE VOWEL SIGN LA LENGA + +# Indic_Matra_Category=Top_And_Right + +0AC9 ; Top_And_Right # Mc GUJARATI VOWEL SIGN CANDRA O +0B57 ; Top_And_Right # Mc ORIYA AU LENGTH MARK +0CC0 ; Top_And_Right # Mc KANNADA VOWEL SIGN II +0CC7..0CC8 ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +1925..1926 ; Top_And_Right # Mc [2] LIMBU VOWEL SIGN OO..LIMBU VOWEL SIGN AU +1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG + +# Indic_Matra_Category=Top_And_Left + +0B48 ; 
Top_And_Left # Mc ORIYA VOWEL SIGN AI +0DDA ; Top_And_Left # Mc SINHALA VOWEL SIGN DIGA KOMBUVA +17BE ; Top_And_Left # Mc KHMER VOWEL SIGN OE +1C29 ; Top_And_Left # Mc LEPCHA VOWEL SIGN OO + +# Indic_Matra_Category=Top_And_Left_And_Right + +0B4C ; Top_And_Left_And_Right # Mc ORIYA VOWEL SIGN AU +17BF ; Top_And_Left_And_Right # Mc KHMER VOWEL SIGN YA + +# Indic_Matra_Category=Bottom_And_Right + +1B3B ; Bottom_And_Right # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +A9C0 ; Bottom_And_Right # Mc JAVANESE PANGKON + +# Indic_Matra_Category=Top_And_Bottom_And_Right + +1B3D ; Top_And_Bottom_And_Right # Mc BALINESE VOWEL SIGN LA LENGA TEDUNG + +# Indic_Matra_Category=Overstruck + +10A01 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN I +10A06 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN O + +# Indic_Matra_Category=Invisible + +# The Invisible category refers to viramas for certain script +# which are used only to control consonant stacking or cluster +# formation, and which have no visible display on their own. + +1039 ; Invisible # Mn MYANMAR SIGN VIRAMA +17D2 ; Invisible # Mn KHMER SIGN COENG +1A60 ; Invisible # Mn TAI THAM SIGN SAKOT +10A3F ; Invisible # Mn KHAROSHTHI VIRAMA + +# EOF diff --git a/data/6.0.0-indic-syllabic-category.txt b/data/6.0.0-indic-syllabic-category.txt new file mode 100644 index 0000000..674c4de --- /dev/null +++ b/data/6.0.0-indic-syllabic-category.txt @@ -0,0 +1,757 @@ +# IndicSyllabicCategory-6.0.0.txt +# Date: 2010-05-25, 11:45:00 PDT [KW] +# +# Unicode Character Database +# Copyright (c) 1991-2010 Unicode, Inc. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# For documentation, see UAX #44. +# +# This file defines the following provisional property: +# +# Indic_Syllabic_Category enumerated property +# +# NB: Provisional properties and data files have no associated stability +# guarantees. 
They are provided in part to determine the possible usefulness +# of a property or other data and to encourage analysis and further investigation +# which may result in their improvement. Provisional properties and +# data files may change arbitrarily, or may even be removed in a future version of the +# Unicode Character Database, if they prove not to be useful. +# +# Scope: This provisional property is aimed at two general problem +# areas involving the analysis and processing of Indic scripts: +# +# 1. Specification of syllabic structure. +# 2. Specification of segmentation rules. +# +# Both of these problem areas may benefit from having defined subtypes +# of Indic script characters which are relevant to how Indic +# syllables (or aksaras) are constructed. Note that rules for +# syllabic structure in Indic scripts may differ significantly +# from how phonological syllables are defined. +# +# Format: +# Field 0 Code Point or Code Point Range +# Field 1 Indic_Syllabic_Category +# +# A comment field shows General_Category property values and character names. +# +# The scripts assessed as Indic in the +# structural sense used for the Indic_Syllabic_Category are: +# +# Devanagari, Bengali, Gurmukhi, Gujarati, Oriya, Tamil, Telugu, +# Kannada, Malayalam, Sinhala, Thai, Lao, Tibetan, Myanmar, +# Tagalog, Hanunoo, Buhid, Tagbanwa, Khmer, Limbu, Tai Le, New Tai Lue, +# Buginese, Tai Tham, Balinese, Sundanese, Batak, Lepcha, +# Syloti Nagri, Phags-Pa, Saurashtra, Kayah Li, Rejang, Javanese, Cham, Tai Viet, +# Meetei Mayek, Karoshthi, Brahmi, Kaithi +# +# All characters for all other scripts not in that list +# take the default value for this property, unless they +# are individually listed in this data file. +# + +# ================================================ + +# Property: Indic_Syllabic_Category +# +# All code points not explicitly listed for Indic_Syllabic_Category +# have the value Other. 
+# +# @missing: 0000..10FFFF; Other + +# ================================================ + +# Indic_Syllabic_Category=Bindu + +# Bindu/Anusvara (nasalization or -n) +# Excludes various Vedic nasalization signs. + +# [Not derivable] + +0900..0902 ; Bindu # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +0981 ; Bindu # Mn BENGALI SIGN CANDRABINDU +0982 ; Bindu # Mc BENGALI SIGN ANUSVARA +0A01..0A02 ; Bindu # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A70 ; Bindu # Mn GURMUKHI TIPPI +0A81..0A82 ; Bindu # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0B01 ; Bindu # Mn ORIYA SIGN CANDRABINDU +0B02 ; Bindu # Mc ORIYA SIGN ANUSVARA +0B82 ; Bindu # Mn TAMIL SIGN ANUSVARA +0C01..0C02 ; Bindu # Mc [2] TELUGU SIGN CANDRABINDU..TELUGU SIGN ANUSVARA +0C82 ; Bindu # Mc KANNADA SIGN ANUSVARA +0D02 ; Bindu # Mc MALAYALAM SIGN ANUSVARA +0D82 ; Bindu # Mc SINHALA SIGN ANUSVARAYA +0E4D ; Bindu # Mn THAI CHARACTER NIKHAHIT +0ECD ; Bindu # Mn LAO NIGGAHITA +0F7E ; Bindu # Mn TIBETAN SIGN RJES SU NGA RO +0F82..0F83 ; Bindu # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +1036 ; Bindu # Mn MYANMAR SIGN ANUSVARA +17C6 ; Bindu # Mn KHMER SIGN NIKAHIT +1932 ; Bindu # Mn LIMBU SMALL LETTER ANUSVARA +1B00..1B02 ; Bindu # Mn [3] BALINESE SIGN ULU RICEM..BALINESE SIGN CECEK +A80B ; Bindu # Mn SYLOTI NAGRI SIGN ANUSVARA +A873 ; Bindu # Lo PHAGS-PA LETTER CANDRABINDU +A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK +1B80 ; Bindu # Mn SUNDANESE SIGN PANYECEK +1C34..1C35 ; Bindu # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A880 ; Bindu # Mc SAURASHTRA SIGN ANUSVARA +10A0E ; Bindu # Mn KHAROSHTHI SIGN ANUSVARA +11000 ; Bindu # Mc BRAHMI SIGN CANDRABINDU +11001 ; Bindu # Mn BRAHMI SIGN ANUSVARA +11080..11081 ; Bindu # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA + +# ================================================ + +# Indic_Syllabic_Category=Visarga + +# Visarga (-h) + +# [Not 
derivable] + +0903 ; Visarga # Mc DEVANAGARI SIGN VISARGA +0983 ; Visarga # Mc BENGALI SIGN VISARGA +0A03 ; Visarga # Mc GURMUKHI SIGN VISARGA +0A83 ; Visarga # Mc GUJARATI SIGN VISARGA +0B03 ; Visarga # Mc ORIYA SIGN VISARGA +0C03 ; Visarga # Mc TELUGU SIGN VISARGA +0C83 ; Visarga # Mc KANNADA SIGN VISARGA +0D03 ; Visarga # Mc MALAYALAM SIGN VISARGA +0D83 ; Visarga # Mc SINHALA SIGN VISARGAYA +0F7F ; Visarga # Mc TIBETAN SIGN RNAM BCAD +1038 ; Visarga # Mc MYANMAR SIGN VISARGA +17C7 ; Visarga # Mc KHMER SIGN REAHMUK +1B04 ; Visarga # Mc BALINESE SIGN BISAH +1B82 ; Visarga # Mc SUNDANESE SIGN PANGWISAD +A881 ; Visarga # Mc SAURASHTRA SIGN VISARGA +A983 ; Visarga # Mc JAVANESE SIGN WIGNYAN +10A0F ; Visarga # Mn KHAROSHTHI SIGN VISARGA +11002 ; Visarga # Mc BRAHMI SIGN VISARGA +11082 ; Visarga # Mc KAITHI SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Avagraha + +# Avagraha (elision of initial a- in sandhi) + +# [Not derivable] + +093D ; Avagraha # Lo DEVANAGARI SIGN AVAGRAHA +09BD ; Avagraha # Lo BENGALI SIGN AVAGRAHA +0ABD ; Avagraha # Lo GUJARATI SIGN AVAGRAHA +0B3D ; Avagraha # Lo ORIYA SIGN AVAGRAHA +0C3D ; Avagraha # Lo TELUGU SIGN AVAGRAHA +0CBD ; Avagraha # Lo KANNADA SIGN AVAGRAHA +0D3D ; Avagraha # Lo MALAYALAM SIGN AVAGRAHA +0F85 ; Avagraha # Po TIBETAN MARK PALUTA +17DC ; Avagraha # Lo KHMER SIGN AVAKRAHASANYA + +# ================================================ + +# Indic_Syllabic_Category=Nukta + +# Nukta (diacritic for borrowed consonants) + +# [Derivation: (ccc=7) - 1037] + +093C ; Nukta # Mn DEVANAGARI SIGN NUKTA +09BC ; Nukta # Mn BENGALI SIGN NUKTA +0A3C ; Nukta # Mn GURMUKHI SIGN NUKTA +0ABC ; Nukta # Mn GUJARATI SIGN NUKTA +0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0CBC ; Nukta # Mn KANNADA SIGN NUKTA +1B34 ; Nukta # Mn BALINESE SIGN REREKAN +1BE6 ; Nukta # Mn BATAK SIGN TOMPI +1C37 ; Nukta # Mn LEPCHA SIGN NUKTA +A9B3 ; Nukta # Mn JAVANESE SIGN CECAK TELU +110BA ; Nukta # Mn KAITHI SIGN NUKTA + +# 
================================================ + +# Indic_Syllabic_Category=Virama + +# Virama (killing of inherent vowel in consonant sequence, +# or consonant stacker, depending on model) +# Also includes pure killers. + +# [Derivation: (ccc=9) + 0E4E + 17D1] + +094D ; Virama # Mn DEVANAGARI SIGN VIRAMA +09CD ; Virama # Mn BENGALI SIGN VIRAMA +0A4D ; Virama # Mn GURMUKHI SIGN VIRAMA +0ACD ; Virama # Mn GUJARATI SIGN VIRAMA +0B4D ; Virama # Mn ORIYA SIGN VIRAMA +0BCD ; Virama # Mn TAMIL SIGN VIRAMA +0C4D ; Virama # Mn TELUGU SIGN VIRAMA +0CCD ; Virama # Mn KANNADA SIGN VIRAMA +0D4D ; Virama # Mn MALAYALAM SIGN VIRAMA +0DCA ; Virama # Mn SINHALA SIGN AL-LAKUNA +0E3A ; Virama # Mn THAI CHARACTER PHINTHU +0E4E ; Virama # Mn THAI CHARACTER YAMAKKAN +0F84 ; Virama # Mn TIBETAN MARK HALANTA +1039..103A ; Virama # Mn [2] MYANMAR SIGN VIRAMA..MYANMAR SIGN ASAT +1714 ; Virama # Mn TAGALOG SIGN VIRAMA +1734 ; Virama # Mn HANUNOO SIGN PAMUDPOD +17D1..17D2 ; Virama # Mn [2] KHMER SIGN VIRIAM..KHMER SIGN COENG +1A60 ; Virama # Mn TAI THAM SIGN SAKOT +1B44 ; Virama # Mc BALINESE ADEG ADEG +1BAA ; Virama # Mc SUNDANESE SIGN PAMAAEH +1BF2..1BF3 ; Virama # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +A806 ; Virama # Mn SYLOTI NAGRI SIGN HASANTA +A8C4 ; Virama # Mn SAURASHTRA SIGN VIRAMA +A953 ; Virama # Mc REJANG VIRAMA +A9C0 ; Virama # Mc JAVANESE PANGKON +ABED ; Virama # Mn MEETEI MAYEK APUN IYEK +10A3F ; Virama # Mn KHAROSHTHI VIRAMA +11046 ; Virama # Mn BRAHMI VIRAMA +110B9 ; Virama # Mn KAITHI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Independent + +# Independent Vowels (contrasted with matras) + +# [Not derivable] + +0904..0914 ; Vowel_Independent # Lo [17] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER AU +0960..0961 ; Vowel_Independent # Lo [2] DEVANAGARI LETTER VOCALIC RR..DEVANAGARI LETTER VOCALIC LL +0972..0977 ; Vowel_Independent # Lo [6] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER UUE +0985..098C ; 
Vowel_Independent # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L +098F..0990 ; Vowel_Independent # Lo [2] BENGALI LETTER E..BENGALI LETTER AI +0993..0994 ; Vowel_Independent # Lo [2] BENGALI LETTER O..BENGALI LETTER AU +09E0..09E1 ; Vowel_Independent # Lo [2] BENGALI LETTER VOCALIC RR..BENGALI LETTER VOCALIC LL +0A05..0A0A ; Vowel_Independent # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU +0A0F..0A10 ; Vowel_Independent # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI +0A13..0A14 ; Vowel_Independent # Lo [2] GURMUKHI LETTER OO..GURMUKHI LETTER AU +0A85..0A8D ; Vowel_Independent # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E +0A8F..0A91 ; Vowel_Independent # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O +0A93..0A94 ; Vowel_Independent # Lo [2] GUJARATI LETTER O..GUJARATI LETTER AU +0AE0..0AE1 ; Vowel_Independent # Lo [2] GUJARATI LETTER VOCALIC RR..GUJARATI LETTER VOCALIC LL +0B05..0B0C ; Vowel_Independent # Lo [8] ORIYA LETTER A..ORIYA LETTER VOCALIC L +0B0F..0B10 ; Vowel_Independent # Lo [2] ORIYA LETTER E..ORIYA LETTER AI +0B13..0B14 ; Vowel_Independent # Lo [2] ORIYA LETTER O..ORIYA LETTER AU +0B60..0B61 ; Vowel_Independent # Lo [2] ORIYA LETTER VOCALIC RR..ORIYA LETTER VOCALIC LL +0B85..0B8A ; Vowel_Independent # Lo [6] TAMIL LETTER A..TAMIL LETTER UU +0B8E..0B90 ; Vowel_Independent # Lo [3] TAMIL LETTER E..TAMIL LETTER AI +0B92..0B94 ; Vowel_Independent # Lo [3] TAMIL LETTER O..TAMIL LETTER AU +0C05..0C0C ; Vowel_Independent # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L +0C0E..0C10 ; Vowel_Independent # Lo [3] TELUGU LETTER E..TELUGU LETTER AI +0C12..0C14 ; Vowel_Independent # Lo [3] TELUGU LETTER O..TELUGU LETTER AU +0C60..0C61 ; Vowel_Independent # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL +0C85..0C8C ; Vowel_Independent # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L +0C8E..0C90 ; Vowel_Independent # Lo [3] KANNADA LETTER E..KANNADA LETTER AI +0C92..0C94 ; Vowel_Independent # Lo [3] KANNADA LETTER O..KANNADA LETTER AU 
+0CE0..0CE1 ; Vowel_Independent # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL +0D05..0D0C ; Vowel_Independent # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L +0D0E..0D10 ; Vowel_Independent # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI +0D12..0D14 ; Vowel_Independent # Lo [3] MALAYALAM LETTER O..MALAYALAM LETTER AU +0D60..0D61 ; Vowel_Independent # Lo [2] MALAYALAM LETTER VOCALIC RR..MALAYALAM LETTER VOCALIC LL +0D85..0D96 ; Vowel_Independent # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA +1021..102A ; Vowel_Independent # Lo [10] MYANMAR LETTER A..MYANMAR LETTER AU +1052..1055 ; Vowel_Independent # Lo [4] MYANMAR LETTER VOCALIC R..MYANMAR LETTER VOCALIC LL +1700..1702 ; Vowel_Independent # Lo [3] TAGALOG LETTER A..TAGALOG LETTER U +1720..1722 ; Vowel_Independent # Lo [3] HANUNOO LETTER A..HANUNOO LETTER U +1740..1742 ; Vowel_Independent # Lo [3] BUHID LETTER A..BUHID LETTER U +1760..1762 ; Vowel_Independent # Lo [3] TAGBANWA LETTER A..TAGBANWA LETTER U +17A3..17B3 ; Vowel_Independent # Lo [17] KHMER INDEPENDENT VOWEL QAQ..KHMER INDEPENDENT VOWEL QAU +1A4D..1A52 ; Vowel_Independent # Lo [6] TAI THAM LETTER I..TAI THAM LETTER OO +1B05..1B12 ; Vowel_Independent # Lo [14] BALINESE LETTER AKARA..BALINESE LETTER OKARA TEDUNG +1B83..1B89 ; Vowel_Independent # Lo [7] SUNDANESE LETTER A..SUNDANESE LETTER EU +1BE4..1BE5 ; Vowel_Independent # Lo [2] BATAK LETTER I..BATAK LETTER U +A800..A801 ; Vowel_Independent # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I +A803..A805 ; Vowel_Independent # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O +A882..A891 ; Vowel_Independent # Lo [16] SAURASHTRA LETTER A..SAURASHTRA LETTER AU +A984..A988 ; Vowel_Independent # Lo [5] JAVANESE LETTER A..JAVANESE LETTER U +A98C..A98E ; Vowel_Independent # Lo [3] JAVANESE LETTER E..JAVANESE LETTER O +AA00..AA05 ; Vowel_Independent # Lo [6] CHAM LETTER A..CHAM LETTER O +11005..11012 ; Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU 
+11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER A..KAITHI LETTER AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Dependent + +# Dependent Vowels (contrasted with independent vowels and/or with complex placement) +# Matras (in Indic scripts) + +# [Not derivable] + +093A ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN OE +093B ; Vowel_Dependent # Mc DEVANAGARI VOWEL SIGN OOE +093E..0940 ; Vowel_Dependent # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II +0941..0948 ; Vowel_Dependent # Mn [8] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN AI +0949..094C ; Vowel_Dependent # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094E..094F ; Vowel_Dependent # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA E..DEVANAGARI VOWEL SIGN AW +0955..0957 ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Vowel_Dependent # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BE..09C0 ; Vowel_Dependent # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II +09C1..09C4 ; Vowel_Dependent # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09C7..09C8 ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +09CB..09CC ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +09D7 ; Vowel_Dependent # Mc BENGALI AU LENGTH MARK +09E2..09E3 ; Vowel_Dependent # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3E..0A40 ; Vowel_Dependent # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II +0A41..0A42 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A47..0A48 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0ABE..0AC0 ; Vowel_Dependent # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL SIGN II +0AC1..0AC5 ; Vowel_Dependent # Mn [5] GUJARATI VOWEL SIGN U..GUJARATI 
VOWEL SIGN CANDRA E +0AC7..0AC8 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AC9 ; Vowel_Dependent # Mc GUJARATI VOWEL SIGN CANDRA O +0ACB..0ACC ; Vowel_Dependent # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0AE2..0AE3 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3E ; Vowel_Dependent # Mc ORIYA VOWEL SIGN AA +0B3F ; Vowel_Dependent # Mn ORIYA VOWEL SIGN I +0B40 ; Vowel_Dependent # Mc ORIYA VOWEL SIGN II +0B41..0B44 ; Vowel_Dependent # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B47..0B48 ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI +0B4B..0B4C ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU +0B56 ; Vowel_Dependent # Mn ORIYA AI LENGTH MARK +0B57 ; Vowel_Dependent # Mc ORIYA AU LENGTH MARK +0B62..0B63 ; Vowel_Dependent # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BBE..0BBF ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC0 ; Vowel_Dependent # Mn TAMIL VOWEL SIGN II +0BC1..0BC2 ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BC6..0BC8 ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0BCA..0BCC ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0BD7 ; Vowel_Dependent # Mc TAMIL AU LENGTH MARK +0C3E..0C40 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C41..0C44 ; Vowel_Dependent # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C46..0C48 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI +0C4A..0C4C ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C55..0C56 ; Vowel_Dependent # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK +0C62..0C63 ; Vowel_Dependent # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBE ; Vowel_Dependent # Mc KANNADA VOWEL SIGN AA +0CBF ; Vowel_Dependent # Mn KANNADA VOWEL SIGN I +0CC0..0CC4 ; Vowel_Dependent # Mc 
[5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN VOCALIC RR +0CC6 ; Vowel_Dependent # Mn KANNADA VOWEL SIGN E +0CC7..0CC8 ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +0CCC ; Vowel_Dependent # Mn KANNADA VOWEL SIGN AU +0CD5..0CD6 ; Vowel_Dependent # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CE2..0CE3 ; Vowel_Dependent # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D3E..0D40 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D44 ; Vowel_Dependent # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D46..0D48 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0D4A..0D4C ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0D57 ; Vowel_Dependent # Mc MALAYALAM AU LENGTH MARK +0D62..0D63 ; Vowel_Dependent # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DCF..0DD1 ; Vowel_Dependent # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD2..0DD4 ; Vowel_Dependent # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Vowel_Dependent # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0DD8..0DDF ; Vowel_Dependent # Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Vowel_Dependent # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Vowel_Dependent # Lo THAI CHARACTER SARA A +0E31 ; Vowel_Dependent # Mn THAI CHARACTER MAI HAN-AKAT +0E32..0E33 ; Vowel_Dependent # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E34..0E39 ; Vowel_Dependent # Mn [6] THAI CHARACTER SARA I..THAI CHARACTER SARA UU +0E40..0E45 ; Vowel_Dependent # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO +0E47 ; Vowel_Dependent # Mn THAI CHARACTER MAITAIKHU +0EB0 ; Vowel_Dependent # Lo LAO VOWEL SIGN A +0EB1 ; 
Vowel_Dependent # Mn LAO VOWEL SIGN MAI KAN +0EB2..0EB3 ; Vowel_Dependent # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0EB4..0EB9 ; Vowel_Dependent # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU +0EBB ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KON +0EC0..0EC4 ; Vowel_Dependent # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +0F71..0F7D ; Vowel_Dependent # Mn [13] TIBETAN VOWEL SIGN AA..TIBETAN VOWEL SIGN OO +0F80..0F81 ; Vowel_Dependent # Mn [2] TIBETAN VOWEL SIGN REVERSED I..TIBETAN VOWEL SIGN REVERSED II +102B..102C ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +102D..1030 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN UU +1031 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN E +1032..1035 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +1056..1057 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1058..1059 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1062 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1071..1074 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1083..1084 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E +1085..1086 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109C ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN AITON A +109D ; Vowel_Dependent # Mn MYANMAR VOWEL SIGN AITON AI +1712..1713 ; Vowel_Dependent # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U +1732..1733 ; Vowel_Dependent # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1752..1753 ; Vowel_Dependent # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U +1772..1773 ; Vowel_Dependent # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U +17B6 ; Vowel_Dependent # Mc KHMER VOWEL SIGN AA +17B7..17BD ; 
Vowel_Dependent # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL SIGN UA +17BE..17C5 ; Vowel_Dependent # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU +17C8 ; Vowel_Dependent # Mc KHMER SIGN YUUKALEAPINTU +1920..1922 ; Vowel_Dependent # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U +1923..1926 ; Vowel_Dependent # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU +1927..1928 ; Vowel_Dependent # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +19B0..19C0 ; Vowel_Dependent # Mc [17] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN IY +1A17..1A18 ; Vowel_Dependent # Mn [2] BUGINESE VOWEL SIGN I..BUGINESE VOWEL SIGN U +1A19..1A1B ; Vowel_Dependent # Mc [3] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN AE +1A61 ; Vowel_Dependent # Mc TAI THAM VOWEL SIGN A +1A62 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN MAI SAT +1A63..1A64 ; Vowel_Dependent # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A65..1A6C ; Vowel_Dependent # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW +1A6D..1A72 ; Vowel_Dependent # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI +1A73..1A74 ; Vowel_Dependent # Mn [2] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN MAI KANG +1B35 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN TEDUNG +1B36..1B3A ; Vowel_Dependent # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA +1B3B ; Vowel_Dependent # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +1B3C ; Vowel_Dependent # Mn BALINESE VOWEL SIGN LA LENGA +1B3D..1B41 ; Vowel_Dependent # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1B42 ; Vowel_Dependent # Mn BALINESE VOWEL SIGN PEPET +1B43 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN PEPET TEDUNG +1BA4..1BA5 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PANGHULU..SUNDANESE VOWEL SIGN PANYUKU +1BA6..1BA7 ; Vowel_Dependent # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL SIGN PANOLONG +1BA8..1BA9 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE7 ; 
Vowel_Dependent # Mc BATAK VOWEL SIGN E +1BE8..1BE9 ; Vowel_Dependent # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BEA..1BEC ; Vowel_Dependent # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BED ; Vowel_Dependent # Mn BATAK VOWEL SIGN KARO O +1BEE ; Vowel_Dependent # Mc BATAK VOWEL SIGN U +1BEF ; Vowel_Dependent # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +1C26..1C2B ; Vowel_Dependent # Mc [6] LEPCHA VOWEL SIGN AA..LEPCHA VOWEL SIGN UU +1C2C ; Vowel_Dependent # Mn LEPCHA VOWEL SIGN E +A823..A824 ; Vowel_Dependent # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A825..A826 ; Vowel_Dependent # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E +A827 ; Vowel_Dependent # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Vowel_Dependent # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A947..A94E ; Vowel_Dependent # Mn [8] REJANG VOWEL SIGN I..REJANG VOWEL SIGN EA +A9B4..A9B5 ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9B6..A9B9 ; Vowel_Dependent # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BA..A9BB ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +A9BC ; Vowel_Dependent # Mn JAVANESE VOWEL SIGN PEPET +AA29..AA2E ; Vowel_Dependent # Mn [6] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN OE +AA2F..AA30 ; Vowel_Dependent # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA31..AA32 ; Vowel_Dependent # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE +AAB0 ; Vowel_Dependent # Mn TAI VIET MAI KANG +AAB1 ; Vowel_Dependent # Lo TAI VIET VOWEL AA +AAB2..AAB4 ; Vowel_Dependent # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U +AAB5..AAB6 ; Vowel_Dependent # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB7..AAB8 ; Vowel_Dependent # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AAB9..AABD ; Vowel_Dependent # Lo [5] TAI VIET VOWEL UEA..TAI VIET VOWEL AN +AABE ; Vowel_Dependent # Mn TAI VIET VOWEL AM +ABE3..ABE4 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN 
ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE5 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN ANAP +ABE6..ABE7 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE8 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +10A01..10A03 ; Vowel_Dependent # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R +10A05..10A06 ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O +10A0C ; Vowel_Dependent # Mn KHAROSHTHI VOWEL LENGTH MARK +11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +110B0..110B2 ; Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II +110B3..110B6 ; Vowel_Dependent # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI +110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel + +# (Other) Vowels (reanalyzed as ordinary alphabetic letters or marks) + +# [Not derivable] + +1963..196D ; Vowel # Lo [11] TAI LE LETTER A..TAI LE LETTER AI +A85E..A861 ; Vowel # Lo [4] PHAGS-PA LETTER I..PHAGS-PA LETTER O +A866 ; Vowel # Lo [1] PHAGS-PA LETTER EE +A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO +A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Placeholder + +# Consonant Placeholder +# This includes generic placeholders used for +# Indic script layout (NBSP and dotted circle), as well as a few script- +# specific vowel-holder characters which are not technically +# consonants, but serve instead as bases for placement of vowel marks. 
+ +# [Not derivable] + +00A0 ; Consonant_Placeholder # Zs NO-BREAK SPACE +0A72..0A73 ; Consonant_Placeholder # Lo [2] GURMUKHI IRI..GURMUKHI URA +1900 ; Consonant_Placeholder # Lo LIMBU VOWEL-CARRIER LETTER +25CC ; Consonant_Placeholder # So DOTTED CIRCLE + +# ================================================ + +# Indic_Syllabic_Category=Consonant + +# Consonant (ordinary abugida consonants, with inherent vowels) + +# [Not derivable] + +0915..0939 ; Consonant # Lo [35] DEVANAGARI LETTER KA..DEVANAGARI LETTER HA +0958..095F ; Consonant # Lo [8] DEVANAGARI LETTER QA..DEVANAGARI LETTER YYA +0979..097F ; Consonant # Lo [7] DEVANAGARI LETTER ZHA..DEVANAGARI LETTER BBA +0995..09A8 ; Consonant # Lo [20] BENGALI LETTER KA..BENGALI LETTER NA +09AA..09B0 ; Consonant # Lo [7] BENGALI LETTER PA..BENGALI LETTER RA +09B2 ; Consonant # Lo BENGALI LETTER LA +09B6..09B9 ; Consonant # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA +09DC..09DD ; Consonant # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA +09DF ; Consonant # Lo BENGALI LETTER YYA +09F0..09F1 ; Consonant # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH LOWER DIAGONAL +0A15..0A28 ; Consonant # Lo [20] GURMUKHI LETTER KA..GURMUKHI LETTER NA +0A2A..0A30 ; Consonant # Lo [7] GURMUKHI LETTER PA..GURMUKHI LETTER RA +0A32..0A33 ; Consonant # Lo [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA +0A35..0A36 ; Consonant # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA +0A38..0A39 ; Consonant # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA +0A59..0A5C ; Consonant # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA +0A5E ; Consonant # Lo GURMUKHI LETTER FA +0A95..0AA8 ; Consonant # Lo [20] GUJARATI LETTER KA..GUJARATI LETTER NA +0AAA..0AB0 ; Consonant # Lo [7] GUJARATI LETTER PA..GUJARATI LETTER RA +0AB2..0AB3 ; Consonant # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA +0AB5..0AB9 ; Consonant # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA +0B15..0B28 ; Consonant # Lo [20] ORIYA LETTER KA..ORIYA LETTER NA +0B2A..0B30 ; 
Consonant # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA +0B32..0B33 ; Consonant # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA +0B35..0B39 ; Consonant # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA +0B5C..0B5D ; Consonant # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA +0B5F ; Consonant # Lo ORIYA LETTER YYA +0B71 ; Consonant # Lo ORIYA LETTER WA +0B95 ; Consonant # Lo TAMIL LETTER KA +0B99..0B9A ; Consonant # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA +0B9C ; Consonant # Lo TAMIL LETTER JA +0B9E..0B9F ; Consonant # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA +0BA3..0BA4 ; Consonant # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA +0BA8..0BAA ; Consonant # Lo [3] TAMIL LETTER NA..TAMIL LETTER PA +0BAE..0BB9 ; Consonant # Lo [12] TAMIL LETTER MA..TAMIL LETTER HA +0C15..0C28 ; Consonant # Lo [20] TELUGU LETTER KA..TELUGU LETTER NA +0C2A..0C33 ; Consonant # Lo [10] TELUGU LETTER PA..TELUGU LETTER LLA +0C35..0C39 ; Consonant # Lo [5] TELUGU LETTER VA..TELUGU LETTER HA +0C58..0C59 ; Consonant # Lo [2] TELUGU LETTER TSA..TELUGU LETTER DZA +0C95..0CA8 ; Consonant # Lo [20] KANNADA LETTER KA..KANNADA LETTER NA +0CAA..0CB3 ; Consonant # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA +0CB5..0CB9 ; Consonant # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA +0CDE ; Consonant # Lo KANNADA LETTER FA +0D15..0D3A ; Consonant # Lo [38] MALAYALAM LETTER KA..MALAYALAM LETTER TTTA +0D9A..0DB1 ; Consonant # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA +0DB3..0DBB ; Consonant # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA +0DBD ; Consonant # Lo SINHALA LETTER DANTAJA LAYANNA +0DC0..0DC6 ; Consonant # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA +0E01..0E2E ; Consonant # Lo [46] THAI CHARACTER KO KAI..THAI CHARACTER NOKHUK +0E81..0E82 ; Consonant # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG +0E84 ; Consonant # Lo LAO LETTER KHO TAM +0E87..0E88 ; Consonant # Lo [2] LAO LETTER NGO..LAO LETTER CO +0E8A ; Consonant # Lo LAO LETTER SO TAM +0E8D ; Consonant # Lo LAO 
LETTER NYO +0E94..0E97 ; Consonant # Lo [4] LAO LETTER DO..LAO LETTER THO TAM +0E99..0E9F ; Consonant # Lo [7] LAO LETTER NO..LAO LETTER FO SUNG +0EA1..0EA3 ; Consonant # Lo [3] LAO LETTER MO..LAO LETTER LO LING +0EA5 ; Consonant # Lo LAO LETTER LO LOOT +0EA7 ; Consonant # Lo LAO LETTER WO +0EAA..0EAB ; Consonant # Lo [2] LAO LETTER SO SUNG..LAO LETTER HO SUNG +0EAD..0EAE ; Consonant # Lo [2] LAO LETTER O..LAO LETTER HO TAM +0EDC..0EDD ; Consonant # Lo [2] LAO HO NO..LAO HO MO +0F40..0F47 ; Consonant # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA +0F49..0F6C ; Consonant # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA +1000..1020 ; Consonant # Lo [33] MYANMAR LETTER KA..MYANMAR LETTER LLA +103F ; Consonant # Lo MYANMAR LETTER GREAT SA +1050..1051 ; Consonant # Lo [2] MYANMAR LETTER SHA..MYANMAR LETTER SSA +105A..105D ; Consonant # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE +1061 ; Consonant # Lo MYANMAR LETTER SGAW KAREN SHA +1065..1066 ; Consonant # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER WESTERN PWO KAREN PWA +106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA +1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA +108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA +1703..170C ; Consonant # Lo [10] TAGALOG LETTER KA..TAGALOG LETTER YA +170E..1711 ; Consonant # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1723..1731 ; Consonant # Lo [15] HANUNOO LETTER KA..HANUNOO LETTER HA +1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA +1763..176C ; Consonant # Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA +176E..1770 ; Consonant # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA +1780..17A2 ; Consonant # Lo [35] KHMER LETTER KA..KHMER LETTER QA +1901..191C ; Consonant # Lo [28] LIMBU LETTER KA..LIMBU LETTER HA +1950..1962 ; Consonant # Lo [19] TAI LE LETTER KA..TAI LE LETTER NA +1980..19AB ; Consonant # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI 
LUE LETTER LOW SUA +1A00..1A16 ; Consonant # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA +1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA +1A53..1A54 ; Consonant # Lo [2] TAI THAM LETTER LAE..TAI THAM LETTER GREAT SA +1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA +1B45..1B4B ; Consonant # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA +1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA +1BC0..1BE3 ; Consonant # Lo [36] BATAK LETTER A..BATAK LETTER MBA +1C00..1C23 ; Consonant # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A +1C4D..1C4F ; Consonant # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA +A807..A80A ; Consonant # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO +A80C..A822 ; Consonant # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO +A840..A85D ; Consonant # Lo [30] PHAGS-PA LETTER KA..PHAGS-PA LETTER A +A862..A865 ; Consonant # Lo [4] PHAGS-PA LETTER QA..PHAGS-PA LETTER GGA +A869..A870 ; Consonant # Lo [8] PHAGS-PA LETTER TTA..PHAGS-PA LETTER ASPIRATED FA +A872 ; Consonant # Lo PHAGS-PA SUPERFIXED LETTER RA +A892..A8B3 ; Consonant # Lo [34] SAURASHTRA LETTER KA..SAURASHTRA LETTER LLA +A90A..A921 ; Consonant # Lo [24] KAYAH LI LETTER KA..KAYAH LI LETTER CA +A930..A946 ; Consonant # Lo [23] REJANG LETTER KA..REJANG LETTER A +A989..A98B ; Consonant # Lo [3] JAVANESE LETTER PA CEREK..JAVANESE LETTER NGA LELET RASWADI +A98F..A9B2 ; Consonant # Lo [34] JAVANESE LETTER KA..JAVANESE LETTER HA +AA06..AA28 ; Consonant # Lo [35] CHAM LETTER KA..CHAM LETTER HA +AA60..AA6F ; Consonant # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA +AA71..AA73 ; Consonant # Lo [3] MYANMAR LETTER KHAMTI XA..MYAMNAR LETTER KHAMTI RA +AA7A ; Consonant # Lo MYANMAR LETTER AITON RA +AA80..AAAF ; Consonant # Lo [48] TAI VIET LETTER LOW KO..TAI VIET LETTER HIGH O +ABC0..ABDA ; Consonant # Lo [27] 
MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER BHAM +10A00 ; Consonant # Lo KHAROSHTHI LETTER A +10A10..10A13 ; Consonant # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA +10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA +10A19..10A33 ; Consonant # Lo [27] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER TTTHA +11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER OLD TAMIL NNNA +1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Dead + +# Dead Consonant (special consonant with killed vowel) + +# [Not derivable] + +09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Repha + +# Repha Form of RA (reanalyzed in some scripts) + +# [Not derivable] + +0D4E ; Consonant_Repha # Lo MALAYALAM LETTER DOT REPH +17CC ; Consonant_Repha # Mn KHMER SIGN ROBAT +1B03 ; Consonant_Repha # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Repha # Mn SUNDANESE SIGN PANGLAYAR +A982 ; Consonant_Repha # Mn JAVANESE SIGN LAYAR + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Subjoined + +# Subjoined Consonant (C2 form subtending a base consonant in Tibetan, etc.) 
+ +# [Not derivable] + +0F8D..0F97 ; Consonant_Subjoined # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Consonant_Subjoined # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +1929..192B ; Consonant_Subjoined # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1BA1 ; Consonant_Subjoined # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA2..1BA3 ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1C24..1C25 ; Consonant_Subjoined # Mc [2] LEPCHA SUBJOINED LETTER YA..LEPCHA SUBJOINED LETTER RA +A867..A868 ; Consonant_Subjoined # Lo [2] PHAGS-PA SUBJOINED LETTER WA..PHAGS-PA SUBJOINED LETTER YA +A871 ; Consonant_Subjoined # Lo PHAGS-PA SUBJOINED LETTER RA +A9BD ; Consonant_Subjoined # Mc JAVANESE CONSONANT SIGN KERET + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Medial + +# Medial Consonant (medial liquid, occurring in clusters) + +# [Not derivable] + +0A75 ; Consonant_Medial # Mn GURMUKHI SIGN YAKASH +0EBC ; Consonant_Medial # Mn LAO SEMIVOWEL SIGN LO +0EBD ; Consonant_Medial # Lo LAO SEMIVOWEL SIGN NYO +103B..103C ; Consonant_Medial # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA +103D..103E ; Consonant_Medial # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +105E..1060 ; Consonant_Medial # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Consonant_Medial # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +1A55 ; Consonant_Medial # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A56 ; Consonant_Medial # Mn TAI THAM CONSONANT SIGN MEDIAL LA +A9BE..A9BF ; Consonant_Medial # Mc JAVANESE CONSONANT SIGN PENGKAL..JAVANESE CONSONANT SIGN CAKRA +AA33..AA34 ; Consonant_Medial # Mc [2] CHAM CONSONANT SIGN YA..CHAM CONSONANT SIGN RA +AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA + +# 
================================================ + +# Indic_Syllabic_Category=Consonant_Final + +# Final Consonant (special final forms which do not take vowels) + +# [Not derivable] + +1930..1931 ; Consonant_Final # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Consonant_Final # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B +1A57 ; Consonant_Final # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A58..1A5E ; Consonant_Final # Mn [7] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN SA +1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H +1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +A8B4 ; Consonant_Final # Mc SAURASHTRA CONSONANT SIGN HAARU +A94F..A951 ; Consonant_Final # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A952 ; Consonant_Final # Mc REJANG CONSONANT SIGN H +AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG +AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG +AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS +AA4C ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL M +AA4D ; Consonant_Final # Mc CHAM CONSONANT SIGN FINAL H +ABDB..ABE2 ; Consonant_Final # Lo [8] MEETEI MAYEK LETTER KOK LONSUM..MEETEI MAYEK LETTER I LONSUM + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Head_Letter + +# Head Letter (Tibetan) + +# [Not derivable] + +0F88..0F8C ; Consonant_Head_Letter # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN + +# ================================================ + +# Indic_Syllabic_Category=Modifying_Letter + +# Reanalyzed letters not participating in the abugida structure, but +# serving to modify the sound of an adjacent vowel or consonant. +# Note that this is not the same as General_Category=Modifier_Letter. 
+ +# [Not derivable] + +0B83 ; Modifying_Letter # Lo TAMIL SIGN VISARGA (aytham) + +# ================================================ + +# Indic_Syllabic_Category=Tone_Letter + +# Tone Letter (spacing lexical tone mark with status as a letter) + +# [Not derivable] + +1970..1974 ; Tone_Letter # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6 +AAC0 ; Tone_Letter # Lo TAI VIET TONE MAI NUENG +AAC2 ; Tone_Letter # Lo TAI VIET TONE MAI SONG + +# ================================================ + +# Indic_Syllabic_Category=Tone_Mark + +# Tone Mark (nonspacing or spacing lexical tone mark) +# Excludes Vedic tone marks, which are more akin to cantillation marks. + +# [Not derivable] + +0E48..0E4B ; Tone_Mark # Mn [4] THAI CHARACTER MAI EK..THAI CHARACTER MAI CHATTAWA +0EC8..0ECB ; Tone_Mark # Mn [4] LAO TONE MAI EK..LAO TONE MAI CATAWA +1037 ; Tone_Mark # Mn MYANMAR SIGN DOT BELOW +1063..1064 ; Tone_Mark # Mc [2] MYANMAR TONE MARK SGAW KAREN HATHI..MYANMAR TONE MARK SGAW KAREN KE PHO +1069..106D ; Tone_Mark # Mc [5] MYANMAR SIGN WESTERN PWO KAREN TONE-1..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1087..108C ; Tone_Mark # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108D ; Tone_Mark # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +108F ; Tone_Mark # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109B ; Tone_Mark # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 +19C8..19C9 ; Tone_Mark # Mc [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A75..1A79 ; Tone_Mark # Mn [5] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN TONE-5 +A92B..A92D ; Tone_Mark # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +AA7B ; Tone_Mark # Mc MYANMAR SIGN PAO KAREN TONE +AABF ; Tone_Mark # Mn TAI VIET TONE MAI EK +AAC1 ; Tone_Mark # Mn TAI VIET TONE MAI THO +ABEC ; Tone_Mark # Mc MEETEI MAYEK LUM IYEK + +# ================================================ + +# Indic_Syllabic_Category=Register_Shifter + +# Register Shifter (shifts register for consonants, akin to a 
tone mark) + +# [Not derivable] + +17C9..17CA ; Register_Shifter # Mn [2] KHMER SIGN MUUSIKATOAN..KHMER SIGN TRIISAP + +# EOF diff --git a/data/6.1.0-indic-positional-category.txt b/data/6.1.0-indic-positional-category.txt new file mode 100644 index 0000000..68cbd09 --- /dev/null +++ b/data/6.1.0-indic-positional-category.txt @@ -0,0 +1,446 @@ +# IndicMatraCategory-6.1.0.txt +# Date: 2011-08-31, 23:50:00 GMT [KW] +# +# Unicode Character Database +# Copyright (c) 1991-2011 Unicode, Inc. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# For documentation, see UAX #44. +# +# This file defines the following provisional property: +# +# Indic_Matra_Category enumerated property +# +# NB: Provisional properties and data files have no associated stability +# guarantees. They are provided in part to determine the possible usefulness +# of a property or other data and to encourage analysis and further investigation +# which may result in their improvement. Provisional properties and +# data files may change arbitrarily, or may even be removed in a future version of the +# Unicode Character Database, if they prove not to be useful. +# +# Scope: This provisional property is aimed at the problem of +# the specification of syllabic structure for Indic scripts. +# Because dependent vowels (and visible viramas, where they occur) +# are placed in notional slots around the consonant (or consonant +# cluster) core of an Indic syllable, there may be cooccurrence +# constraints or other interactions. Also, it may be desirable, +# in cases where more than one dependent vowel may occur in +# sequence, as for example, in a top slot and a bottom slot, to +# specify preferred orders for spelling. As such, this property +# is designed primarily to supplement the Indic_Syllabic_Category +# property. +# +# Note that this provisional property is *not* intended as +# a prescriptive property regarding display or font design, +# for a number of reasons. 
Good font design requires information +# that is outside the context of a character encoding standard, +# and is best handled in other venues. For Indic dependent +# vowels, in particular: +# +# 1. Matra placement may vary somewhat based on typeface design. +# 2. Matra placement, even within a single script, may vary +# somewhat according to historic period or local conventions. +# 3. Matra placement may be changed by explicit orthographic reform +# decisions. +# 4. Matras may ligate in various ways with a consonant (or even +# other elements of a syllable) instead of occurring in a +# discrete location. +# 4. Matra display may be contextually determined. This is +# notable, for example, in the Tamil script, where the shape +# and placement of -u and -uu vowels depends strongly on +# which consonant they adjoin. +# +# Format: +# Field 0 Code Point or Code Point Range +# Field 1 Indic_Matra_Category +# +# A comment field shows General_Category property values and character names. +# +# The scripts assessed as containing dependent vowels or viramas in the +# structural sense used for the Indic_Matra_Category are: +# +# Devanagari, Bengali, Gurmukhi, Gujarati, Oriya, Tamil, Telugu, +# Kannada, Malayalam, Sinhala, Thai, Lao, Tibetan, Myanmar, +# Tagalog, Hanunoo, Buhid, Tagbanwa, Khmer, Limbu, New Tai Lue, +# Buginese, Tai Tham, Balinese, Sundanese, Batak, Lepcha, +# Syloti Nagri, Saurashtra, Rejang, Javanese, Cham, Tai Viet, +# Meetei Mayek, Kharoshthi, Brahmi, Kaithi, Chakma, Sharada, Takri +# +# All characters for all other scripts not in that list +# take the default value for this property. +# +# See IndicSyllabicCategory.txt for a slightly more extended +# list of Indic scripts, including those which do not have +# dependent vowel characters. Currently, those additional +# Indic scripts without dependent vowel characters are +# Tai Le, Phags-pa, and Kayah Li. 
+# + +# ================================================ + +# Property: Indic_Matra_Category +# +# All code points not explicitly listed for Indic_Matra_Category +# have the value NA (Not_Applicable). +# +# @missing: 0000..10FFFF; NA + +# Only Indic dependent vowels (Indic_Syllabic_Category=Vowel_Dependent) +# and viramas (Indic_Syllabic_Category=Virama) +# have a non-default value for this property. + +# ------------------------------------------------ + +# Indic_Matra_Category=Right + +093B ; Right # Mc DEVANAGARI VOWEL SIGN OOE +093E ; Right # Mc DEVANAGARI VOWEL SIGN AA +0940 ; Right # Mc DEVANAGARI VOWEL SIGN II +0949..094C ; Right # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094F ; Right # Mc DEVANAGARI VOWEL SIGN AW +09BE ; Right # Mc BENGALI VOWEL SIGN AA +09C0 ; Right # Mc BENGALI VOWEL SIGN II +09D7 ; Right # Mc BENGALI AU LENGTH MARK +0A3E ; Right # Mc GURMUKHI VOWEL SIGN AA +0A40 ; Right # Mc GURMUKHI VOWEL SIGN II +0ABE ; Right # Mc GUJARATI VOWEL SIGN AA +0AC0 ; Right # Mc GUJARATI VOWEL SIGN II +0ACB..0ACC ; Right # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0B3E ; Right # Mc ORIYA VOWEL SIGN AA +0B40 ; Right # Mc ORIYA VOWEL SIGN II +0BBE..0BBF ; Right # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BD7 ; Right # Mc TAMIL AU LENGTH MARK +0C41..0C44 ; Right # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0CBE ; Right # Mc KANNADA VOWEL SIGN AA +0CC1..0CC4 ; Right # Mc [4] KANNADA VOWEL SIGN U..KANNADA VOWEL SIGN VOCALIC RR +0CD5..0CD6 ; Right # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0D3E..0D40 ; Right # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D42 ; Right # Mn [2] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN UU +# Note: U and UU form complex ligatures with consonants in older Malayalam orthography +0D57 ; Right # Mc MALAYALAM AU LENGTH MARK +0DCF..0DD1 ; Right # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD8 ; Right # Mc SINHALA VOWEL 
SIGN GAETTA-PILLA +0DDF ; Right # Mc SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Right # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Right # Lo THAI CHARACTER SARA A +0E32..0E33 ; Right # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E45 ; Right # Lo THAI CHARACTER LAKKHANGYAO +0EB0 ; Right # Lo LAO VOWEL SIGN A +0EB2..0EB3 ; Right # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +102B..102C ; Right # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +1056..1057 ; Right # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1062 ; Right # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Right # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1083 ; Right # Mc MYANMAR VOWEL SIGN SHAN AA +109C ; Right # Mc MYANMAR VOWEL SIGN AITON A +17B6 ; Right # Mc KHMER VOWEL SIGN AA +17C8 ; Right # Mc KHMER SIGN YUUKALEAPINTU +1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI +19B0..19B4 ; Right # Mc [5] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN UU +19B8..19B9 ; Right # Mc [2] NEW TAI LUE VOWEL SIGN OA..NEW TAI LUE VOWEL SIGN UE +19BB..19C0 ; Right # Mc [6] NEW TAI LUE VOWEL SIGN AAY..NEW TAI LUE VOWEL SIGN IY +1A1A ; Right # Mc BUGINESE VOWEL SIGN O +1A61 ; Right # Mc TAI THAM VOWEL SIGN A +1A63..1A64 ; Right # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A6D ; Right # Mc TAI THAM VOWEL SIGN OY +1B35 ; Right # Mc BALINESE VOWEL SIGN TEDUNG +1B44 ; Right # Mc BALINESE ADEG ADEG +1BA7 ; Right # Mc SUNDANESE VOWEL SIGN PANOLONG +1BAA ; Right # Mc SUNDANESE SIGN PAMAAEH +1BF2..1BF3 ; Right # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +1C26 ; Right # Mc LEPCHA VOWEL SIGN AA +1C2A..1C2B ; Right # Mc [2] LEPCHA VOWEL SIGN U..LEPCHA VOWEL SIGN UU +A823..A824 ; Right # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A827 ; Right # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Right # Mc [15] SAURASHTRA VOWEL 
SIGN AA..SAURASHTRA VOWEL SIGN AU +A953 ; Right # Mc REJANG VIRAMA +A9B4..A9B5 ; Right # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +AAB1 ; Right # Lo TAI VIET VOWEL AA +AABA ; Right # Lo TAI VIET VOWEL UA +AABD ; Right # Lo TAI VIET VOWEL AN +AAEF ; Right # Mc MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE6..ABE7 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE9..ABEA ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +110B0 ; Right # Mc KAITHI VOWEL SIGN AA +110B2 ; Right # Mc KAITHI VOWEL SIGN II +110B7..110B8 ; Right # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +111B3 ; Right # Mc SHARADA VOWEL SIGN AA +111B5 ; Right # Mc SHARADA VOWEL SIGN II +111C0 ; Right # Mc SHARADA SIGN VIRAMA +116AF ; Right # Mc TAKRI VOWEL SIGN II + +# Indic_Matra_Category=Left + +093F ; Left # Mc DEVANAGARI VOWEL SIGN I +094E ; Left # Mc DEVANAGARI VOWEL SIGN PRISHTHAMATRA E +09BF ; Left # Mc BENGALI VOWEL SIGN I +09C7..09C8 ; Left # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +0A3F ; Left # Mc GURMUKHI VOWEL SIGN I +0ABF ; Left # Mc GUJARATI VOWEL SIGN I +0B47 ; Left # Mc ORIYA VOWEL SIGN E +0BC6..0BC8 ; Left # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0D46..0D48 ; Left # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0DD9 ; Left # Mc SINHALA VOWEL SIGN KOMBUVA +0DDB ; Left # Mc SINHALA VOWEL SIGN KOMBU DEKA +1031 ; Left # Mc MYANMAR VOWEL SIGN E +1084 ; Left # Mc MYANMAR VOWEL SIGN SHAN E +17C1..17C3 ; Left # Mc [3] KHMER VOWEL SIGN E..KHMER VOWEL SIGN AI +19B5..19B7 ; Left # Mc [3] NEW TAI LUE VOWEL SIGN E..NEW TAI LUE VOWEL SIGN O +19BA ; Left # Mc NEW TAI LUE VOWEL SIGN AY +1A19 ; Left # Mc BUGINESE VOWEL SIGN E +1A1B ; Left # Mc BUGINESE VOWEL SIGN AE +1A6E..1A72 ; Left # Mc [5] TAI THAM VOWEL SIGN E..TAI THAM VOWEL SIGN THAM AI +1B3E..1B3F ; Left # Mc [2] BALINESE VOWEL SIGN TALING..BALINESE VOWEL 
SIGN TALING REPA +1BA6 ; Left # Mc SUNDANESE VOWEL SIGN PANAELAENG +1C27..1C28 ; Left # Mc [2] LEPCHA VOWEL SIGN I..LEPCHA VOWEL SIGN O +A9BA..A9BB ; Left # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +AA2F..AA30 ; Left # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AAEB ; Left # Mc MEETEI MAYEK VOWEL SIGN II +AAEE ; Left # Mc MEETEI MAYEK VOWEL SIGN AU +110B1 ; Left # Mc KAITHI VOWEL SIGN I +1112C ; Left # Mc CHAKMA VOWEL SIGN E +111B4 ; Left # Mc SHARADA VOWEL SIGN I +116AE ; Left # Mc TAKRI VOWEL SIGN I + +# Indic_Matra_Category=Visual_Order_Left + +# These are dependent vowels that occur to the left of the consonant +# letter in a syllable, but which occur in scripts using the visual order +# model, instead of the logical order model. Because of the different +# model, these left-side vowels occur first in the backing store (before +# the consonant letter) and are not reordered during text rendering. +# +# [Derivation: Logical_Order_Exception=True] + +0E40..0E44 ; Visual_Order_Left # Lo [5] THAI CHARACTER SARA E..THAI CHARACTER SARA AI MAIMALAI +0EC0..0EC4 ; Visual_Order_Left # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +AAB5..AAB6 ; Visual_Order_Left # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB9 ; Visual_Order_Left # Lo TAI VIET VOWEL UEA +AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL AY + +# Indic_Matra_Category=Left_And_Right + +09CB..09CC ; Left_And_Right # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +0B4B ; Left_And_Right # Mc ORIYA VOWEL SIGN O +0BCA..0BCC ; Left_And_Right # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0D4A..0D4C ; Left_And_Right # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0DDC..0DDE ; Left_And_Right # Mc [3] SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA..SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA +17C0 ; Left_And_Right # Mc KHMER VOWEL SIGN IE +17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU +1B40..1B41 ; Left_And_Right # Mc [2] 
BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG + +# Indic_Matra_Category=Top + +093A ; Top # Mn DEVANAGARI VOWEL SIGN OE +0945..0948 ; Top # Mn [4] DEVANAGARI VOWEL SIGN CANDRA E..DEVANAGARI VOWEL SIGN AI +0955 ; Top # Mn DEVANAGARI VOWEL SIGN CANDRA LONG E +0A47..0A48 ; Top # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Top # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0AC5 ; Top # Mn GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Top # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0B3F ; Top # Mn ORIYA VOWEL SIGN I +0B56 ; Top # Mn ORIYA AI LENGTH MARK +0BC0 ; Top # Mn TAMIL VOWEL SIGN II +0BCD ; Top # Mn TAMIL SIGN VIRAMA +0C3E..0C40 ; Top # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C46..0C47 ; Top # Mn [2] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN EE +0C4A..0C4C ; Top # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C4D ; Top # Mn TELUGU SIGN VIRAMA +0C55 ; Top # Mn TELUGU LENGTH MARK +0CBF ; Top # Mn KANNADA VOWEL SIGN I +0CC6 ; Top # Mn KANNADA VOWEL SIGN E +0CCC ; Top # Mn KANNADA VOWEL SIGN AU +0CCD ; Top # Mn KANNADA SIGN VIRAMA +0D4D ; Top # Mn MALAYALAM SIGN VIRAMA +0DCA ; Top # Mn SINHALA SIGN AL-LAKUNA +0DD2..0DD3 ; Top # Mn [2] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN DIGA IS-PILLA +0E31 ; Top # Mn THAI CHARACTER MAI HAN-AKAT +0E34..0E37 ; Top # Mn [4] THAI CHARACTER SARA I..THAI CHARACTER SARA UEE +0E47 ; Top # Mn THAI CHARACTER MAITAIKHU +0E4E ; Top # Mn THAI CHARACTER YAMAKKAN +0EB1 ; Top # Mn LAO VOWEL SIGN MAI KAN +0EB4..0EB7 ; Top # Mn [4] LAO VOWEL SIGN I..LAO VOWEL SIGN YY +0EBB ; Top # Mn LAO VOWEL SIGN MAI KON +0F72 ; Top # Mn TIBETAN VOWEL SIGN I +0F7A..0F7D ; Top # Mn [4] TIBETAN VOWEL SIGN E..TIBETAN VOWEL SIGN OO +0F80 ; Top # Mn TIBETAN VOWEL SIGN REVERSED I +102D..102E ; Top # Mn [2] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN II +1032..1035 ; Top # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +103A ; Top # Mn MYANMAR SIGN ASAT +1071..1074 
; Top # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1085..1086 ; Top # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109D ; Top # Mn MYANMAR VOWEL SIGN AITON AI +1712 ; Top # Mn TAGALOG VOWEL SIGN I +1732 ; Top # Mn HANUNOO VOWEL SIGN I +1752 ; Top # Mn BUHID VOWEL SIGN I +1772 ; Top # Mn TAGBANWA VOWEL SIGN I +17B7..17BA ; Top # Mn [4] KHMER VOWEL SIGN I..KHMER VOWEL SIGN YY +17D1 ; Top # Mn KHMER SIGN VIRIAM +1920..1921 ; Top # Mn [2] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN I +1927..1928 ; Top # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +1A17 ; Top # Mn BUGINESE VOWEL SIGN I +1A62 ; Top # Mn TAI THAM VOWEL SIGN MAI SAT +1A65..1A68 ; Top # Mn [4] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN UUE +1A6B ; Top # Mn TAI THAM VOWEL SIGN O +1A73..1A74 ; Top # Mn [2] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN MAI KANG +1B36..1B37 ; Top # Mn [2] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN ULU SARI +1B42 ; Top # Mn BALINESE VOWEL SIGN PEPET +1BA4 ; Top # Mn SUNDANESE VOWEL SIGN PANGHULU +1BA8..1BA9 ; Top # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +A806 ; Top # Mn SYLOTI NAGRI SIGN HASANTA +A826 ; Top # Mn SYLOTI NAGRI VOWEL SIGN E +A94A ; Top # Mn REJANG VOWEL SIGN AI +A9B6..A9B7 ; Top # Mn [2] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN WULU MELIK +A9BC ; Top # Mn JAVANESE VOWEL SIGN PEPET +AA29..AA2C ; Top # Mn [4] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN EI +AA2E ; Top # Mn CHAM VOWEL SIGN OE +AA31 ; Top # Mn CHAM VOWEL SIGN AU +AAB0 ; Top # Mn TAI VIET MAI KANG +AAB2..AAB3 ; Top # Mn [2] TAI VIET VOWEL I..TAI VIET VOWEL UE +AAB7..AAB8 ; Top # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AABE ; Top # Mn TAI VIET VOWEL AM +AAED ; Top # Mn MEETEI MAYEK VOWEL SIGN AAI +ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP +10A05 ; Top # Mn KHAROSHTHI VOWEL SIGN E +11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II +11042..11045 ; Top # Mn [4] BRAHMI VOWEL SIGN E..BRAHMI VOWEL SIGN AU 
+11046 ; Top # Mn BRAHMI VIRAMA +110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI VOWEL SIGN AI +11127..11129 ; Top # Mn [3] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN II +1112D ; Top # Mn CHAKMA VOWEL SIGN AI +11130 ; Top # Mn CHAKMA VOWEL SIGN OI +11134 ; Top # Mn CHAKMA MAAYYAA +111BC..111BE ; Top # Mn [3] SHARADA VOWEL SIGN E..SHARADA VOWEL SIGN O +116AD ; Top # Mn TAKRI VOWEL SIGN AA +116B2..116B5 ; Top # Mn [4] TAKRI VOWEL SIGN E..TAKRI VOWEL SIGN AU +116B6 ; Top # Mn TAKRI SIGN VIRAMA + +# Indic_Matra_Category=Bottom + +0941..0944 ; Bottom # Mn [4] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN VOCALIC RR +094D ; Bottom # Mn DEVANAGARI SIGN VIRAMA +0956..0957 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN UE..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09C1..09C4 ; Bottom # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09CD ; Bottom # Mn BENGALI SIGN VIRAMA +09E2..09E3 ; Bottom # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A41..0A42 ; Bottom # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A4D ; Bottom # Mn GURMUKHI SIGN VIRAMA +0AC1..0AC4 ; Bottom # Mn [4] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN VOCALIC RR +0ACD ; Bottom # Mn GUJARATI SIGN VIRAMA +0AE2..0AE3 ; Bottom # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B4D ; Bottom # Mn ORIYA SIGN VIRAMA +0B62..0B63 ; Bottom # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BC1..0BC2 ; Bottom # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +# Note: U and UU have contextually variable placement in Tamil. 
+0C56 ; Bottom # Mn TELUGU AI LENGTH MARK +0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CE2..0CE3 ; Bottom # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D43..0D44 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC R..MALAYALAM VOWEL SIGN VOCALIC RR +0D62..0D63 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DD4 ; Bottom # Mn SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Bottom # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0E38..0E39 ; Bottom # Mn [2] THAI CHARACTER SARA U..THAI CHARACTER SARA UU +0E3A ; Bottom # Mn THAI CHARACTER PHINTHU +0EB8..0EB9 ; Bottom # Mn [2] LAO VOWEL SIGN U..LAO VOWEL SIGN UU +0F71 ; Bottom # Mn TIBETAN VOWEL SIGN AA +0F74..0F75 ; Bottom # Mn [2] TIBETAN VOWEL SIGN U..TIBETAN VOWEL SIGN UU +0F84 ; Bottom # Mn TIBETAN MARK HALANTA +102F..1030 ; Bottom # Mn [2] MYANMAR VOWEL SIGN U..MYANMAR VOWEL SIGN UU +1058..1059 ; Bottom # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1713 ; Bottom # Mn TAGALOG VOWEL SIGN U +1714 ; Bottom # Mn TAGALOG SIGN VIRAMA +1733 ; Bottom # Mn HANUNOO VOWEL SIGN U +1734 ; Bottom # Mn HANUNOO SIGN PAMUDPOD +1753 ; Bottom # Mn BUHID VOWEL SIGN U +1773 ; Bottom # Mn TAGBANWA VOWEL SIGN U +17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA +1922 ; Bottom # Mn LIMBU VOWEL SIGN U +1A18 ; Bottom # Mn BUGINESE VOWEL SIGN U +1A69..1A6A ; Bottom # Mn [2] TAI THAM VOWEL SIGN U..TAI THAM VOWEL SIGN UU +1A6C ; Bottom # Mn TAI THAM VOWEL SIGN OA BELOW +1B38..1B3A ; Bottom # Mn [3] BALINESE VOWEL SIGN SUKU..BALINESE VOWEL SIGN RA REPA +1BA5 ; Bottom # Mn SUNDANESE VOWEL SIGN PANYUKU +1C2C ; Bottom # Mn LEPCHA VOWEL SIGN E +A825 ; Bottom # Mn SYLOTI NAGRI VOWEL SIGN U +A8C4 ; Bottom # Mn SAURASHTRA SIGN VIRAMA +A947..A949 ; Bottom # Mn [3] REJANG VOWEL SIGN I..REJANG VOWEL SIGN E +A94B..A94E ; Bottom # Mn [4] REJANG VOWEL SIGN O..REJANG VOWEL SIGN EA +A9B8..A9B9 ; Bottom # Mn [2] JAVANESE VOWEL SIGN 
SUKU..JAVANESE VOWEL SIGN SUKU MENDUT +AA2D ; Bottom # Mn CHAM VOWEL SIGN U +AA32 ; Bottom # Mn CHAM VOWEL SIGN UE +AAB4 ; Bottom # Mn TAI VIET VOWEL U +AAEC ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UU +ABE8 ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK +10A02..10A03 ; Bottom # Mn [2] KHAROSHTHI VOWEL SIGN U..KHAROSHTHI VOWEL SIGN VOCALIC R +10A0C ; Bottom # Mn KHAROSHTHI VOWEL LENGTH MARK +1103C..11041 ; Bottom # Mn [6] BRAHMI VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL +110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU +110B9 ; Bottom # Mn KAITHI SIGN VIRAMA +1112A..1112B ; Bottom # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU +11131..11132 ; Bottom # Mn [2] CHAKMA O MARK..CHAKMA AU MARK +111B6..111BB ; Bottom # Mn [6] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN VOCALIC LL +116B0..116B1 ; Bottom # Mn [2] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN UU + +# Indic_Matra_Category=Top_And_Bottom + +0C48 ; Top_And_Bottom # Mn TELUGU VOWEL SIGN AI +0F73 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN II +0F76..0F79 ; Top_And_Bottom # Mn [4] TIBETAN VOWEL SIGN VOCALIC R..TIBETAN VOWEL SIGN VOCALIC LL +0F81 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN REVERSED II +1B3C ; Top_And_Bottom # Mn BALINESE VOWEL SIGN LA LENGA +1112E..1112F ; Top_And_Bottom # Mn [2] CHAKMA VOWEL SIGN O..CHAKMA VOWEL SIGN AU + +# Indic_Matra_Category=Top_And_Right + +0AC9 ; Top_And_Right # Mc GUJARATI VOWEL SIGN CANDRA O +0B57 ; Top_And_Right # Mc ORIYA AU LENGTH MARK +0CC0 ; Top_And_Right # Mc KANNADA VOWEL SIGN II +0CC7..0CC8 ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +1925..1926 ; Top_And_Right # Mc [2] LIMBU VOWEL SIGN OO..LIMBU VOWEL SIGN AU +1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG +111BF ; Top_And_Right # Mc SHARADA VOWEL SIGN AU + +# Indic_Matra_Category=Top_And_Left + +0B48 ; Top_And_Left # Mc ORIYA VOWEL SIGN AI +0DDA ; 
Top_And_Left # Mc SINHALA VOWEL SIGN DIGA KOMBUVA +17BE ; Top_And_Left # Mc KHMER VOWEL SIGN OE +1C29 ; Top_And_Left # Mc LEPCHA VOWEL SIGN OO + +# Indic_Matra_Category=Top_And_Left_And_Right + +0B4C ; Top_And_Left_And_Right # Mc ORIYA VOWEL SIGN AU +17BF ; Top_And_Left_And_Right # Mc KHMER VOWEL SIGN YA + +# Indic_Matra_Category=Bottom_And_Right + +1B3B ; Bottom_And_Right # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +A9C0 ; Bottom_And_Right # Mc JAVANESE PANGKON + +# Indic_Matra_Category=Top_And_Bottom_And_Right + +1B3D ; Top_And_Bottom_And_Right # Mc BALINESE VOWEL SIGN LA LENGA TEDUNG + +# Indic_Matra_Category=Overstruck + +10A01 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN I +10A06 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN O + +# Indic_Matra_Category=Invisible + +# The Invisible category refers to viramas for certain script +# which are used only to control consonant stacking or cluster +# formation, and which have no visible display on their own. + +1039 ; Invisible # Mn MYANMAR SIGN VIRAMA +17D2 ; Invisible # Mn KHMER SIGN COENG +1A60 ; Invisible # Mn TAI THAM SIGN SAKOT +AAF6 ; Invisible # Mn MEETEI MAYEK VIRAMA +10A3F ; Invisible # Mn KHAROSHTHI VIRAMA +11133 ; Invisible # Mn CHAKMA VIRAMA + +# EOF diff --git a/data/6.1.0-indic-syllabic-category.txt b/data/6.1.0-indic-syllabic-category.txt new file mode 100644 index 0000000..9d771ba --- /dev/null +++ b/data/6.1.0-indic-syllabic-category.txt @@ -0,0 +1,796 @@ +# IndicSyllabicCategory-6.1.0.txt +# Date: 2011-08-31, 23:54:00 GMT [KW] +# +# Unicode Character Database +# Copyright (c) 1991-2011 Unicode, Inc. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# For documentation, see UAX #44. +# +# This file defines the following provisional property: +# +# Indic_Syllabic_Category enumerated property +# +# NB: Provisional properties and data files have no associated stability +# guarantees. 
They are provided in part to determine the possible usefulness +# of a property or other data and to encourage analysis and further investigation +# which may result in their improvement. Provisional properties and +# data files may change arbitrarily, or may even be removed in a future version of the +# Unicode Character Database, if they prove not to be useful. +# +# Scope: This provisional property is aimed at two general problem +# areas involving the analysis and processing of Indic scripts: +# +# 1. Specification of syllabic structure. +# 2. Specification of segmentation rules. +# +# Both of these problem areas may benefit from having defined subtypes +# of Indic script characters which are relevant to how Indic +# syllables (or aksaras) are constructed. Note that rules for +# syllabic structure in Indic scripts may differ significantly +# from how phonological syllables are defined. +# +# Format: +# Field 0 Code Point or Code Point Range +# Field 1 Indic_Syllabic_Category +# +# A comment field shows General_Category property values and character names. +# +# The scripts assessed as Indic in the +# structural sense used for the Indic_Syllabic_Category are: +# +# Devanagari, Bengali, Gurmukhi, Gujarati, Oriya, Tamil, Telugu, +# Kannada, Malayalam, Sinhala, Thai, Lao, Tibetan, Myanmar, +# Tagalog, Hanunoo, Buhid, Tagbanwa, Khmer, Limbu, Tai Le, New Tai Lue, +# Buginese, Tai Tham, Balinese, Sundanese, Batak, Lepcha, +# Syloti Nagri, Phags-Pa, Saurashtra, Kayah Li, Rejang, Javanese, Cham, Tai Viet, +# Meetei Mayek, Kharoshthi, Brahmi, Kaithi, Chakma, Sharada, Takri +# +# All characters for all other scripts not in that list +# take the default value for this property, unless they +# are individually listed in this data file. +# + +# ================================================ + +# Property: Indic_Syllabic_Category +# +# All code points not explicitly listed for Indic_Syllabic_Category +# have the value Other. 
+# +# @missing: 0000..10FFFF; Other + +# ================================================ + +# Indic_Syllabic_Category=Bindu + +# Bindu/Anusvara (nasalization or -n) +# Excludes various Vedic nasalization signs. + +# [Not derivable] + +0900..0902 ; Bindu # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +0981 ; Bindu # Mn BENGALI SIGN CANDRABINDU +0982 ; Bindu # Mc BENGALI SIGN ANUSVARA +0A01..0A02 ; Bindu # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A70 ; Bindu # Mn GURMUKHI TIPPI +0A81..0A82 ; Bindu # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0B01 ; Bindu # Mn ORIYA SIGN CANDRABINDU +0B02 ; Bindu # Mc ORIYA SIGN ANUSVARA +0B82 ; Bindu # Mn TAMIL SIGN ANUSVARA +0C01..0C02 ; Bindu # Mc [2] TELUGU SIGN CANDRABINDU..TELUGU SIGN ANUSVARA +0C82 ; Bindu # Mc KANNADA SIGN ANUSVARA +0D02 ; Bindu # Mc MALAYALAM SIGN ANUSVARA +0D82 ; Bindu # Mc SINHALA SIGN ANUSVARAYA +0E4D ; Bindu # Mn THAI CHARACTER NIKHAHIT +0ECD ; Bindu # Mn LAO NIGGAHITA +0F7E ; Bindu # Mn TIBETAN SIGN RJES SU NGA RO +0F82..0F83 ; Bindu # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +1036 ; Bindu # Mn MYANMAR SIGN ANUSVARA +17C6 ; Bindu # Mn KHMER SIGN NIKAHIT +1932 ; Bindu # Mn LIMBU SMALL LETTER ANUSVARA +1B00..1B02 ; Bindu # Mn [3] BALINESE SIGN ULU RICEM..BALINESE SIGN CECEK +A80B ; Bindu # Mn SYLOTI NAGRI SIGN ANUSVARA +A873 ; Bindu # Lo PHAGS-PA LETTER CANDRABINDU +A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK +1B80 ; Bindu # Mn SUNDANESE SIGN PANYECEK +1C34..1C35 ; Bindu # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A880 ; Bindu # Mc SAURASHTRA SIGN ANUSVARA +10A0E ; Bindu # Mn KHAROSHTHI SIGN ANUSVARA +11000 ; Bindu # Mc BRAHMI SIGN CANDRABINDU +11001 ; Bindu # Mn BRAHMI SIGN ANUSVARA +11080..11081 ; Bindu # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +11100..11101 ; Bindu # Mn CHAKMA SIGN CANDRABINDU..CHAKMA SIGN ANUSVARA +11180..11181 ; Bindu # Mn SHARADA SIGN 
CANDRABINDU..SHARADA SIGN ANUSVARA +116AB ; Bindu # Mn TAKRI SIGN ANUSVARA + +# ================================================ + +# Indic_Syllabic_Category=Visarga + +# Visarga (-h) +# Includes specialized case for Sanskrit: ardhavisarga +# Excludes letters for jihvamuliya and upadhmaniya, which are +# related, but structured somewhat differently. + +# [Not derivable] + +0903 ; Visarga # Mc DEVANAGARI SIGN VISARGA +0983 ; Visarga # Mc BENGALI SIGN VISARGA +0A03 ; Visarga # Mc GURMUKHI SIGN VISARGA +0A83 ; Visarga # Mc GUJARATI SIGN VISARGA +0B03 ; Visarga # Mc ORIYA SIGN VISARGA +0C03 ; Visarga # Mc TELUGU SIGN VISARGA +0C83 ; Visarga # Mc KANNADA SIGN VISARGA +0D03 ; Visarga # Mc MALAYALAM SIGN VISARGA +0D83 ; Visarga # Mc SINHALA SIGN VISARGAYA +0F7F ; Visarga # Mc TIBETAN SIGN RNAM BCAD +1038 ; Visarga # Mc MYANMAR SIGN VISARGA +17C7 ; Visarga # Mc KHMER SIGN REAHMUK +1B04 ; Visarga # Mc BALINESE SIGN BISAH +1B82 ; Visarga # Mc SUNDANESE SIGN PANGWISAD +1CF2 ; Visarga # Mc VEDIC SIGN ARDHAVISARGA +1CF3 ; Visarga # Mc VEDIC SIGN ROTATED ARDHAVISARGA +A881 ; Visarga # Mc SAURASHTRA SIGN VISARGA +A983 ; Visarga # Mc JAVANESE SIGN WIGNYAN +AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA +10A0F ; Visarga # Mn KHAROSHTHI SIGN VISARGA +11002 ; Visarga # Mc BRAHMI SIGN VISARGA +11082 ; Visarga # Mc KAITHI SIGN VISARGA +11102 ; Visarga # Mn CHAKMA SIGN VISARGA +11182 ; Visarga # Mn SHARADA SIGN VISARGA +116AC ; Visarga # Mc TAKRI SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Avagraha + +# Avagraha (elision of initial a- in sandhi) + +# [Not derivable] + +093D ; Avagraha # Lo DEVANAGARI SIGN AVAGRAHA +09BD ; Avagraha # Lo BENGALI SIGN AVAGRAHA +0ABD ; Avagraha # Lo GUJARATI SIGN AVAGRAHA +0B3D ; Avagraha # Lo ORIYA SIGN AVAGRAHA +0C3D ; Avagraha # Lo TELUGU SIGN AVAGRAHA +0CBD ; Avagraha # Lo KANNADA SIGN AVAGRAHA +0D3D ; Avagraha # Lo MALAYALAM SIGN AVAGRAHA +0F85 ; Avagraha # Po TIBETAN MARK PALUTA +17DC ; Avagraha 
# Lo KHMER SIGN AVAKRAHASANYA +1BBA ; Avagraha # Lo SUNDANESE AVAGRAHA +111C1 ; Avagraha # Lo SHARADA SIGN AVAGRAHA + +# ================================================ + +# Indic_Syllabic_Category=Nukta + +# Nukta (diacritic for borrowed consonants) + +# [Derivation: (ccc=7) - 1037] + +093C ; Nukta # Mn DEVANAGARI SIGN NUKTA +09BC ; Nukta # Mn BENGALI SIGN NUKTA +0A3C ; Nukta # Mn GURMUKHI SIGN NUKTA +0ABC ; Nukta # Mn GUJARATI SIGN NUKTA +0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0CBC ; Nukta # Mn KANNADA SIGN NUKTA +1B34 ; Nukta # Mn BALINESE SIGN REREKAN +1BE6 ; Nukta # Mn BATAK SIGN TOMPI +1C37 ; Nukta # Mn LEPCHA SIGN NUKTA +A9B3 ; Nukta # Mn JAVANESE SIGN CECAK TELU +110BA ; Nukta # Mn KAITHI SIGN NUKTA +116B7 ; Nukta # Mn TAKRI SIGN NUKTA + +# ================================================ + +# Indic_Syllabic_Category=Virama + +# Virama (killing of inherent vowel in consonant sequence, +# or consonant stacker, depending on model) +# Also includes pure killers. + +# [Derivation: (ccc=9) + 0E4E + 17D1] + +094D ; Virama # Mn DEVANAGARI SIGN VIRAMA +09CD ; Virama # Mn BENGALI SIGN VIRAMA +0A4D ; Virama # Mn GURMUKHI SIGN VIRAMA +0ACD ; Virama # Mn GUJARATI SIGN VIRAMA +0B4D ; Virama # Mn ORIYA SIGN VIRAMA +0BCD ; Virama # Mn TAMIL SIGN VIRAMA +0C4D ; Virama # Mn TELUGU SIGN VIRAMA +0CCD ; Virama # Mn KANNADA SIGN VIRAMA +0D4D ; Virama # Mn MALAYALAM SIGN VIRAMA +0DCA ; Virama # Mn SINHALA SIGN AL-LAKUNA +0E3A ; Virama # Mn THAI CHARACTER PHINTHU +0E4E ; Virama # Mn THAI CHARACTER YAMAKKAN +0F84 ; Virama # Mn TIBETAN MARK HALANTA +1039..103A ; Virama # Mn [2] MYANMAR SIGN VIRAMA..MYANMAR SIGN ASAT +1714 ; Virama # Mn TAGALOG SIGN VIRAMA +1734 ; Virama # Mn HANUNOO SIGN PAMUDPOD +17D1..17D2 ; Virama # Mn [2] KHMER SIGN VIRIAM..KHMER SIGN COENG +1A60 ; Virama # Mn TAI THAM SIGN SAKOT +1B44 ; Virama # Mc BALINESE ADEG ADEG +1BAA ; Virama # Mc SUNDANESE SIGN PAMAAEH +1BAB ; Virama # Mc SUNDANESE SIGN VIRAMA +1BF2..1BF3 ; Virama # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN 
+A806 ; Virama # Mn SYLOTI NAGRI SIGN HASANTA +A8C4 ; Virama # Mn SAURASHTRA SIGN VIRAMA +A953 ; Virama # Mc REJANG VIRAMA +A9C0 ; Virama # Mc JAVANESE PANGKON +AAF6 ; Virama # Mn MEETEI MAYEK VIRAMA +ABED ; Virama # Mn MEETEI MAYEK APUN IYEK +10A3F ; Virama # Mn KHAROSHTHI VIRAMA +11046 ; Virama # Mn BRAHMI VIRAMA +110B9 ; Virama # Mn KAITHI SIGN VIRAMA +11133..11134 ; Virama # Mn CHAKMA VIRAMA..CHAKMA MAAYYAA +111C0 ; Virama # Mc SHARADA SIGN VIRAMA +116B6 ; Virama # Mn TAKRI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Independent + +# Independent Vowels (contrasted with matras) + +# [Not derivable] + +0904..0914 ; Vowel_Independent # Lo [17] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER AU +0960..0961 ; Vowel_Independent # Lo [2] DEVANAGARI LETTER VOCALIC RR..DEVANAGARI LETTER VOCALIC LL +0972..0977 ; Vowel_Independent # Lo [6] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER UUE +0985..098C ; Vowel_Independent # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L +098F..0990 ; Vowel_Independent # Lo [2] BENGALI LETTER E..BENGALI LETTER AI +0993..0994 ; Vowel_Independent # Lo [2] BENGALI LETTER O..BENGALI LETTER AU +09E0..09E1 ; Vowel_Independent # Lo [2] BENGALI LETTER VOCALIC RR..BENGALI LETTER VOCALIC LL +0A05..0A0A ; Vowel_Independent # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU +0A0F..0A10 ; Vowel_Independent # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI +0A13..0A14 ; Vowel_Independent # Lo [2] GURMUKHI LETTER OO..GURMUKHI LETTER AU +0A85..0A8D ; Vowel_Independent # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E +0A8F..0A91 ; Vowel_Independent # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O +0A93..0A94 ; Vowel_Independent # Lo [2] GUJARATI LETTER O..GUJARATI LETTER AU +0AE0..0AE1 ; Vowel_Independent # Lo [2] GUJARATI LETTER VOCALIC RR..GUJARATI LETTER VOCALIC LL +0B05..0B0C ; Vowel_Independent # Lo [8] ORIYA LETTER A..ORIYA LETTER VOCALIC L +0B0F..0B10 ; Vowel_Independent # Lo [2] ORIYA LETTER 
E..ORIYA LETTER AI +0B13..0B14 ; Vowel_Independent # Lo [2] ORIYA LETTER O..ORIYA LETTER AU +0B60..0B61 ; Vowel_Independent # Lo [2] ORIYA LETTER VOCALIC RR..ORIYA LETTER VOCALIC LL +0B85..0B8A ; Vowel_Independent # Lo [6] TAMIL LETTER A..TAMIL LETTER UU +0B8E..0B90 ; Vowel_Independent # Lo [3] TAMIL LETTER E..TAMIL LETTER AI +0B92..0B94 ; Vowel_Independent # Lo [3] TAMIL LETTER O..TAMIL LETTER AU +0C05..0C0C ; Vowel_Independent # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L +0C0E..0C10 ; Vowel_Independent # Lo [3] TELUGU LETTER E..TELUGU LETTER AI +0C12..0C14 ; Vowel_Independent # Lo [3] TELUGU LETTER O..TELUGU LETTER AU +0C60..0C61 ; Vowel_Independent # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL +0C85..0C8C ; Vowel_Independent # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L +0C8E..0C90 ; Vowel_Independent # Lo [3] KANNADA LETTER E..KANNADA LETTER AI +0C92..0C94 ; Vowel_Independent # Lo [3] KANNADA LETTER O..KANNADA LETTER AU +0CE0..0CE1 ; Vowel_Independent # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL +0D05..0D0C ; Vowel_Independent # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L +0D0E..0D10 ; Vowel_Independent # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI +0D12..0D14 ; Vowel_Independent # Lo [3] MALAYALAM LETTER O..MALAYALAM LETTER AU +0D60..0D61 ; Vowel_Independent # Lo [2] MALAYALAM LETTER VOCALIC RR..MALAYALAM LETTER VOCALIC LL +0D85..0D96 ; Vowel_Independent # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA +1021..102A ; Vowel_Independent # Lo [10] MYANMAR LETTER A..MYANMAR LETTER AU +1052..1055 ; Vowel_Independent # Lo [4] MYANMAR LETTER VOCALIC R..MYANMAR LETTER VOCALIC LL +1700..1702 ; Vowel_Independent # Lo [3] TAGALOG LETTER A..TAGALOG LETTER U +1720..1722 ; Vowel_Independent # Lo [3] HANUNOO LETTER A..HANUNOO LETTER U +1740..1742 ; Vowel_Independent # Lo [3] BUHID LETTER A..BUHID LETTER U +1760..1762 ; Vowel_Independent # Lo [3] TAGBANWA LETTER A..TAGBANWA LETTER U +17A3..17B3 ; Vowel_Independent # 
Lo [17] KHMER INDEPENDENT VOWEL QAQ..KHMER INDEPENDENT VOWEL QAU +1A4D..1A52 ; Vowel_Independent # Lo [6] TAI THAM LETTER I..TAI THAM LETTER OO +1B05..1B12 ; Vowel_Independent # Lo [14] BALINESE LETTER AKARA..BALINESE LETTER OKARA TEDUNG +1B83..1B89 ; Vowel_Independent # Lo [7] SUNDANESE LETTER A..SUNDANESE LETTER EU +1BE4..1BE5 ; Vowel_Independent # Lo [2] BATAK LETTER I..BATAK LETTER U +A800..A801 ; Vowel_Independent # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I +A803..A805 ; Vowel_Independent # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O +A882..A891 ; Vowel_Independent # Lo [16] SAURASHTRA LETTER A..SAURASHTRA LETTER AU +A984..A988 ; Vowel_Independent # Lo [5] JAVANESE LETTER A..JAVANESE LETTER U +A98C..A98E ; Vowel_Independent # Lo [3] JAVANESE LETTER E..JAVANESE LETTER O +AA00..AA05 ; Vowel_Independent # Lo [6] CHAM LETTER A..CHAM LETTER O +AAE0..AAE1 ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER E..MEETEI MAYEK LETTER O +ABCE..ABCF ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER UN..MEETEI MAYEK LETTER I +ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA +11005..11012 ; Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU +11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER A..KAITHI LETTER AU +11103..11106 ; Vowel_Independent # Lo [4] CHAKMA LETTER AA..CHAKMA LETTER E +11183..11190 ; Vowel_Independent # Lo [14] SHARADA LETTER A..SHARADA LETTER AU +11680..11689 ; Vowel_Independent # Lo [10] TAKRI LETTER A..TAKRI LETTER AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Dependent + +# Dependent Vowels (contrasted with independent vowels and/or with complex placement) +# Matras (in Indic scripts) + +# [Not derivable] + +093A ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN OE +093B ; Vowel_Dependent # Mc DEVANAGARI VOWEL SIGN OOE +093E..0940 ; Vowel_Dependent # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II +0941..0948 ; Vowel_Dependent # Mn [8] DEVANAGARI VOWEL SIGN 
U..DEVANAGARI VOWEL SIGN AI +0949..094C ; Vowel_Dependent # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094E..094F ; Vowel_Dependent # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA E..DEVANAGARI VOWEL SIGN AW +0955..0957 ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Vowel_Dependent # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BE..09C0 ; Vowel_Dependent # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II +09C1..09C4 ; Vowel_Dependent # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09C7..09C8 ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +09CB..09CC ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +09D7 ; Vowel_Dependent # Mc BENGALI AU LENGTH MARK +09E2..09E3 ; Vowel_Dependent # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3E..0A40 ; Vowel_Dependent # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II +0A41..0A42 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A47..0A48 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0ABE..0AC0 ; Vowel_Dependent # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL SIGN II +0AC1..0AC5 ; Vowel_Dependent # Mn [5] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AC9 ; Vowel_Dependent # Mc GUJARATI VOWEL SIGN CANDRA O +0ACB..0ACC ; Vowel_Dependent # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0AE2..0AE3 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3E ; Vowel_Dependent # Mc ORIYA VOWEL SIGN AA +0B3F ; Vowel_Dependent # Mn ORIYA VOWEL SIGN I +0B40 ; Vowel_Dependent # Mc ORIYA VOWEL SIGN II +0B41..0B44 ; Vowel_Dependent # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN 
VOCALIC RR +0B47..0B48 ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI +0B4B..0B4C ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU +0B56 ; Vowel_Dependent # Mn ORIYA AI LENGTH MARK +0B57 ; Vowel_Dependent # Mc ORIYA AU LENGTH MARK +0B62..0B63 ; Vowel_Dependent # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BBE..0BBF ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC0 ; Vowel_Dependent # Mn TAMIL VOWEL SIGN II +0BC1..0BC2 ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BC6..0BC8 ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0BCA..0BCC ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0BD7 ; Vowel_Dependent # Mc TAMIL AU LENGTH MARK +0C3E..0C40 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C41..0C44 ; Vowel_Dependent # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C46..0C48 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI +0C4A..0C4C ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C55..0C56 ; Vowel_Dependent # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK +0C62..0C63 ; Vowel_Dependent # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBE ; Vowel_Dependent # Mc KANNADA VOWEL SIGN AA +0CBF ; Vowel_Dependent # Mn KANNADA VOWEL SIGN I +0CC0..0CC4 ; Vowel_Dependent # Mc [5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN VOCALIC RR +0CC6 ; Vowel_Dependent # Mn KANNADA VOWEL SIGN E +0CC7..0CC8 ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +0CCC ; Vowel_Dependent # Mn KANNADA VOWEL SIGN AU +0CD5..0CD6 ; Vowel_Dependent # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CE2..0CE3 ; Vowel_Dependent # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D3E..0D40 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN 
AA..MALAYALAM VOWEL SIGN II +0D41..0D44 ; Vowel_Dependent # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D46..0D48 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0D4A..0D4C ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0D57 ; Vowel_Dependent # Mc MALAYALAM AU LENGTH MARK +0D62..0D63 ; Vowel_Dependent # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DCF..0DD1 ; Vowel_Dependent # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD2..0DD4 ; Vowel_Dependent # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Vowel_Dependent # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0DD8..0DDF ; Vowel_Dependent # Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Vowel_Dependent # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Vowel_Dependent # Lo THAI CHARACTER SARA A +0E31 ; Vowel_Dependent # Mn THAI CHARACTER MAI HAN-AKAT +0E32..0E33 ; Vowel_Dependent # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E34..0E39 ; Vowel_Dependent # Mn [6] THAI CHARACTER SARA I..THAI CHARACTER SARA UU +0E40..0E45 ; Vowel_Dependent # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO +0E47 ; Vowel_Dependent # Mn THAI CHARACTER MAITAIKHU +0EB0 ; Vowel_Dependent # Lo LAO VOWEL SIGN A +0EB1 ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KAN +0EB2..0EB3 ; Vowel_Dependent # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0EB4..0EB9 ; Vowel_Dependent # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU +0EBB ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KON +0EC0..0EC4 ; Vowel_Dependent # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +0F71..0F7D ; Vowel_Dependent # Mn [13] TIBETAN VOWEL SIGN AA..TIBETAN VOWEL SIGN OO +0F80..0F81 ; Vowel_Dependent # Mn [2] TIBETAN VOWEL SIGN REVERSED I..TIBETAN VOWEL SIGN REVERSED II +102B..102C ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN TALL 
AA..MYANMAR VOWEL SIGN AA +102D..1030 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN UU +1031 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN E +1032..1035 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +1056..1057 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1058..1059 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1062 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1071..1074 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1083..1084 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E +1085..1086 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109C ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN AITON A +109D ; Vowel_Dependent # Mn MYANMAR VOWEL SIGN AITON AI +1712..1713 ; Vowel_Dependent # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U +1732..1733 ; Vowel_Dependent # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1752..1753 ; Vowel_Dependent # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U +1772..1773 ; Vowel_Dependent # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U +17B6 ; Vowel_Dependent # Mc KHMER VOWEL SIGN AA +17B7..17BD ; Vowel_Dependent # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL SIGN UA +17BE..17C5 ; Vowel_Dependent # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU +17C8 ; Vowel_Dependent # Mc KHMER SIGN YUUKALEAPINTU +1920..1922 ; Vowel_Dependent # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U +1923..1926 ; Vowel_Dependent # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU +1927..1928 ; Vowel_Dependent # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +19B0..19C0 ; Vowel_Dependent # Mc [17] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN IY +1A17..1A18 ; Vowel_Dependent # 
Mn [2] BUGINESE VOWEL SIGN I..BUGINESE VOWEL SIGN U +1A19..1A1B ; Vowel_Dependent # Mc [3] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN AE +1A61 ; Vowel_Dependent # Mc TAI THAM VOWEL SIGN A +1A62 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN MAI SAT +1A63..1A64 ; Vowel_Dependent # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A65..1A6C ; Vowel_Dependent # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW +1A6D..1A72 ; Vowel_Dependent # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI +1A73..1A74 ; Vowel_Dependent # Mn [2] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN MAI KANG +1B35 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN TEDUNG +1B36..1B3A ; Vowel_Dependent # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA +1B3B ; Vowel_Dependent # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +1B3C ; Vowel_Dependent # Mn BALINESE VOWEL SIGN LA LENGA +1B3D..1B41 ; Vowel_Dependent # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1B42 ; Vowel_Dependent # Mn BALINESE VOWEL SIGN PEPET +1B43 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN PEPET TEDUNG +1BA4..1BA5 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PANGHULU..SUNDANESE VOWEL SIGN PANYUKU +1BA6..1BA7 ; Vowel_Dependent # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL SIGN PANOLONG +1BA8..1BA9 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE7 ; Vowel_Dependent # Mc BATAK VOWEL SIGN E +1BE8..1BE9 ; Vowel_Dependent # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BEA..1BEC ; Vowel_Dependent # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BED ; Vowel_Dependent # Mn BATAK VOWEL SIGN KARO O +1BEE ; Vowel_Dependent # Mc BATAK VOWEL SIGN U +1BEF ; Vowel_Dependent # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +1C26..1C2B ; Vowel_Dependent # Mc [6] LEPCHA VOWEL SIGN AA..LEPCHA VOWEL SIGN UU +1C2C ; Vowel_Dependent # Mn LEPCHA VOWEL SIGN E +A823..A824 ; Vowel_Dependent # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI 
NAGRI VOWEL SIGN I +A825..A826 ; Vowel_Dependent # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E +A827 ; Vowel_Dependent # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Vowel_Dependent # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A947..A94E ; Vowel_Dependent # Mn [8] REJANG VOWEL SIGN I..REJANG VOWEL SIGN EA +A9B4..A9B5 ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9B6..A9B9 ; Vowel_Dependent # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BA..A9BB ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +A9BC ; Vowel_Dependent # Mn JAVANESE VOWEL SIGN PEPET +AA29..AA2E ; Vowel_Dependent # Mn [6] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN OE +AA2F..AA30 ; Vowel_Dependent # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA31..AA32 ; Vowel_Dependent # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE +AAB0 ; Vowel_Dependent # Mn TAI VIET MAI KANG +AAB1 ; Vowel_Dependent # Lo TAI VIET VOWEL AA +AAB2..AAB4 ; Vowel_Dependent # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U +AAB5..AAB6 ; Vowel_Dependent # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB7..AAB8 ; Vowel_Dependent # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AAB9..AABD ; Vowel_Dependent # Lo [5] TAI VIET VOWEL UEA..TAI VIET VOWEL AN +AABE ; Vowel_Dependent # Mn TAI VIET VOWEL AM +AAEB..AAEF ; Vowel_Dependent # Mc [5] MEETEI MAYEK VOWEL SIGN II..MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE5 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN ANAP +ABE6..ABE7 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE8 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +10A01..10A03 ; Vowel_Dependent # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R +10A05..10A06 ; Vowel_Dependent 
# Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O +10A0C ; Vowel_Dependent # Mn KHAROSHTHI VOWEL LENGTH MARK +11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +110B0..110B2 ; Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II +110B3..110B6 ; Vowel_Dependent # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI +110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11127..11132 ; Vowel_Dependent # Mn [12] CHAKMA VOWEL SIGN A..CHAKMA AU MARK +111B3..111BF ; Vowel_Dependent # Mn [13] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN AU +116AD..116B5 ; Vowel_Dependent # Mn [9] TAKRI VOWEL SIGN AA..TAKRI VOWEL SIGN AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel + +# (Other) Vowels (reanalyzed as ordinary alphabetic letters or marks) + +# [Not derivable] + +1963..196D ; Vowel # Lo [11] TAI LE LETTER A..TAI LE LETTER AI +A85E..A861 ; Vowel # Lo [4] PHAGS-PA LETTER I..PHAGS-PA LETTER O +A866 ; Vowel # Lo [1] PHAGS-PA LETTER EE +A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO +A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Placeholder + +# Consonant Placeholder +# This includes generic placeholders used for +# Indic script layout (NBSP and dotted circle), as well as a few script- +# specific vowel-holder characters which are not technically +# consonants, but serve instead as bases for placement of vowel marks. 
+ +# [Not derivable] + +00A0 ; Consonant_Placeholder # Zs NO-BREAK SPACE +0A72..0A73 ; Consonant_Placeholder # Lo [2] GURMUKHI IRI..GURMUKHI URA +1900 ; Consonant_Placeholder # Lo LIMBU VOWEL-CARRIER LETTER +25CC ; Consonant_Placeholder # So DOTTED CIRCLE + +# ================================================ + +# Indic_Syllabic_Category=Consonant + +# Consonant (ordinary abugida consonants, with inherent vowels) + +# [Not derivable] + +0915..0939 ; Consonant # Lo [35] DEVANAGARI LETTER KA..DEVANAGARI LETTER HA +0958..095F ; Consonant # Lo [8] DEVANAGARI LETTER QA..DEVANAGARI LETTER YYA +0979..097F ; Consonant # Lo [7] DEVANAGARI LETTER ZHA..DEVANAGARI LETTER BBA +0995..09A8 ; Consonant # Lo [20] BENGALI LETTER KA..BENGALI LETTER NA +09AA..09B0 ; Consonant # Lo [7] BENGALI LETTER PA..BENGALI LETTER RA +09B2 ; Consonant # Lo BENGALI LETTER LA +09B6..09B9 ; Consonant # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA +09DC..09DD ; Consonant # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA +09DF ; Consonant # Lo BENGALI LETTER YYA +09F0..09F1 ; Consonant # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH LOWER DIAGONAL +0A15..0A28 ; Consonant # Lo [20] GURMUKHI LETTER KA..GURMUKHI LETTER NA +0A2A..0A30 ; Consonant # Lo [7] GURMUKHI LETTER PA..GURMUKHI LETTER RA +0A32..0A33 ; Consonant # Lo [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA +0A35..0A36 ; Consonant # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA +0A38..0A39 ; Consonant # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA +0A59..0A5C ; Consonant # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA +0A5E ; Consonant # Lo GURMUKHI LETTER FA +0A95..0AA8 ; Consonant # Lo [20] GUJARATI LETTER KA..GUJARATI LETTER NA +0AAA..0AB0 ; Consonant # Lo [7] GUJARATI LETTER PA..GUJARATI LETTER RA +0AB2..0AB3 ; Consonant # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA +0AB5..0AB9 ; Consonant # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA +0B15..0B28 ; Consonant # Lo [20] ORIYA LETTER KA..ORIYA LETTER NA +0B2A..0B30 ; 
Consonant # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA +0B32..0B33 ; Consonant # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA +0B35..0B39 ; Consonant # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA +0B5C..0B5D ; Consonant # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA +0B5F ; Consonant # Lo ORIYA LETTER YYA +0B71 ; Consonant # Lo ORIYA LETTER WA +0B95 ; Consonant # Lo TAMIL LETTER KA +0B99..0B9A ; Consonant # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA +0B9C ; Consonant # Lo TAMIL LETTER JA +0B9E..0B9F ; Consonant # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA +0BA3..0BA4 ; Consonant # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA +0BA8..0BAA ; Consonant # Lo [3] TAMIL LETTER NA..TAMIL LETTER PA +0BAE..0BB9 ; Consonant # Lo [12] TAMIL LETTER MA..TAMIL LETTER HA +0C15..0C28 ; Consonant # Lo [20] TELUGU LETTER KA..TELUGU LETTER NA +0C2A..0C33 ; Consonant # Lo [10] TELUGU LETTER PA..TELUGU LETTER LLA +0C35..0C39 ; Consonant # Lo [5] TELUGU LETTER VA..TELUGU LETTER HA +0C58..0C59 ; Consonant # Lo [2] TELUGU LETTER TSA..TELUGU LETTER DZA +0C95..0CA8 ; Consonant # Lo [20] KANNADA LETTER KA..KANNADA LETTER NA +0CAA..0CB3 ; Consonant # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA +0CB5..0CB9 ; Consonant # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA +0CDE ; Consonant # Lo KANNADA LETTER FA +0D15..0D3A ; Consonant # Lo [38] MALAYALAM LETTER KA..MALAYALAM LETTER TTTA +0D9A..0DB1 ; Consonant # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA +0DB3..0DBB ; Consonant # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA +0DBD ; Consonant # Lo SINHALA LETTER DANTAJA LAYANNA +0DC0..0DC6 ; Consonant # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA +0E01..0E2E ; Consonant # Lo [46] THAI CHARACTER KO KAI..THAI CHARACTER NOKHUK +0E81..0E82 ; Consonant # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG +0E84 ; Consonant # Lo LAO LETTER KHO TAM +0E87..0E88 ; Consonant # Lo [2] LAO LETTER NGO..LAO LETTER CO +0E8A ; Consonant # Lo LAO LETTER SO TAM +0E8D ; Consonant # Lo LAO 
LETTER NYO +0E94..0E97 ; Consonant # Lo [4] LAO LETTER DO..LAO LETTER THO TAM +0E99..0E9F ; Consonant # Lo [7] LAO LETTER NO..LAO LETTER FO SUNG +0EA1..0EA3 ; Consonant # Lo [3] LAO LETTER MO..LAO LETTER LO LING +0EA5 ; Consonant # Lo LAO LETTER LO LOOT +0EA7 ; Consonant # Lo LAO LETTER WO +0EAA..0EAB ; Consonant # Lo [2] LAO LETTER SO SUNG..LAO LETTER HO SUNG +0EAD..0EAE ; Consonant # Lo [2] LAO LETTER O..LAO LETTER HO TAM +0EDC..0EDD ; Consonant # Lo [2] LAO HO NO..LAO HO MO +0F40..0F47 ; Consonant # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA +0F49..0F6C ; Consonant # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA +1000..1020 ; Consonant # Lo [33] MYANMAR LETTER KA..MYANMAR LETTER LLA +103F ; Consonant # Lo MYANMAR LETTER GREAT SA +1050..1051 ; Consonant # Lo [2] MYANMAR LETTER SHA..MYANMAR LETTER SSA +105A..105D ; Consonant # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE +1061 ; Consonant # Lo MYANMAR LETTER SGAW KAREN SHA +1065..1066 ; Consonant # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER WESTERN PWO KAREN PWA +106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA +1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA +108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA +1703..170C ; Consonant # Lo [10] TAGALOG LETTER KA..TAGALOG LETTER YA +170E..1711 ; Consonant # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1723..1731 ; Consonant # Lo [15] HANUNOO LETTER KA..HANUNOO LETTER HA +1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA +1763..176C ; Consonant # Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA +176E..1770 ; Consonant # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA +1780..17A2 ; Consonant # Lo [35] KHMER LETTER KA..KHMER LETTER QA +1901..191C ; Consonant # Lo [28] LIMBU LETTER KA..LIMBU LETTER HA +1950..1962 ; Consonant # Lo [19] TAI LE LETTER KA..TAI LE LETTER NA +1980..19AB ; Consonant # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI 
LUE LETTER LOW SUA +1A00..1A16 ; Consonant # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA +1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA +1A53..1A54 ; Consonant # Lo [2] TAI THAM LETTER LAE..TAI THAM LETTER GREAT SA +1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA +1B45..1B4B ; Consonant # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA +1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA +1BBB..1BBD ; Consonant # Lo [3] SUNDANESE LETTER REU..SUNDANESE LETTER BHA +1BC0..1BE3 ; Consonant # Lo [36] BATAK LETTER A..BATAK LETTER MBA +1C00..1C23 ; Consonant # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A +1C4D..1C4F ; Consonant # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA +A807..A80A ; Consonant # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO +A80C..A822 ; Consonant # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO +A840..A85D ; Consonant # Lo [30] PHAGS-PA LETTER KA..PHAGS-PA LETTER A +A862..A865 ; Consonant # Lo [4] PHAGS-PA LETTER QA..PHAGS-PA LETTER GGA +A869..A870 ; Consonant # Lo [8] PHAGS-PA LETTER TTA..PHAGS-PA LETTER ASPIRATED FA +A872 ; Consonant # Lo PHAGS-PA SUPERFIXED LETTER RA +A892..A8B3 ; Consonant # Lo [34] SAURASHTRA LETTER KA..SAURASHTRA LETTER LLA +A90A..A921 ; Consonant # Lo [24] KAYAH LI LETTER KA..KAYAH LI LETTER CA +A930..A946 ; Consonant # Lo [23] REJANG LETTER KA..REJANG LETTER A +A989..A98B ; Consonant # Lo [3] JAVANESE LETTER PA CEREK..JAVANESE LETTER NGA LELET RASWADI +A98F..A9B2 ; Consonant # Lo [34] JAVANESE LETTER KA..JAVANESE LETTER HA +AA06..AA28 ; Consonant # Lo [35] CHAM LETTER KA..CHAM LETTER HA +AA60..AA6F ; Consonant # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA +AA71..AA73 ; Consonant # Lo [3] MYANMAR LETTER KHAMTI XA..MYAMNAR LETTER KHAMTI RA +AA7A ; Consonant # Lo MYANMAR LETTER AITON RA +AA80..AAAF ; Consonant # Lo [48] TAI VIET 
LETTER LOW KO..TAI VIET LETTER HIGH O +AAE2..AAEA ; Consonant # Lo [9] MEETEI MAYEK LETTER CHA..MEETEI MAYEK LETTER SSA +ABC0..ABCD ; Consonant # Lo [14] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER HUK +ABD0 ; Consonant # Lo MEETEI MAYEK LETTER PHAM +ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTER BHAM +10A00 ; Consonant # Lo KHAROSHTHI LETTER A +10A10..10A13 ; Consonant # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA +10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA +10A19..10A33 ; Consonant # Lo [27] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER TTTHA +11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER OLD TAMIL NNNA +1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA +11107..11126 ; Consonant # Lo [32] CHAKMA LETTER KAA..CHAKMA LETTER HAA +11191..111B2 ; Consonant # Lo [34] SHARADA LETTER KA..SHARADA LETTER HA +1168A..116AA ; Consonant # Lo [34] TAKRI LETTER KA..TAKRI LETTER RRA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Dead + +# Dead Consonant (special consonant with killed vowel) + +# [Not derivable] + +09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Repha + +# Repha Form of RA (reanalyzed in some scripts) + +# [Not derivable] + +0D4E ; Consonant_Repha # Lo MALAYALAM LETTER DOT REPH +17CC ; Consonant_Repha # Mn KHMER SIGN ROBAT +1B03 ; Consonant_Repha # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Repha # Mn SUNDANESE SIGN PANGLAYAR +A982 ; Consonant_Repha # Mn JAVANESE SIGN LAYAR + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Subjoined + +# Subjoined Consonant (C2 form subtending a base consonant in Tibetan, etc.) 
+ +# [Not derivable] + +0F8D..0F97 ; Consonant_Subjoined # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Consonant_Subjoined # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +1929..192B ; Consonant_Subjoined # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1BA1 ; Consonant_Subjoined # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA2..1BA3 ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BAC..1BAD ; Consonant_Subjoined # Mc [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C24..1C25 ; Consonant_Subjoined # Mc [2] LEPCHA SUBJOINED LETTER YA..LEPCHA SUBJOINED LETTER RA +A867..A868 ; Consonant_Subjoined # Lo [2] PHAGS-PA SUBJOINED LETTER WA..PHAGS-PA SUBJOINED LETTER YA +A871 ; Consonant_Subjoined # Lo PHAGS-PA SUBJOINED LETTER RA +A9BD ; Consonant_Subjoined # Mc JAVANESE CONSONANT SIGN KERET + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Medial + +# Medial Consonant (medial liquid, occurring in clusters) + +# [Not derivable] + +0A75 ; Consonant_Medial # Mn GURMUKHI SIGN YAKASH +0EBC ; Consonant_Medial # Mn LAO SEMIVOWEL SIGN LO +0EBD ; Consonant_Medial # Lo LAO SEMIVOWEL SIGN NYO +103B..103C ; Consonant_Medial # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA +103D..103E ; Consonant_Medial # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +105E..1060 ; Consonant_Medial # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Consonant_Medial # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +1A55 ; Consonant_Medial # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A56 ; Consonant_Medial # Mn TAI THAM CONSONANT SIGN MEDIAL LA +A9BE..A9BF ; Consonant_Medial # Mc JAVANESE CONSONANT SIGN PENGKAL..JAVANESE CONSONANT SIGN CAKRA +AA33..AA34 ; Consonant_Medial # Mc [2] CHAM CONSONANT SIGN YA..CHAM 
CONSONANT SIGN RA +AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Final + +# Final Consonant (special final forms which do not take vowels) + +# [Not derivable] + +1930..1931 ; Consonant_Final # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Consonant_Final # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B +1A57 ; Consonant_Final # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A58..1A5E ; Consonant_Final # Mn [7] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN SA +1BBE..1BBF ; Consonant_Final # Lo [2] SUNDANESE LETTER FINAL K..SUNDANESE LETTER FINAL M +1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H +1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +A8B4 ; Consonant_Final # Mc SAURASHTRA CONSONANT SIGN HAARU +A94F..A951 ; Consonant_Final # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A952 ; Consonant_Final # Mc REJANG CONSONANT SIGN H +AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG +AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG +AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS +AA4C ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL M +AA4D ; Consonant_Final # Mc CHAM CONSONANT SIGN FINAL H +ABDB..ABE2 ; Consonant_Final # Lo [8] MEETEI MAYEK LETTER KOK LONSUM..MEETEI MAYEK LETTER I LONSUM + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Head_Letter + +# Head Letter (Tibetan) + +# [Not derivable] + +0F88..0F8C ; Consonant_Head_Letter # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN + +# ================================================ + +# Indic_Syllabic_Category=Modifying_Letter + +# Reanalyzed 
letters not participating in the abugida structure, but +# serving to modify the sound of an adjacent vowel or consonant. +# Note that this is not the same as General_Category=Modifier_Letter. + +# [Not derivable] + +0B83 ; Modifying_Letter # Lo TAMIL SIGN VISARGA (aytham) + +# ================================================ + +# Indic_Syllabic_Category=Tone_Letter + +# Tone Letter (spacing lexical tone mark with status as a letter) + +# [Not derivable] + +1970..1974 ; Tone_Letter # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6 +AAC0 ; Tone_Letter # Lo TAI VIET TONE MAI NUENG +AAC2 ; Tone_Letter # Lo TAI VIET TONE MAI SONG + +# ================================================ + +# Indic_Syllabic_Category=Tone_Mark + +# Tone Mark (nonspacing or spacing lexical tone mark) +# Excludes Vedic tone marks, which are more akin to cantillation marks. + +# [Not derivable] + +0E48..0E4B ; Tone_Mark # Mn [4] THAI CHARACTER MAI EK..THAI CHARACTER MAI CHATTAWA +0EC8..0ECB ; Tone_Mark # Mn [4] LAO TONE MAI EK..LAO TONE MAI CATAWA +1037 ; Tone_Mark # Mn MYANMAR SIGN DOT BELOW +1063..1064 ; Tone_Mark # Mc [2] MYANMAR TONE MARK SGAW KAREN HATHI..MYANMAR TONE MARK SGAW KAREN KE PHO +1069..106D ; Tone_Mark # Mc [5] MYANMAR SIGN WESTERN PWO KAREN TONE-1..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1087..108C ; Tone_Mark # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108D ; Tone_Mark # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +108F ; Tone_Mark # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109B ; Tone_Mark # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 +19C8..19C9 ; Tone_Mark # Mc [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A75..1A79 ; Tone_Mark # Mn [5] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN TONE-5 +A92B..A92D ; Tone_Mark # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +AA7B ; Tone_Mark # Mc MYANMAR SIGN PAO KAREN TONE +AABF ; Tone_Mark # Mn TAI VIET TONE MAI EK +AAC1 ; Tone_Mark # Mn TAI VIET TONE MAI THO +ABEC ; 
Tone_Mark # Mc MEETEI MAYEK LUM IYEK + +# ================================================ + +# Indic_Syllabic_Category=Register_Shifter + +# Register Shifter (shifts register for consonants, akin to a tone mark) + +# [Not derivable] + +17C9..17CA ; Register_Shifter # Mn [2] KHMER SIGN MUUSIKATOAN..KHMER SIGN TRIISAP + +# EOF diff --git a/data/6.2.0-indic-positional-category.txt b/data/6.2.0-indic-positional-category.txt new file mode 100644 index 0000000..03a043e --- /dev/null +++ b/data/6.2.0-indic-positional-category.txt @@ -0,0 +1,446 @@ +# IndicMatraCategory-6.2.0.txt +# Date: 2012-05-15, 21:10:00 GMT [KW] +# +# Unicode Character Database +# Copyright (c) 1991-2012 Unicode, Inc. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# For documentation, see UAX #44. +# +# This file defines the following provisional property: +# +# Indic_Matra_Category enumerated property +# +# NB: Provisional properties and data files have no associated stability +# guarantees. They are provided in part to determine the possible usefulness +# of a property or other data and to encourage analysis and further investigation +# which may result in their improvement. Provisional properties and +# data files may change arbitrarily, or may even be removed in a future version of the +# Unicode Character Database, if they prove not to be useful. +# +# Scope: This provisional property is aimed at the problem of +# the specification of syllabic structure for Indic scripts. +# Because dependent vowels (and visible viramas, where they occur) +# are placed in notional slots around the consonant (or consonant +# cluster) core of an Indic syllable, there may be cooccurrence +# constraints or other interactions. Also, it may be desirable, +# in cases where more than one dependent vowel may occur in +# sequence, as for example, in a top slot and a bottom slot, to +# specify preferred orders for spelling. 
As such, this property +# is designed primarily to supplement the Indic_Syllabic_Category +# property. +# +# Note that this provisional property is *not* intended as +# a prescriptive property regarding display or font design, +# for a number of reasons. Good font design requires information +# that is outside the context of a character encoding standard, +# and is best handled in other venues. For Indic dependent +# vowels, in particular: +# +# 1. Matra placement may vary somewhat based on typeface design. +# 2. Matra placement, even within a single script, may vary +# somewhat according to historic period or local conventions. +# 3. Matra placement may be changed by explicit orthographic reform +# decisions. +# 4. Matras may ligate in various ways with a consonant (or even +# other elements of a syllable) instead of occurring in a +# discrete location. +# 4. Matra display may be contextually determined. This is +# notable, for example, in the Tamil script, where the shape +# and placement of -u and -uu vowels depends strongly on +# which consonant they adjoin. +# +# Format: +# Field 0 Code Point or Code Point Range +# Field 1 Indic_Matra_Category +# +# A comment field shows General_Category property values and character names. +# +# The scripts assessed as containing dependent vowels or viramas in the +# structural sense used for the Indic_Matra_Category are: +# +# Devanagari, Bengali, Gurmukhi, Gujarati, Oriya, Tamil, Telugu, +# Kannada, Malayalam, Sinhala, Thai, Lao, Tibetan, Myanmar, +# Tagalog, Hanunoo, Buhid, Tagbanwa, Khmer, Limbu, New Tai Lue, +# Buginese, Tai Tham, Balinese, Sundanese, Batak, Lepcha, +# Syloti Nagri, Saurashtra, Rejang, Javanese, Cham, Tai Viet, +# Meetei Mayek, Kharoshthi, Brahmi, Kaithi, Chakma, Sharada, Takri +# +# All characters for all other scripts not in that list +# take the default value for this property. 
+# +# See IndicSyllabicCategory.txt for a slightly more extended +# list of Indic scripts, including those which do not have +# dependent vowel characters. Currently, those additional +# Indic scripts without dependent vowel characters are +# Tai Le, Phags-pa, and Kayah Li. +# + +# ================================================ + +# Property: Indic_Matra_Category +# +# All code points not explicitly listed for Indic_Matra_Category +# have the value NA (Not_Applicable). +# +# @missing: 0000..10FFFF; NA + +# Only Indic dependent vowels (Indic_Syllabic_Category=Vowel_Dependent) +# and viramas (Indic_Syllabic_Category=Virama) +# have a non-default value for this property. + +# ------------------------------------------------ + +# Indic_Matra_Category=Right + +093B ; Right # Mc DEVANAGARI VOWEL SIGN OOE +093E ; Right # Mc DEVANAGARI VOWEL SIGN AA +0940 ; Right # Mc DEVANAGARI VOWEL SIGN II +0949..094C ; Right # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094F ; Right # Mc DEVANAGARI VOWEL SIGN AW +09BE ; Right # Mc BENGALI VOWEL SIGN AA +09C0 ; Right # Mc BENGALI VOWEL SIGN II +09D7 ; Right # Mc BENGALI AU LENGTH MARK +0A3E ; Right # Mc GURMUKHI VOWEL SIGN AA +0A40 ; Right # Mc GURMUKHI VOWEL SIGN II +0ABE ; Right # Mc GUJARATI VOWEL SIGN AA +0AC0 ; Right # Mc GUJARATI VOWEL SIGN II +0ACB..0ACC ; Right # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0B3E ; Right # Mc ORIYA VOWEL SIGN AA +0B40 ; Right # Mc ORIYA VOWEL SIGN II +0BBE..0BBF ; Right # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BD7 ; Right # Mc TAMIL AU LENGTH MARK +0C41..0C44 ; Right # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0CBE ; Right # Mc KANNADA VOWEL SIGN AA +0CC1..0CC4 ; Right # Mc [4] KANNADA VOWEL SIGN U..KANNADA VOWEL SIGN VOCALIC RR +0CD5..0CD6 ; Right # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0D3E..0D40 ; Right # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D42 ; Right # Mn [2] MALAYALAM VOWEL SIGN U..MALAYALAM 
VOWEL SIGN UU +# Note: U and UU form complex ligatures with consonants in older Malayalam orthography +0D57 ; Right # Mc MALAYALAM AU LENGTH MARK +0DCF..0DD1 ; Right # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD8 ; Right # Mc SINHALA VOWEL SIGN GAETTA-PILLA +0DDF ; Right # Mc SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Right # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Right # Lo THAI CHARACTER SARA A +0E32..0E33 ; Right # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E45 ; Right # Lo THAI CHARACTER LAKKHANGYAO +0EB0 ; Right # Lo LAO VOWEL SIGN A +0EB2..0EB3 ; Right # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +102B..102C ; Right # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +1056..1057 ; Right # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1062 ; Right # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Right # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1083 ; Right # Mc MYANMAR VOWEL SIGN SHAN AA +109C ; Right # Mc MYANMAR VOWEL SIGN AITON A +17B6 ; Right # Mc KHMER VOWEL SIGN AA +17C8 ; Right # Mc KHMER SIGN YUUKALEAPINTU +1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI +19B0..19B4 ; Right # Mc [5] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN UU +19B8..19B9 ; Right # Mc [2] NEW TAI LUE VOWEL SIGN OA..NEW TAI LUE VOWEL SIGN UE +19BB..19C0 ; Right # Mc [6] NEW TAI LUE VOWEL SIGN AAY..NEW TAI LUE VOWEL SIGN IY +1A1A ; Right # Mc BUGINESE VOWEL SIGN O +1A61 ; Right # Mc TAI THAM VOWEL SIGN A +1A63..1A64 ; Right # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A6D ; Right # Mc TAI THAM VOWEL SIGN OY +1B35 ; Right # Mc BALINESE VOWEL SIGN TEDUNG +1B44 ; Right # Mc BALINESE ADEG ADEG +1BA7 ; Right # Mc SUNDANESE VOWEL SIGN PANOLONG +1BAA ; Right # Mc SUNDANESE SIGN PAMAAEH +1BF2..1BF3 ; Right # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +1C26 ; 
Right # Mc LEPCHA VOWEL SIGN AA +1C2A..1C2B ; Right # Mc [2] LEPCHA VOWEL SIGN U..LEPCHA VOWEL SIGN UU +A823..A824 ; Right # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A827 ; Right # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Right # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A953 ; Right # Mc REJANG VIRAMA +A9B4..A9B5 ; Right # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +AAB1 ; Right # Lo TAI VIET VOWEL AA +AABA ; Right # Lo TAI VIET VOWEL UA +AABD ; Right # Lo TAI VIET VOWEL AN +AAEF ; Right # Mc MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE6..ABE7 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE9..ABEA ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +110B0 ; Right # Mc KAITHI VOWEL SIGN AA +110B2 ; Right # Mc KAITHI VOWEL SIGN II +110B7..110B8 ; Right # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +111B3 ; Right # Mc SHARADA VOWEL SIGN AA +111B5 ; Right # Mc SHARADA VOWEL SIGN II +111C0 ; Right # Mc SHARADA SIGN VIRAMA +116AF ; Right # Mc TAKRI VOWEL SIGN II + +# Indic_Matra_Category=Left + +093F ; Left # Mc DEVANAGARI VOWEL SIGN I +094E ; Left # Mc DEVANAGARI VOWEL SIGN PRISHTHAMATRA E +09BF ; Left # Mc BENGALI VOWEL SIGN I +09C7..09C8 ; Left # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +0A3F ; Left # Mc GURMUKHI VOWEL SIGN I +0ABF ; Left # Mc GUJARATI VOWEL SIGN I +0B47 ; Left # Mc ORIYA VOWEL SIGN E +0BC6..0BC8 ; Left # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0D46..0D48 ; Left # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0DD9 ; Left # Mc SINHALA VOWEL SIGN KOMBUVA +0DDB ; Left # Mc SINHALA VOWEL SIGN KOMBU DEKA +1031 ; Left # Mc MYANMAR VOWEL SIGN E +1084 ; Left # Mc MYANMAR VOWEL SIGN SHAN E +17C1..17C3 ; Left # Mc [3] KHMER VOWEL SIGN E..KHMER VOWEL SIGN AI +19B5..19B7 ; Left # Mc [3] NEW TAI LUE VOWEL SIGN E..NEW TAI LUE VOWEL SIGN 
O +19BA ; Left # Mc NEW TAI LUE VOWEL SIGN AY +1A19 ; Left # Mc BUGINESE VOWEL SIGN E +1A1B ; Left # Mc BUGINESE VOWEL SIGN AE +1A6E..1A72 ; Left # Mc [5] TAI THAM VOWEL SIGN E..TAI THAM VOWEL SIGN THAM AI +1B3E..1B3F ; Left # Mc [2] BALINESE VOWEL SIGN TALING..BALINESE VOWEL SIGN TALING REPA +1BA6 ; Left # Mc SUNDANESE VOWEL SIGN PANAELAENG +1C27..1C28 ; Left # Mc [2] LEPCHA VOWEL SIGN I..LEPCHA VOWEL SIGN O +A9BA..A9BB ; Left # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +AA2F..AA30 ; Left # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AAEB ; Left # Mc MEETEI MAYEK VOWEL SIGN II +AAEE ; Left # Mc MEETEI MAYEK VOWEL SIGN AU +110B1 ; Left # Mc KAITHI VOWEL SIGN I +1112C ; Left # Mc CHAKMA VOWEL SIGN E +111B4 ; Left # Mc SHARADA VOWEL SIGN I +116AE ; Left # Mc TAKRI VOWEL SIGN I + +# Indic_Matra_Category=Visual_Order_Left + +# These are dependent vowels that occur to the left of the consonant +# letter in a syllable, but which occur in scripts using the visual order +# model, instead of the logical order model. Because of the different +# model, these left-side vowels occur first in the backing store (before +# the consonant letter) and are not reordered during text rendering. 
+# +# [Derivation: Logical_Order_Exception=True] + +0E40..0E44 ; Visual_Order_Left # Lo [5] THAI CHARACTER SARA E..THAI CHARACTER SARA AI MAIMALAI +0EC0..0EC4 ; Visual_Order_Left # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +AAB5..AAB6 ; Visual_Order_Left # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB9 ; Visual_Order_Left # Lo TAI VIET VOWEL UEA +AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL AY + +# Indic_Matra_Category=Left_And_Right + +09CB..09CC ; Left_And_Right # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +0B4B ; Left_And_Right # Mc ORIYA VOWEL SIGN O +0BCA..0BCC ; Left_And_Right # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0D4A..0D4C ; Left_And_Right # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0DDC..0DDE ; Left_And_Right # Mc [3] SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA..SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA +17C0 ; Left_And_Right # Mc KHMER VOWEL SIGN IE +17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU +1B40..1B41 ; Left_And_Right # Mc [2] BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG + +# Indic_Matra_Category=Top + +093A ; Top # Mn DEVANAGARI VOWEL SIGN OE +0945..0948 ; Top # Mn [4] DEVANAGARI VOWEL SIGN CANDRA E..DEVANAGARI VOWEL SIGN AI +0955 ; Top # Mn DEVANAGARI VOWEL SIGN CANDRA LONG E +0A47..0A48 ; Top # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Top # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0AC5 ; Top # Mn GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Top # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0B3F ; Top # Mn ORIYA VOWEL SIGN I +0B56 ; Top # Mn ORIYA AI LENGTH MARK +0BC0 ; Top # Mn TAMIL VOWEL SIGN II +0BCD ; Top # Mn TAMIL SIGN VIRAMA +0C3E..0C40 ; Top # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C46..0C47 ; Top # Mn [2] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN EE +0C4A..0C4C ; Top # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C4D ; Top # Mn TELUGU SIGN VIRAMA 
+0C55 ; Top # Mn TELUGU LENGTH MARK +0CBF ; Top # Mn KANNADA VOWEL SIGN I +0CC6 ; Top # Mn KANNADA VOWEL SIGN E +0CCC ; Top # Mn KANNADA VOWEL SIGN AU +0CCD ; Top # Mn KANNADA SIGN VIRAMA +0D4D ; Top # Mn MALAYALAM SIGN VIRAMA +0DCA ; Top # Mn SINHALA SIGN AL-LAKUNA +0DD2..0DD3 ; Top # Mn [2] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN DIGA IS-PILLA +0E31 ; Top # Mn THAI CHARACTER MAI HAN-AKAT +0E34..0E37 ; Top # Mn [4] THAI CHARACTER SARA I..THAI CHARACTER SARA UEE +0E47 ; Top # Mn THAI CHARACTER MAITAIKHU +0E4E ; Top # Mn THAI CHARACTER YAMAKKAN +0EB1 ; Top # Mn LAO VOWEL SIGN MAI KAN +0EB4..0EB7 ; Top # Mn [4] LAO VOWEL SIGN I..LAO VOWEL SIGN YY +0EBB ; Top # Mn LAO VOWEL SIGN MAI KON +0F72 ; Top # Mn TIBETAN VOWEL SIGN I +0F7A..0F7D ; Top # Mn [4] TIBETAN VOWEL SIGN E..TIBETAN VOWEL SIGN OO +0F80 ; Top # Mn TIBETAN VOWEL SIGN REVERSED I +102D..102E ; Top # Mn [2] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN II +1032..1035 ; Top # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +103A ; Top # Mn MYANMAR SIGN ASAT +1071..1074 ; Top # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1085..1086 ; Top # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109D ; Top # Mn MYANMAR VOWEL SIGN AITON AI +1712 ; Top # Mn TAGALOG VOWEL SIGN I +1732 ; Top # Mn HANUNOO VOWEL SIGN I +1752 ; Top # Mn BUHID VOWEL SIGN I +1772 ; Top # Mn TAGBANWA VOWEL SIGN I +17B7..17BA ; Top # Mn [4] KHMER VOWEL SIGN I..KHMER VOWEL SIGN YY +17D1 ; Top # Mn KHMER SIGN VIRIAM +1920..1921 ; Top # Mn [2] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN I +1927..1928 ; Top # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +1A17 ; Top # Mn BUGINESE VOWEL SIGN I +1A62 ; Top # Mn TAI THAM VOWEL SIGN MAI SAT +1A65..1A68 ; Top # Mn [4] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN UUE +1A6B ; Top # Mn TAI THAM VOWEL SIGN O +1A73..1A74 ; Top # Mn [2] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN MAI KANG +1B36..1B37 ; Top # Mn [2] BALINESE VOWEL SIGN ULU..BALINESE VOWEL 
SIGN ULU SARI +1B42 ; Top # Mn BALINESE VOWEL SIGN PEPET +1BA4 ; Top # Mn SUNDANESE VOWEL SIGN PANGHULU +1BA8..1BA9 ; Top # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +A806 ; Top # Mn SYLOTI NAGRI SIGN HASANTA +A826 ; Top # Mn SYLOTI NAGRI VOWEL SIGN E +A94A ; Top # Mn REJANG VOWEL SIGN AI +A9B6..A9B7 ; Top # Mn [2] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN WULU MELIK +A9BC ; Top # Mn JAVANESE VOWEL SIGN PEPET +AA29..AA2C ; Top # Mn [4] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN EI +AA2E ; Top # Mn CHAM VOWEL SIGN OE +AA31 ; Top # Mn CHAM VOWEL SIGN AU +AAB0 ; Top # Mn TAI VIET MAI KANG +AAB2..AAB3 ; Top # Mn [2] TAI VIET VOWEL I..TAI VIET VOWEL UE +AAB7..AAB8 ; Top # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AABE ; Top # Mn TAI VIET VOWEL AM +AAED ; Top # Mn MEETEI MAYEK VOWEL SIGN AAI +ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP +10A05 ; Top # Mn KHAROSHTHI VOWEL SIGN E +11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II +11042..11045 ; Top # Mn [4] BRAHMI VOWEL SIGN E..BRAHMI VOWEL SIGN AU +11046 ; Top # Mn BRAHMI VIRAMA +110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI VOWEL SIGN AI +11127..11129 ; Top # Mn [3] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN II +1112D ; Top # Mn CHAKMA VOWEL SIGN AI +11130 ; Top # Mn CHAKMA VOWEL SIGN OI +11134 ; Top # Mn CHAKMA MAAYYAA +111BC..111BE ; Top # Mn [3] SHARADA VOWEL SIGN E..SHARADA VOWEL SIGN O +116AD ; Top # Mn TAKRI VOWEL SIGN AA +116B2..116B5 ; Top # Mn [4] TAKRI VOWEL SIGN E..TAKRI VOWEL SIGN AU +116B6 ; Top # Mn TAKRI SIGN VIRAMA + +# Indic_Matra_Category=Bottom + +0941..0944 ; Bottom # Mn [4] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN VOCALIC RR +094D ; Bottom # Mn DEVANAGARI SIGN VIRAMA +0956..0957 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN UE..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09C1..09C4 ; Bottom # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09CD ; Bottom # 
Mn BENGALI SIGN VIRAMA +09E2..09E3 ; Bottom # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A41..0A42 ; Bottom # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A4D ; Bottom # Mn GURMUKHI SIGN VIRAMA +0AC1..0AC4 ; Bottom # Mn [4] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN VOCALIC RR +0ACD ; Bottom # Mn GUJARATI SIGN VIRAMA +0AE2..0AE3 ; Bottom # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B4D ; Bottom # Mn ORIYA SIGN VIRAMA +0B62..0B63 ; Bottom # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BC1..0BC2 ; Bottom # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +# Note: U and UU have contextually variable placement in Tamil. +0C56 ; Bottom # Mn TELUGU AI LENGTH MARK +0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CE2..0CE3 ; Bottom # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D43..0D44 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC R..MALAYALAM VOWEL SIGN VOCALIC RR +0D62..0D63 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DD4 ; Bottom # Mn SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Bottom # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0E38..0E39 ; Bottom # Mn [2] THAI CHARACTER SARA U..THAI CHARACTER SARA UU +0E3A ; Bottom # Mn THAI CHARACTER PHINTHU +0EB8..0EB9 ; Bottom # Mn [2] LAO VOWEL SIGN U..LAO VOWEL SIGN UU +0F71 ; Bottom # Mn TIBETAN VOWEL SIGN AA +0F74..0F75 ; Bottom # Mn [2] TIBETAN VOWEL SIGN U..TIBETAN VOWEL SIGN UU +0F84 ; Bottom # Mn TIBETAN MARK HALANTA +102F..1030 ; Bottom # Mn [2] MYANMAR VOWEL SIGN U..MYANMAR VOWEL SIGN UU +1058..1059 ; Bottom # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1713 ; Bottom # Mn TAGALOG VOWEL SIGN U +1714 ; Bottom # Mn TAGALOG SIGN VIRAMA +1733 ; Bottom # Mn HANUNOO VOWEL SIGN U +1734 ; Bottom # Mn HANUNOO SIGN PAMUDPOD +1753 ; Bottom # Mn BUHID 
VOWEL SIGN U +1773 ; Bottom # Mn TAGBANWA VOWEL SIGN U +17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA +1922 ; Bottom # Mn LIMBU VOWEL SIGN U +1A18 ; Bottom # Mn BUGINESE VOWEL SIGN U +1A69..1A6A ; Bottom # Mn [2] TAI THAM VOWEL SIGN U..TAI THAM VOWEL SIGN UU +1A6C ; Bottom # Mn TAI THAM VOWEL SIGN OA BELOW +1B38..1B3A ; Bottom # Mn [3] BALINESE VOWEL SIGN SUKU..BALINESE VOWEL SIGN RA REPA +1BA5 ; Bottom # Mn SUNDANESE VOWEL SIGN PANYUKU +1C2C ; Bottom # Mn LEPCHA VOWEL SIGN E +A825 ; Bottom # Mn SYLOTI NAGRI VOWEL SIGN U +A8C4 ; Bottom # Mn SAURASHTRA SIGN VIRAMA +A947..A949 ; Bottom # Mn [3] REJANG VOWEL SIGN I..REJANG VOWEL SIGN E +A94B..A94E ; Bottom # Mn [4] REJANG VOWEL SIGN O..REJANG VOWEL SIGN EA +A9B8..A9B9 ; Bottom # Mn [2] JAVANESE VOWEL SIGN SUKU..JAVANESE VOWEL SIGN SUKU MENDUT +AA2D ; Bottom # Mn CHAM VOWEL SIGN U +AA32 ; Bottom # Mn CHAM VOWEL SIGN UE +AAB4 ; Bottom # Mn TAI VIET VOWEL U +AAEC ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UU +ABE8 ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK +10A02..10A03 ; Bottom # Mn [2] KHAROSHTHI VOWEL SIGN U..KHAROSHTHI VOWEL SIGN VOCALIC R +10A0C ; Bottom # Mn KHAROSHTHI VOWEL LENGTH MARK +1103C..11041 ; Bottom # Mn [6] BRAHMI VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL +110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU +110B9 ; Bottom # Mn KAITHI SIGN VIRAMA +1112A..1112B ; Bottom # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU +11131..11132 ; Bottom # Mn [2] CHAKMA O MARK..CHAKMA AU MARK +111B6..111BB ; Bottom # Mn [6] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN VOCALIC LL +116B0..116B1 ; Bottom # Mn [2] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN UU + +# Indic_Matra_Category=Top_And_Bottom + +0C48 ; Top_And_Bottom # Mn TELUGU VOWEL SIGN AI +0F73 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN II +0F76..0F79 ; Top_And_Bottom # Mn [4] TIBETAN VOWEL SIGN VOCALIC R..TIBETAN VOWEL SIGN VOCALIC LL +0F81 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN REVERSED 
II +1B3C ; Top_And_Bottom # Mn BALINESE VOWEL SIGN LA LENGA +1112E..1112F ; Top_And_Bottom # Mn [2] CHAKMA VOWEL SIGN O..CHAKMA VOWEL SIGN AU + +# Indic_Matra_Category=Top_And_Right + +0AC9 ; Top_And_Right # Mc GUJARATI VOWEL SIGN CANDRA O +0B57 ; Top_And_Right # Mc ORIYA AU LENGTH MARK +0CC0 ; Top_And_Right # Mc KANNADA VOWEL SIGN II +0CC7..0CC8 ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +1925..1926 ; Top_And_Right # Mc [2] LIMBU VOWEL SIGN OO..LIMBU VOWEL SIGN AU +1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG +111BF ; Top_And_Right # Mc SHARADA VOWEL SIGN AU + +# Indic_Matra_Category=Top_And_Left + +0B48 ; Top_And_Left # Mc ORIYA VOWEL SIGN AI +0DDA ; Top_And_Left # Mc SINHALA VOWEL SIGN DIGA KOMBUVA +17BE ; Top_And_Left # Mc KHMER VOWEL SIGN OE +1C29 ; Top_And_Left # Mc LEPCHA VOWEL SIGN OO + +# Indic_Matra_Category=Top_And_Left_And_Right + +0B4C ; Top_And_Left_And_Right # Mc ORIYA VOWEL SIGN AU +17BF ; Top_And_Left_And_Right # Mc KHMER VOWEL SIGN YA + +# Indic_Matra_Category=Bottom_And_Right + +1B3B ; Bottom_And_Right # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +A9C0 ; Bottom_And_Right # Mc JAVANESE PANGKON + +# Indic_Matra_Category=Top_And_Bottom_And_Right + +1B3D ; Top_And_Bottom_And_Right # Mc BALINESE VOWEL SIGN LA LENGA TEDUNG + +# Indic_Matra_Category=Overstruck + +10A01 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN I +10A06 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN O + +# Indic_Matra_Category=Invisible + +# The Invisible category refers to viramas for certain script +# which are used only to control consonant stacking or cluster +# formation, and which have no visible display on their own. 
+ +1039 ; Invisible # Mn MYANMAR SIGN VIRAMA +17D2 ; Invisible # Mn KHMER SIGN COENG +1A60 ; Invisible # Mn TAI THAM SIGN SAKOT +AAF6 ; Invisible # Mn MEETEI MAYEK VIRAMA +10A3F ; Invisible # Mn KHAROSHTHI VIRAMA +11133 ; Invisible # Mn CHAKMA VIRAMA + +# EOF diff --git a/data/6.2.0-indic-syllabic-category.txt b/data/6.2.0-indic-syllabic-category.txt new file mode 100644 index 0000000..fd03ea3 --- /dev/null +++ b/data/6.2.0-indic-syllabic-category.txt @@ -0,0 +1,796 @@ +# IndicSyllabicCategory-6.2.0.txt +# Date: 2012-05-15, 21:12:00 GMT [KW] +# +# Unicode Character Database +# Copyright (c) 1991-2012 Unicode, Inc. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# For documentation, see UAX #44. +# +# This file defines the following provisional property: +# +# Indic_Syllabic_Category enumerated property +# +# NB: Provisional properties and data files have no associated stability +# guarantees. They are provided in part to determine the possible usefulness +# of a property or other data and to encourage analysis and further investigation +# which may result in their improvement. Provisional properties and +# data files may change arbitrarily, or may even be removed in a future version of the +# Unicode Character Database, if they prove not to be useful. +# +# Scope: This provisional property is aimed at two general problem +# areas involving the analysis and processing of Indic scripts: +# +# 1. Specification of syllabic structure. +# 2. Specification of segmentation rules. +# +# Both of these problem areas may benefit from having defined subtypes +# of Indic script characters which are relevant to how Indic +# syllables (or aksaras) are constructed. Note that rules for +# syllabic structure in Indic scripts may differ significantly +# from how phonological syllables are defined. 
+# +# Format: +# Field 0 Code Point or Code Point Range +# Field 1 Indic_Syllabic_Category +# +# A comment field shows General_Category property values and character names. +# +# The scripts assessed as Indic in the +# structural sense used for the Indic_Syllabic_Category are: +# +# Devanagari, Bengali, Gurmukhi, Gujarati, Oriya, Tamil, Telugu, +# Kannada, Malayalam, Sinhala, Thai, Lao, Tibetan, Myanmar, +# Tagalog, Hanunoo, Buhid, Tagbanwa, Khmer, Limbu, Tai Le, New Tai Lue, +# Buginese, Tai Tham, Balinese, Sundanese, Batak, Lepcha, +# Syloti Nagri, Phags-Pa, Saurashtra, Kayah Li, Rejang, Javanese, Cham, Tai Viet, +# Meetei Mayek, Kharoshthi, Brahmi, Kaithi, Chakma, Sharada, Takri +# +# All characters for all other scripts not in that list +# take the default value for this property, unless they +# are individually listed in this data file. +# + +# ================================================ + +# Property: Indic_Syllabic_Category +# +# All code points not explicitly listed for Indic_Syllabic_Category +# have the value Other. +# +# @missing: 0000..10FFFF; Other + +# ================================================ + +# Indic_Syllabic_Category=Bindu + +# Bindu/Anusvara (nasalization or -n) +# Excludes various Vedic nasalization signs. 
+ +# [Not derivable] + +0900..0902 ; Bindu # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +0981 ; Bindu # Mn BENGALI SIGN CANDRABINDU +0982 ; Bindu # Mc BENGALI SIGN ANUSVARA +0A01..0A02 ; Bindu # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A70 ; Bindu # Mn GURMUKHI TIPPI +0A81..0A82 ; Bindu # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0B01 ; Bindu # Mn ORIYA SIGN CANDRABINDU +0B02 ; Bindu # Mc ORIYA SIGN ANUSVARA +0B82 ; Bindu # Mn TAMIL SIGN ANUSVARA +0C01..0C02 ; Bindu # Mc [2] TELUGU SIGN CANDRABINDU..TELUGU SIGN ANUSVARA +0C82 ; Bindu # Mc KANNADA SIGN ANUSVARA +0D02 ; Bindu # Mc MALAYALAM SIGN ANUSVARA +0D82 ; Bindu # Mc SINHALA SIGN ANUSVARAYA +0E4D ; Bindu # Mn THAI CHARACTER NIKHAHIT +0ECD ; Bindu # Mn LAO NIGGAHITA +0F7E ; Bindu # Mn TIBETAN SIGN RJES SU NGA RO +0F82..0F83 ; Bindu # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +1036 ; Bindu # Mn MYANMAR SIGN ANUSVARA +17C6 ; Bindu # Mn KHMER SIGN NIKAHIT +1932 ; Bindu # Mn LIMBU SMALL LETTER ANUSVARA +1B00..1B02 ; Bindu # Mn [3] BALINESE SIGN ULU RICEM..BALINESE SIGN CECEK +A80B ; Bindu # Mn SYLOTI NAGRI SIGN ANUSVARA +A873 ; Bindu # Lo PHAGS-PA LETTER CANDRABINDU +A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK +1B80 ; Bindu # Mn SUNDANESE SIGN PANYECEK +1C34..1C35 ; Bindu # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A880 ; Bindu # Mc SAURASHTRA SIGN ANUSVARA +10A0E ; Bindu # Mn KHAROSHTHI SIGN ANUSVARA +11000 ; Bindu # Mc BRAHMI SIGN CANDRABINDU +11001 ; Bindu # Mn BRAHMI SIGN ANUSVARA +11080..11081 ; Bindu # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +11100..11101 ; Bindu # Mn CHAKMA SIGN CANDRABINDU..CHAKMA SIGN ANUSVARA +11180..11181 ; Bindu # Mn SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +116AB ; Bindu # Mn TAKRI SIGN ANUSVARA + +# ================================================ + +# Indic_Syllabic_Category=Visarga + +# Visarga (-h) +# Includes specialized case for 
Sanskrit: ardhavisarga +# Excludes letters for jihvamuliya and upadhmaniya, which are +# related, but structured somewhat differently. + +# [Not derivable] + +0903 ; Visarga # Mc DEVANAGARI SIGN VISARGA +0983 ; Visarga # Mc BENGALI SIGN VISARGA +0A03 ; Visarga # Mc GURMUKHI SIGN VISARGA +0A83 ; Visarga # Mc GUJARATI SIGN VISARGA +0B03 ; Visarga # Mc ORIYA SIGN VISARGA +0C03 ; Visarga # Mc TELUGU SIGN VISARGA +0C83 ; Visarga # Mc KANNADA SIGN VISARGA +0D03 ; Visarga # Mc MALAYALAM SIGN VISARGA +0D83 ; Visarga # Mc SINHALA SIGN VISARGAYA +0F7F ; Visarga # Mc TIBETAN SIGN RNAM BCAD +1038 ; Visarga # Mc MYANMAR SIGN VISARGA +17C7 ; Visarga # Mc KHMER SIGN REAHMUK +1B04 ; Visarga # Mc BALINESE SIGN BISAH +1B82 ; Visarga # Mc SUNDANESE SIGN PANGWISAD +1CF2 ; Visarga # Mc VEDIC SIGN ARDHAVISARGA +1CF3 ; Visarga # Mc VEDIC SIGN ROTATED ARDHAVISARGA +A881 ; Visarga # Mc SAURASHTRA SIGN VISARGA +A983 ; Visarga # Mc JAVANESE SIGN WIGNYAN +AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA +10A0F ; Visarga # Mn KHAROSHTHI SIGN VISARGA +11002 ; Visarga # Mc BRAHMI SIGN VISARGA +11082 ; Visarga # Mc KAITHI SIGN VISARGA +11102 ; Visarga # Mn CHAKMA SIGN VISARGA +11182 ; Visarga # Mn SHARADA SIGN VISARGA +116AC ; Visarga # Mc TAKRI SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Avagraha + +# Avagraha (elision of initial a- in sandhi) + +# [Not derivable] + +093D ; Avagraha # Lo DEVANAGARI SIGN AVAGRAHA +09BD ; Avagraha # Lo BENGALI SIGN AVAGRAHA +0ABD ; Avagraha # Lo GUJARATI SIGN AVAGRAHA +0B3D ; Avagraha # Lo ORIYA SIGN AVAGRAHA +0C3D ; Avagraha # Lo TELUGU SIGN AVAGRAHA +0CBD ; Avagraha # Lo KANNADA SIGN AVAGRAHA +0D3D ; Avagraha # Lo MALAYALAM SIGN AVAGRAHA +0F85 ; Avagraha # Po TIBETAN MARK PALUTA +17DC ; Avagraha # Lo KHMER SIGN AVAKRAHASANYA +1BBA ; Avagraha # Lo SUNDANESE AVAGRAHA +111C1 ; Avagraha # Lo SHARADA SIGN AVAGRAHA + +# ================================================ + +# Indic_Syllabic_Category=Nukta + +# Nukta 
(diacritic for borrowed consonants) + +# [Derivation: (ccc=7) - 1037] + +093C ; Nukta # Mn DEVANAGARI SIGN NUKTA +09BC ; Nukta # Mn BENGALI SIGN NUKTA +0A3C ; Nukta # Mn GURMUKHI SIGN NUKTA +0ABC ; Nukta # Mn GUJARATI SIGN NUKTA +0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0CBC ; Nukta # Mn KANNADA SIGN NUKTA +1B34 ; Nukta # Mn BALINESE SIGN REREKAN +1BE6 ; Nukta # Mn BATAK SIGN TOMPI +1C37 ; Nukta # Mn LEPCHA SIGN NUKTA +A9B3 ; Nukta # Mn JAVANESE SIGN CECAK TELU +110BA ; Nukta # Mn KAITHI SIGN NUKTA +116B7 ; Nukta # Mn TAKRI SIGN NUKTA + +# ================================================ + +# Indic_Syllabic_Category=Virama + +# Virama (killing of inherent vowel in consonant sequence, +# or consonant stacker, depending on model) +# Also includes pure killers. + +# [Derivation: (ccc=9) + 0E4E + 17D1] + +094D ; Virama # Mn DEVANAGARI SIGN VIRAMA +09CD ; Virama # Mn BENGALI SIGN VIRAMA +0A4D ; Virama # Mn GURMUKHI SIGN VIRAMA +0ACD ; Virama # Mn GUJARATI SIGN VIRAMA +0B4D ; Virama # Mn ORIYA SIGN VIRAMA +0BCD ; Virama # Mn TAMIL SIGN VIRAMA +0C4D ; Virama # Mn TELUGU SIGN VIRAMA +0CCD ; Virama # Mn KANNADA SIGN VIRAMA +0D4D ; Virama # Mn MALAYALAM SIGN VIRAMA +0DCA ; Virama # Mn SINHALA SIGN AL-LAKUNA +0E3A ; Virama # Mn THAI CHARACTER PHINTHU +0E4E ; Virama # Mn THAI CHARACTER YAMAKKAN +0F84 ; Virama # Mn TIBETAN MARK HALANTA +1039..103A ; Virama # Mn [2] MYANMAR SIGN VIRAMA..MYANMAR SIGN ASAT +1714 ; Virama # Mn TAGALOG SIGN VIRAMA +1734 ; Virama # Mn HANUNOO SIGN PAMUDPOD +17D1..17D2 ; Virama # Mn [2] KHMER SIGN VIRIAM..KHMER SIGN COENG +1A60 ; Virama # Mn TAI THAM SIGN SAKOT +1B44 ; Virama # Mc BALINESE ADEG ADEG +1BAA ; Virama # Mc SUNDANESE SIGN PAMAAEH +1BAB ; Virama # Mc SUNDANESE SIGN VIRAMA +1BF2..1BF3 ; Virama # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +A806 ; Virama # Mn SYLOTI NAGRI SIGN HASANTA +A8C4 ; Virama # Mn SAURASHTRA SIGN VIRAMA +A953 ; Virama # Mc REJANG VIRAMA +A9C0 ; Virama # Mc JAVANESE PANGKON +AAF6 ; Virama # Mn MEETEI MAYEK VIRAMA +ABED ; Virama 
# Mn MEETEI MAYEK APUN IYEK +10A3F ; Virama # Mn KHAROSHTHI VIRAMA +11046 ; Virama # Mn BRAHMI VIRAMA +110B9 ; Virama # Mn KAITHI SIGN VIRAMA +11133..11134 ; Virama # Mn CHAKMA VIRAMA..CHAKMA MAAYYAA +111C0 ; Virama # Mc SHARADA SIGN VIRAMA +116B6 ; Virama # Mn TAKRI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Independent + +# Independent Vowels (contrasted with matras) + +# [Not derivable] + +0904..0914 ; Vowel_Independent # Lo [17] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER AU +0960..0961 ; Vowel_Independent # Lo [2] DEVANAGARI LETTER VOCALIC RR..DEVANAGARI LETTER VOCALIC LL +0972..0977 ; Vowel_Independent # Lo [6] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER UUE +0985..098C ; Vowel_Independent # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L +098F..0990 ; Vowel_Independent # Lo [2] BENGALI LETTER E..BENGALI LETTER AI +0993..0994 ; Vowel_Independent # Lo [2] BENGALI LETTER O..BENGALI LETTER AU +09E0..09E1 ; Vowel_Independent # Lo [2] BENGALI LETTER VOCALIC RR..BENGALI LETTER VOCALIC LL +0A05..0A0A ; Vowel_Independent # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU +0A0F..0A10 ; Vowel_Independent # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI +0A13..0A14 ; Vowel_Independent # Lo [2] GURMUKHI LETTER OO..GURMUKHI LETTER AU +0A85..0A8D ; Vowel_Independent # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E +0A8F..0A91 ; Vowel_Independent # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O +0A93..0A94 ; Vowel_Independent # Lo [2] GUJARATI LETTER O..GUJARATI LETTER AU +0AE0..0AE1 ; Vowel_Independent # Lo [2] GUJARATI LETTER VOCALIC RR..GUJARATI LETTER VOCALIC LL +0B05..0B0C ; Vowel_Independent # Lo [8] ORIYA LETTER A..ORIYA LETTER VOCALIC L +0B0F..0B10 ; Vowel_Independent # Lo [2] ORIYA LETTER E..ORIYA LETTER AI +0B13..0B14 ; Vowel_Independent # Lo [2] ORIYA LETTER O..ORIYA LETTER AU +0B60..0B61 ; Vowel_Independent # Lo [2] ORIYA LETTER VOCALIC RR..ORIYA LETTER VOCALIC LL +0B85..0B8A ; Vowel_Independent # 
Lo [6] TAMIL LETTER A..TAMIL LETTER UU +0B8E..0B90 ; Vowel_Independent # Lo [3] TAMIL LETTER E..TAMIL LETTER AI +0B92..0B94 ; Vowel_Independent # Lo [3] TAMIL LETTER O..TAMIL LETTER AU +0C05..0C0C ; Vowel_Independent # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L +0C0E..0C10 ; Vowel_Independent # Lo [3] TELUGU LETTER E..TELUGU LETTER AI +0C12..0C14 ; Vowel_Independent # Lo [3] TELUGU LETTER O..TELUGU LETTER AU +0C60..0C61 ; Vowel_Independent # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL +0C85..0C8C ; Vowel_Independent # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L +0C8E..0C90 ; Vowel_Independent # Lo [3] KANNADA LETTER E..KANNADA LETTER AI +0C92..0C94 ; Vowel_Independent # Lo [3] KANNADA LETTER O..KANNADA LETTER AU +0CE0..0CE1 ; Vowel_Independent # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL +0D05..0D0C ; Vowel_Independent # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L +0D0E..0D10 ; Vowel_Independent # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI +0D12..0D14 ; Vowel_Independent # Lo [3] MALAYALAM LETTER O..MALAYALAM LETTER AU +0D60..0D61 ; Vowel_Independent # Lo [2] MALAYALAM LETTER VOCALIC RR..MALAYALAM LETTER VOCALIC LL +0D85..0D96 ; Vowel_Independent # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA +1021..102A ; Vowel_Independent # Lo [10] MYANMAR LETTER A..MYANMAR LETTER AU +1052..1055 ; Vowel_Independent # Lo [4] MYANMAR LETTER VOCALIC R..MYANMAR LETTER VOCALIC LL +1700..1702 ; Vowel_Independent # Lo [3] TAGALOG LETTER A..TAGALOG LETTER U +1720..1722 ; Vowel_Independent # Lo [3] HANUNOO LETTER A..HANUNOO LETTER U +1740..1742 ; Vowel_Independent # Lo [3] BUHID LETTER A..BUHID LETTER U +1760..1762 ; Vowel_Independent # Lo [3] TAGBANWA LETTER A..TAGBANWA LETTER U +17A3..17B3 ; Vowel_Independent # Lo [17] KHMER INDEPENDENT VOWEL QAQ..KHMER INDEPENDENT VOWEL QAU +1A4D..1A52 ; Vowel_Independent # Lo [6] TAI THAM LETTER I..TAI THAM LETTER OO +1B05..1B12 ; Vowel_Independent # Lo [14] BALINESE LETTER 
AKARA..BALINESE LETTER OKARA TEDUNG +1B83..1B89 ; Vowel_Independent # Lo [7] SUNDANESE LETTER A..SUNDANESE LETTER EU +1BE4..1BE5 ; Vowel_Independent # Lo [2] BATAK LETTER I..BATAK LETTER U +A800..A801 ; Vowel_Independent # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I +A803..A805 ; Vowel_Independent # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O +A882..A891 ; Vowel_Independent # Lo [16] SAURASHTRA LETTER A..SAURASHTRA LETTER AU +A984..A988 ; Vowel_Independent # Lo [5] JAVANESE LETTER A..JAVANESE LETTER U +A98C..A98E ; Vowel_Independent # Lo [3] JAVANESE LETTER E..JAVANESE LETTER O +AA00..AA05 ; Vowel_Independent # Lo [6] CHAM LETTER A..CHAM LETTER O +AAE0..AAE1 ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER E..MEETEI MAYEK LETTER O +ABCE..ABCF ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER UN..MEETEI MAYEK LETTER I +ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA +11005..11012 ; Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU +11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER A..KAITHI LETTER AU +11103..11106 ; Vowel_Independent # Lo [4] CHAKMA LETTER AA..CHAKMA LETTER E +11183..11190 ; Vowel_Independent # Lo [14] SHARADA LETTER A..SHARADA LETTER AU +11680..11689 ; Vowel_Independent # Lo [10] TAKRI LETTER A..TAKRI LETTER AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Dependent + +# Dependent Vowels (contrasted with independent vowels and/or with complex placement) +# Matras (in Indic scripts) + +# [Not derivable] + +093A ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN OE +093B ; Vowel_Dependent # Mc DEVANAGARI VOWEL SIGN OOE +093E..0940 ; Vowel_Dependent # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II +0941..0948 ; Vowel_Dependent # Mn [8] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN AI +0949..094C ; Vowel_Dependent # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094E..094F ; Vowel_Dependent # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA 
E..DEVANAGARI VOWEL SIGN AW +0955..0957 ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Vowel_Dependent # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BE..09C0 ; Vowel_Dependent # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II +09C1..09C4 ; Vowel_Dependent # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09C7..09C8 ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +09CB..09CC ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +09D7 ; Vowel_Dependent # Mc BENGALI AU LENGTH MARK +09E2..09E3 ; Vowel_Dependent # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3E..0A40 ; Vowel_Dependent # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II +0A41..0A42 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A47..0A48 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0ABE..0AC0 ; Vowel_Dependent # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL SIGN II +0AC1..0AC5 ; Vowel_Dependent # Mn [5] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AC9 ; Vowel_Dependent # Mc GUJARATI VOWEL SIGN CANDRA O +0ACB..0ACC ; Vowel_Dependent # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0AE2..0AE3 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3E ; Vowel_Dependent # Mc ORIYA VOWEL SIGN AA +0B3F ; Vowel_Dependent # Mn ORIYA VOWEL SIGN I +0B40 ; Vowel_Dependent # Mc ORIYA VOWEL SIGN II +0B41..0B44 ; Vowel_Dependent # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B47..0B48 ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI +0B4B..0B4C ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU +0B56 ; Vowel_Dependent # Mn ORIYA 
AI LENGTH MARK +0B57 ; Vowel_Dependent # Mc ORIYA AU LENGTH MARK +0B62..0B63 ; Vowel_Dependent # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BBE..0BBF ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC0 ; Vowel_Dependent # Mn TAMIL VOWEL SIGN II +0BC1..0BC2 ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BC6..0BC8 ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0BCA..0BCC ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0BD7 ; Vowel_Dependent # Mc TAMIL AU LENGTH MARK +0C3E..0C40 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C41..0C44 ; Vowel_Dependent # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C46..0C48 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI +0C4A..0C4C ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C55..0C56 ; Vowel_Dependent # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK +0C62..0C63 ; Vowel_Dependent # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBE ; Vowel_Dependent # Mc KANNADA VOWEL SIGN AA +0CBF ; Vowel_Dependent # Mn KANNADA VOWEL SIGN I +0CC0..0CC4 ; Vowel_Dependent # Mc [5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN VOCALIC RR +0CC6 ; Vowel_Dependent # Mn KANNADA VOWEL SIGN E +0CC7..0CC8 ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +0CCC ; Vowel_Dependent # Mn KANNADA VOWEL SIGN AU +0CD5..0CD6 ; Vowel_Dependent # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CE2..0CE3 ; Vowel_Dependent # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D3E..0D40 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D44 ; Vowel_Dependent # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D46..0D48 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI 
+0D4A..0D4C ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0D57 ; Vowel_Dependent # Mc MALAYALAM AU LENGTH MARK +0D62..0D63 ; Vowel_Dependent # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DCF..0DD1 ; Vowel_Dependent # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD2..0DD4 ; Vowel_Dependent # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Vowel_Dependent # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0DD8..0DDF ; Vowel_Dependent # Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Vowel_Dependent # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Vowel_Dependent # Lo THAI CHARACTER SARA A +0E31 ; Vowel_Dependent # Mn THAI CHARACTER MAI HAN-AKAT +0E32..0E33 ; Vowel_Dependent # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E34..0E39 ; Vowel_Dependent # Mn [6] THAI CHARACTER SARA I..THAI CHARACTER SARA UU +0E40..0E45 ; Vowel_Dependent # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO +0E47 ; Vowel_Dependent # Mn THAI CHARACTER MAITAIKHU +0EB0 ; Vowel_Dependent # Lo LAO VOWEL SIGN A +0EB1 ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KAN +0EB2..0EB3 ; Vowel_Dependent # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0EB4..0EB9 ; Vowel_Dependent # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU +0EBB ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KON +0EC0..0EC4 ; Vowel_Dependent # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +0F71..0F7D ; Vowel_Dependent # Mn [13] TIBETAN VOWEL SIGN AA..TIBETAN VOWEL SIGN OO +0F80..0F81 ; Vowel_Dependent # Mn [2] TIBETAN VOWEL SIGN REVERSED I..TIBETAN VOWEL SIGN REVERSED II +102B..102C ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +102D..1030 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN UU +1031 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN E +1032..1035 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL 
SIGN AI..MYANMAR VOWEL SIGN E ABOVE +1056..1057 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1058..1059 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1062 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1071..1074 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1083..1084 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E +1085..1086 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109C ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN AITON A +109D ; Vowel_Dependent # Mn MYANMAR VOWEL SIGN AITON AI +1712..1713 ; Vowel_Dependent # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U +1732..1733 ; Vowel_Dependent # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1752..1753 ; Vowel_Dependent # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U +1772..1773 ; Vowel_Dependent # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U +17B6 ; Vowel_Dependent # Mc KHMER VOWEL SIGN AA +17B7..17BD ; Vowel_Dependent # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL SIGN UA +17BE..17C5 ; Vowel_Dependent # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU +17C8 ; Vowel_Dependent # Mc KHMER SIGN YUUKALEAPINTU +1920..1922 ; Vowel_Dependent # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U +1923..1926 ; Vowel_Dependent # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU +1927..1928 ; Vowel_Dependent # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +19B0..19C0 ; Vowel_Dependent # Mc [17] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN IY +1A17..1A18 ; Vowel_Dependent # Mn [2] BUGINESE VOWEL SIGN I..BUGINESE VOWEL SIGN U +1A19..1A1B ; Vowel_Dependent # Mc [3] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN AE +1A61 ; Vowel_Dependent # Mc TAI THAM VOWEL SIGN A +1A62 ; Vowel_Dependent 
# Mn TAI THAM VOWEL SIGN MAI SAT +1A63..1A64 ; Vowel_Dependent # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A65..1A6C ; Vowel_Dependent # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW +1A6D..1A72 ; Vowel_Dependent # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI +1A73..1A74 ; Vowel_Dependent # Mn [2] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN MAI KANG +1B35 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN TEDUNG +1B36..1B3A ; Vowel_Dependent # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA +1B3B ; Vowel_Dependent # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +1B3C ; Vowel_Dependent # Mn BALINESE VOWEL SIGN LA LENGA +1B3D..1B41 ; Vowel_Dependent # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1B42 ; Vowel_Dependent # Mn BALINESE VOWEL SIGN PEPET +1B43 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN PEPET TEDUNG +1BA4..1BA5 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PANGHULU..SUNDANESE VOWEL SIGN PANYUKU +1BA6..1BA7 ; Vowel_Dependent # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL SIGN PANOLONG +1BA8..1BA9 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE7 ; Vowel_Dependent # Mc BATAK VOWEL SIGN E +1BE8..1BE9 ; Vowel_Dependent # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BEA..1BEC ; Vowel_Dependent # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BED ; Vowel_Dependent # Mn BATAK VOWEL SIGN KARO O +1BEE ; Vowel_Dependent # Mc BATAK VOWEL SIGN U +1BEF ; Vowel_Dependent # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +1C26..1C2B ; Vowel_Dependent # Mc [6] LEPCHA VOWEL SIGN AA..LEPCHA VOWEL SIGN UU +1C2C ; Vowel_Dependent # Mn LEPCHA VOWEL SIGN E +A823..A824 ; Vowel_Dependent # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A825..A826 ; Vowel_Dependent # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E +A827 ; Vowel_Dependent # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Vowel_Dependent # Mc [15] 
SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A947..A94E ; Vowel_Dependent # Mn [8] REJANG VOWEL SIGN I..REJANG VOWEL SIGN EA +A9B4..A9B5 ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9B6..A9B9 ; Vowel_Dependent # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BA..A9BB ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +A9BC ; Vowel_Dependent # Mn JAVANESE VOWEL SIGN PEPET +AA29..AA2E ; Vowel_Dependent # Mn [6] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN OE +AA2F..AA30 ; Vowel_Dependent # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA31..AA32 ; Vowel_Dependent # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE +AAB0 ; Vowel_Dependent # Mn TAI VIET MAI KANG +AAB1 ; Vowel_Dependent # Lo TAI VIET VOWEL AA +AAB2..AAB4 ; Vowel_Dependent # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U +AAB5..AAB6 ; Vowel_Dependent # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB7..AAB8 ; Vowel_Dependent # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AAB9..AABD ; Vowel_Dependent # Lo [5] TAI VIET VOWEL UEA..TAI VIET VOWEL AN +AABE ; Vowel_Dependent # Mn TAI VIET VOWEL AM +AAEB..AAEF ; Vowel_Dependent # Mc [5] MEETEI MAYEK VOWEL SIGN II..MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE5 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN ANAP +ABE6..ABE7 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE8 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +10A01..10A03 ; Vowel_Dependent # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R +10A05..10A06 ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O +10A0C ; Vowel_Dependent # Mn KHAROSHTHI VOWEL LENGTH MARK +11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU 
+110B0..110B2 ; Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II +110B3..110B6 ; Vowel_Dependent # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI +110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11127..11132 ; Vowel_Dependent # Mn [12] CHAKMA VOWEL SIGN A..CHAKMA AU MARK +111B3..111BF ; Vowel_Dependent # Mn [13] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN AU +116AD..116B5 ; Vowel_Dependent # Mn [9] TAKRI VOWEL SIGN AA..TAKRI VOWEL SIGN AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel + +# (Other) Vowels (reanalyzed as ordinary alphabetic letters or marks) + +# [Not derivable] + +1963..196D ; Vowel # Lo [11] TAI LE LETTER A..TAI LE LETTER AI +A85E..A861 ; Vowel # Lo [4] PHAGS-PA LETTER I..PHAGS-PA LETTER O +A866 ; Vowel # Lo [1] PHAGS-PA LETTER EE +A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO +A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Placeholder + +# Consonant Placeholder +# This includes generic placeholders used for +# Indic script layout (NBSP and dotted circle), as well as a few script- +# specific vowel-holder characters which are not technically +# consonants, but serve instead as bases for placement of vowel marks. 
+ +# [Not derivable] + +00A0 ; Consonant_Placeholder # Zs NO-BREAK SPACE +0A72..0A73 ; Consonant_Placeholder # Lo [2] GURMUKHI IRI..GURMUKHI URA +1900 ; Consonant_Placeholder # Lo LIMBU VOWEL-CARRIER LETTER +25CC ; Consonant_Placeholder # So DOTTED CIRCLE + +# ================================================ + +# Indic_Syllabic_Category=Consonant + +# Consonant (ordinary abugida consonants, with inherent vowels) + +# [Not derivable] + +0915..0939 ; Consonant # Lo [35] DEVANAGARI LETTER KA..DEVANAGARI LETTER HA +0958..095F ; Consonant # Lo [8] DEVANAGARI LETTER QA..DEVANAGARI LETTER YYA +0979..097F ; Consonant # Lo [7] DEVANAGARI LETTER ZHA..DEVANAGARI LETTER BBA +0995..09A8 ; Consonant # Lo [20] BENGALI LETTER KA..BENGALI LETTER NA +09AA..09B0 ; Consonant # Lo [7] BENGALI LETTER PA..BENGALI LETTER RA +09B2 ; Consonant # Lo BENGALI LETTER LA +09B6..09B9 ; Consonant # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA +09DC..09DD ; Consonant # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA +09DF ; Consonant # Lo BENGALI LETTER YYA +09F0..09F1 ; Consonant # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH LOWER DIAGONAL +0A15..0A28 ; Consonant # Lo [20] GURMUKHI LETTER KA..GURMUKHI LETTER NA +0A2A..0A30 ; Consonant # Lo [7] GURMUKHI LETTER PA..GURMUKHI LETTER RA +0A32..0A33 ; Consonant # Lo [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA +0A35..0A36 ; Consonant # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA +0A38..0A39 ; Consonant # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA +0A59..0A5C ; Consonant # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA +0A5E ; Consonant # Lo GURMUKHI LETTER FA +0A95..0AA8 ; Consonant # Lo [20] GUJARATI LETTER KA..GUJARATI LETTER NA +0AAA..0AB0 ; Consonant # Lo [7] GUJARATI LETTER PA..GUJARATI LETTER RA +0AB2..0AB3 ; Consonant # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA +0AB5..0AB9 ; Consonant # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA +0B15..0B28 ; Consonant # Lo [20] ORIYA LETTER KA..ORIYA LETTER NA +0B2A..0B30 ; 
Consonant # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA +0B32..0B33 ; Consonant # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA +0B35..0B39 ; Consonant # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA +0B5C..0B5D ; Consonant # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA +0B5F ; Consonant # Lo ORIYA LETTER YYA +0B71 ; Consonant # Lo ORIYA LETTER WA +0B95 ; Consonant # Lo TAMIL LETTER KA +0B99..0B9A ; Consonant # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA +0B9C ; Consonant # Lo TAMIL LETTER JA +0B9E..0B9F ; Consonant # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA +0BA3..0BA4 ; Consonant # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA +0BA8..0BAA ; Consonant # Lo [3] TAMIL LETTER NA..TAMIL LETTER PA +0BAE..0BB9 ; Consonant # Lo [12] TAMIL LETTER MA..TAMIL LETTER HA +0C15..0C28 ; Consonant # Lo [20] TELUGU LETTER KA..TELUGU LETTER NA +0C2A..0C33 ; Consonant # Lo [10] TELUGU LETTER PA..TELUGU LETTER LLA +0C35..0C39 ; Consonant # Lo [5] TELUGU LETTER VA..TELUGU LETTER HA +0C58..0C59 ; Consonant # Lo [2] TELUGU LETTER TSA..TELUGU LETTER DZA +0C95..0CA8 ; Consonant # Lo [20] KANNADA LETTER KA..KANNADA LETTER NA +0CAA..0CB3 ; Consonant # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA +0CB5..0CB9 ; Consonant # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA +0CDE ; Consonant # Lo KANNADA LETTER FA +0D15..0D3A ; Consonant # Lo [38] MALAYALAM LETTER KA..MALAYALAM LETTER TTTA +0D9A..0DB1 ; Consonant # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA +0DB3..0DBB ; Consonant # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA +0DBD ; Consonant # Lo SINHALA LETTER DANTAJA LAYANNA +0DC0..0DC6 ; Consonant # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA +0E01..0E2E ; Consonant # Lo [46] THAI CHARACTER KO KAI..THAI CHARACTER NOKHUK +0E81..0E82 ; Consonant # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG +0E84 ; Consonant # Lo LAO LETTER KHO TAM +0E87..0E88 ; Consonant # Lo [2] LAO LETTER NGO..LAO LETTER CO +0E8A ; Consonant # Lo LAO LETTER SO TAM +0E8D ; Consonant # Lo LAO 
LETTER NYO +0E94..0E97 ; Consonant # Lo [4] LAO LETTER DO..LAO LETTER THO TAM +0E99..0E9F ; Consonant # Lo [7] LAO LETTER NO..LAO LETTER FO SUNG +0EA1..0EA3 ; Consonant # Lo [3] LAO LETTER MO..LAO LETTER LO LING +0EA5 ; Consonant # Lo LAO LETTER LO LOOT +0EA7 ; Consonant # Lo LAO LETTER WO +0EAA..0EAB ; Consonant # Lo [2] LAO LETTER SO SUNG..LAO LETTER HO SUNG +0EAD..0EAE ; Consonant # Lo [2] LAO LETTER O..LAO LETTER HO TAM +0EDC..0EDD ; Consonant # Lo [2] LAO HO NO..LAO HO MO +0F40..0F47 ; Consonant # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA +0F49..0F6C ; Consonant # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA +1000..1020 ; Consonant # Lo [33] MYANMAR LETTER KA..MYANMAR LETTER LLA +103F ; Consonant # Lo MYANMAR LETTER GREAT SA +1050..1051 ; Consonant # Lo [2] MYANMAR LETTER SHA..MYANMAR LETTER SSA +105A..105D ; Consonant # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE +1061 ; Consonant # Lo MYANMAR LETTER SGAW KAREN SHA +1065..1066 ; Consonant # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER WESTERN PWO KAREN PWA +106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA +1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA +108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA +1703..170C ; Consonant # Lo [10] TAGALOG LETTER KA..TAGALOG LETTER YA +170E..1711 ; Consonant # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1723..1731 ; Consonant # Lo [15] HANUNOO LETTER KA..HANUNOO LETTER HA +1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA +1763..176C ; Consonant # Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA +176E..1770 ; Consonant # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA +1780..17A2 ; Consonant # Lo [35] KHMER LETTER KA..KHMER LETTER QA +1901..191C ; Consonant # Lo [28] LIMBU LETTER KA..LIMBU LETTER HA +1950..1962 ; Consonant # Lo [19] TAI LE LETTER KA..TAI LE LETTER NA +1980..19AB ; Consonant # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI 
LUE LETTER LOW SUA +1A00..1A16 ; Consonant # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA +1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA +1A53..1A54 ; Consonant # Lo [2] TAI THAM LETTER LAE..TAI THAM LETTER GREAT SA +1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA +1B45..1B4B ; Consonant # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA +1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA +1BBB..1BBD ; Consonant # Lo [3] SUNDANESE LETTER REU..SUNDANESE LETTER BHA +1BC0..1BE3 ; Consonant # Lo [36] BATAK LETTER A..BATAK LETTER MBA +1C00..1C23 ; Consonant # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A +1C4D..1C4F ; Consonant # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA +A807..A80A ; Consonant # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO +A80C..A822 ; Consonant # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO +A840..A85D ; Consonant # Lo [30] PHAGS-PA LETTER KA..PHAGS-PA LETTER A +A862..A865 ; Consonant # Lo [4] PHAGS-PA LETTER QA..PHAGS-PA LETTER GGA +A869..A870 ; Consonant # Lo [8] PHAGS-PA LETTER TTA..PHAGS-PA LETTER ASPIRATED FA +A872 ; Consonant # Lo PHAGS-PA SUPERFIXED LETTER RA +A892..A8B3 ; Consonant # Lo [34] SAURASHTRA LETTER KA..SAURASHTRA LETTER LLA +A90A..A921 ; Consonant # Lo [24] KAYAH LI LETTER KA..KAYAH LI LETTER CA +A930..A946 ; Consonant # Lo [23] REJANG LETTER KA..REJANG LETTER A +A989..A98B ; Consonant # Lo [3] JAVANESE LETTER PA CEREK..JAVANESE LETTER NGA LELET RASWADI +A98F..A9B2 ; Consonant # Lo [34] JAVANESE LETTER KA..JAVANESE LETTER HA +AA06..AA28 ; Consonant # Lo [35] CHAM LETTER KA..CHAM LETTER HA +AA60..AA6F ; Consonant # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA +AA71..AA73 ; Consonant # Lo [3] MYANMAR LETTER KHAMTI XA..MYAMNAR LETTER KHAMTI RA +AA7A ; Consonant # Lo MYANMAR LETTER AITON RA +AA80..AAAF ; Consonant # Lo [48] TAI VIET 
LETTER LOW KO..TAI VIET LETTER HIGH O +AAE2..AAEA ; Consonant # Lo [9] MEETEI MAYEK LETTER CHA..MEETEI MAYEK LETTER SSA +ABC0..ABCD ; Consonant # Lo [14] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER HUK +ABD0 ; Consonant # Lo MEETEI MAYEK LETTER PHAM +ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTER BHAM +10A00 ; Consonant # Lo KHAROSHTHI LETTER A +10A10..10A13 ; Consonant # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA +10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA +10A19..10A33 ; Consonant # Lo [27] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER TTTHA +11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER OLD TAMIL NNNA +1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA +11107..11126 ; Consonant # Lo [32] CHAKMA LETTER KAA..CHAKMA LETTER HAA +11191..111B2 ; Consonant # Lo [34] SHARADA LETTER KA..SHARADA LETTER HA +1168A..116AA ; Consonant # Lo [34] TAKRI LETTER KA..TAKRI LETTER RRA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Dead + +# Dead Consonant (special consonant with killed vowel) + +# [Not derivable] + +09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Repha + +# Repha Form of RA (reanalyzed in some scripts) + +# [Not derivable] + +0D4E ; Consonant_Repha # Lo MALAYALAM LETTER DOT REPH +17CC ; Consonant_Repha # Mn KHMER SIGN ROBAT +1B03 ; Consonant_Repha # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Repha # Mn SUNDANESE SIGN PANGLAYAR +A982 ; Consonant_Repha # Mn JAVANESE SIGN LAYAR + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Subjoined + +# Subjoined Consonant (C2 form subtending a base consonant in Tibetan, etc.) 
+ +# [Not derivable] + +0F8D..0F97 ; Consonant_Subjoined # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Consonant_Subjoined # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +1929..192B ; Consonant_Subjoined # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1BA1 ; Consonant_Subjoined # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA2..1BA3 ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BAC..1BAD ; Consonant_Subjoined # Mc [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C24..1C25 ; Consonant_Subjoined # Mc [2] LEPCHA SUBJOINED LETTER YA..LEPCHA SUBJOINED LETTER RA +A867..A868 ; Consonant_Subjoined # Lo [2] PHAGS-PA SUBJOINED LETTER WA..PHAGS-PA SUBJOINED LETTER YA +A871 ; Consonant_Subjoined # Lo PHAGS-PA SUBJOINED LETTER RA +A9BD ; Consonant_Subjoined # Mc JAVANESE CONSONANT SIGN KERET + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Medial + +# Medial Consonant (medial liquid, occurring in clusters) + +# [Not derivable] + +0A75 ; Consonant_Medial # Mn GURMUKHI SIGN YAKASH +0EBC ; Consonant_Medial # Mn LAO SEMIVOWEL SIGN LO +0EBD ; Consonant_Medial # Lo LAO SEMIVOWEL SIGN NYO +103B..103C ; Consonant_Medial # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA +103D..103E ; Consonant_Medial # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +105E..1060 ; Consonant_Medial # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Consonant_Medial # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +1A55 ; Consonant_Medial # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A56 ; Consonant_Medial # Mn TAI THAM CONSONANT SIGN MEDIAL LA +A9BE..A9BF ; Consonant_Medial # Mc JAVANESE CONSONANT SIGN PENGKAL..JAVANESE CONSONANT SIGN CAKRA +AA33..AA34 ; Consonant_Medial # Mc [2] CHAM CONSONANT SIGN YA..CHAM 
CONSONANT SIGN RA +AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Final + +# Final Consonant (special final forms which do not take vowels) + +# [Not derivable] + +1930..1931 ; Consonant_Final # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Consonant_Final # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B +1A57 ; Consonant_Final # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A58..1A5E ; Consonant_Final # Mn [7] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN SA +1BBE..1BBF ; Consonant_Final # Lo [2] SUNDANESE LETTER FINAL K..SUNDANESE LETTER FINAL M +1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H +1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +A8B4 ; Consonant_Final # Mc SAURASHTRA CONSONANT SIGN HAARU +A94F..A951 ; Consonant_Final # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A952 ; Consonant_Final # Mc REJANG CONSONANT SIGN H +AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG +AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG +AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS +AA4C ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL M +AA4D ; Consonant_Final # Mc CHAM CONSONANT SIGN FINAL H +ABDB..ABE2 ; Consonant_Final # Lo [8] MEETEI MAYEK LETTER KOK LONSUM..MEETEI MAYEK LETTER I LONSUM + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Head_Letter + +# Head Letter (Tibetan) + +# [Not derivable] + +0F88..0F8C ; Consonant_Head_Letter # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN + +# ================================================ + +# Indic_Syllabic_Category=Modifying_Letter + +# Reanalyzed 
letters not participating in the abugida structure, but +# serving to modify the sound of an adjacent vowel or consonant. +# Note that this is not the same as General_Category=Modifier_Letter. + +# [Not derivable] + +0B83 ; Modifying_Letter # Lo TAMIL SIGN VISARGA (aytham) + +# ================================================ + +# Indic_Syllabic_Category=Tone_Letter + +# Tone Letter (spacing lexical tone mark with status as a letter) + +# [Not derivable] + +1970..1974 ; Tone_Letter # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6 +AAC0 ; Tone_Letter # Lo TAI VIET TONE MAI NUENG +AAC2 ; Tone_Letter # Lo TAI VIET TONE MAI SONG + +# ================================================ + +# Indic_Syllabic_Category=Tone_Mark + +# Tone Mark (nonspacing or spacing lexical tone mark) +# Excludes Vedic tone marks, which are more akin to cantillation marks. + +# [Not derivable] + +0E48..0E4B ; Tone_Mark # Mn [4] THAI CHARACTER MAI EK..THAI CHARACTER MAI CHATTAWA +0EC8..0ECB ; Tone_Mark # Mn [4] LAO TONE MAI EK..LAO TONE MAI CATAWA +1037 ; Tone_Mark # Mn MYANMAR SIGN DOT BELOW +1063..1064 ; Tone_Mark # Mc [2] MYANMAR TONE MARK SGAW KAREN HATHI..MYANMAR TONE MARK SGAW KAREN KE PHO +1069..106D ; Tone_Mark # Mc [5] MYANMAR SIGN WESTERN PWO KAREN TONE-1..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1087..108C ; Tone_Mark # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108D ; Tone_Mark # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +108F ; Tone_Mark # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109B ; Tone_Mark # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 +19C8..19C9 ; Tone_Mark # Mc [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A75..1A79 ; Tone_Mark # Mn [5] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN TONE-5 +A92B..A92D ; Tone_Mark # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +AA7B ; Tone_Mark # Mc MYANMAR SIGN PAO KAREN TONE +AABF ; Tone_Mark # Mn TAI VIET TONE MAI EK +AAC1 ; Tone_Mark # Mn TAI VIET TONE MAI THO +ABEC ; 
Tone_Mark # Mc MEETEI MAYEK LUM IYEK + +# ================================================ + +# Indic_Syllabic_Category=Register_Shifter + +# Register Shifter (shifts register for consonants, akin to a tone mark) + +# [Not derivable] + +17C9..17CA ; Register_Shifter # Mn [2] KHMER SIGN MUUSIKATOAN..KHMER SIGN TRIISAP + +# EOF diff --git a/data/6.3.0-indic-positional-category.txt b/data/6.3.0-indic-positional-category.txt new file mode 100644 index 0000000..04cb932 --- /dev/null +++ b/data/6.3.0-indic-positional-category.txt @@ -0,0 +1,446 @@ +# IndicMatraCategory-6.3.0.txt +# Date: 2013-01-02, 08:33:00 GMT [KW, LI] +# +# Unicode Character Database +# Copyright (c) 1991-2013 Unicode, Inc. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# For documentation, see UAX #44, at http://www.unicode.org/reports/tr44/ +# +# This file defines the following provisional property: +# +# Indic_Matra_Category enumerated property +# +# NB: Provisional properties and data files have no associated stability +# guarantees. They are provided in part to determine the possible usefulness +# of a property or other data and to encourage analysis and further investigation +# which may result in their improvement. Provisional properties and +# data files may change arbitrarily, or may even be removed in a future version of the +# Unicode Character Database, if they prove not to be useful. +# +# Scope: This provisional property is aimed at the problem of +# the specification of syllabic structure for Indic scripts. +# Because dependent vowels (and visible viramas, where they occur) +# are placed in notional slots around the consonant (or consonant +# cluster) core of an Indic syllable, there may be cooccurrence +# constraints or other interactions. Also, it may be desirable, +# in cases where more than one dependent vowel may occur in +# sequence, as for example, in a top slot and a bottom slot, to +# specify preferred orders for spelling. 
As such, this property +# is designed primarily to supplement the Indic_Syllabic_Category +# property. +# +# Note that this provisional property is *not* intended as +# a prescriptive property regarding display or font design, +# for a number of reasons. Good font design requires information +# that is outside the context of a character encoding standard, +# and is best handled in other venues. For Indic dependent +# vowels, in particular: +# +# 1. Matra placement may vary somewhat based on typeface design. +# 2. Matra placement, even within a single script, may vary +# somewhat according to historic period or local conventions. +# 3. Matra placement may be changed by explicit orthographic reform +# decisions. +# 4. Matras may ligate in various ways with a consonant (or even +# other elements of a syllable) instead of occurring in a +# discrete location. +# 4. Matra display may be contextually determined. This is +# notable, for example, in the Tamil script, where the shape +# and placement of -u and -uu vowels depends strongly on +# which consonant they adjoin. +# +# Format: +# Field 0 Code Point or Code Point Range +# Field 1 Indic_Matra_Category +# +# A comment field shows General_Category property values and character names. +# +# The scripts assessed as containing dependent vowels or viramas in the +# structural sense used for the Indic_Matra_Category are: +# +# Devanagari, Bengali, Gurmukhi, Gujarati, Oriya, Tamil, Telugu, +# Kannada, Malayalam, Sinhala, Thai, Lao, Tibetan, Myanmar, +# Tagalog, Hanunoo, Buhid, Tagbanwa, Khmer, Limbu, New Tai Lue, +# Buginese, Tai Tham, Balinese, Sundanese, Batak, Lepcha, +# Syloti Nagri, Saurashtra, Rejang, Javanese, Cham, Tai Viet, +# Meetei Mayek, Kharoshthi, Brahmi, Kaithi, Chakma, Sharada, Takri +# +# All characters for all other scripts not in that list +# take the default value for this property. 
+# +# See IndicSyllabicCategory.txt for a slightly more extended +# list of Indic scripts, including those which do not have +# dependent vowel characters. Currently, those additional +# Indic scripts without dependent vowel characters are +# Tai Le, Phags-pa, and Kayah Li. +# + +# ================================================ + +# Property: Indic_Matra_Category +# +# All code points not explicitly listed for Indic_Matra_Category +# have the value NA (Not_Applicable). +# +# @missing: 0000..10FFFF; NA + +# Only Indic dependent vowels (Indic_Syllabic_Category=Vowel_Dependent) +# and viramas (Indic_Syllabic_Category=Virama) +# have a non-default value for this property. + +# ------------------------------------------------ + +# Indic_Matra_Category=Right + +093B ; Right # Mc DEVANAGARI VOWEL SIGN OOE +093E ; Right # Mc DEVANAGARI VOWEL SIGN AA +0940 ; Right # Mc DEVANAGARI VOWEL SIGN II +0949..094C ; Right # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094F ; Right # Mc DEVANAGARI VOWEL SIGN AW +09BE ; Right # Mc BENGALI VOWEL SIGN AA +09C0 ; Right # Mc BENGALI VOWEL SIGN II +09D7 ; Right # Mc BENGALI AU LENGTH MARK +0A3E ; Right # Mc GURMUKHI VOWEL SIGN AA +0A40 ; Right # Mc GURMUKHI VOWEL SIGN II +0ABE ; Right # Mc GUJARATI VOWEL SIGN AA +0AC0 ; Right # Mc GUJARATI VOWEL SIGN II +0ACB..0ACC ; Right # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0B3E ; Right # Mc ORIYA VOWEL SIGN AA +0B40 ; Right # Mc ORIYA VOWEL SIGN II +0BBE..0BBF ; Right # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BD7 ; Right # Mc TAMIL AU LENGTH MARK +0C41..0C44 ; Right # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0CBE ; Right # Mc KANNADA VOWEL SIGN AA +0CC1..0CC4 ; Right # Mc [4] KANNADA VOWEL SIGN U..KANNADA VOWEL SIGN VOCALIC RR +0CD5..0CD6 ; Right # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0D3E..0D40 ; Right # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D42 ; Right # Mn [2] MALAYALAM VOWEL SIGN U..MALAYALAM 
VOWEL SIGN UU +# Note: U and UU form complex ligatures with consonants in older Malayalam orthography +0D57 ; Right # Mc MALAYALAM AU LENGTH MARK +0DCF..0DD1 ; Right # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD8 ; Right # Mc SINHALA VOWEL SIGN GAETTA-PILLA +0DDF ; Right # Mc SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Right # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Right # Lo THAI CHARACTER SARA A +0E32..0E33 ; Right # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E45 ; Right # Lo THAI CHARACTER LAKKHANGYAO +0EB0 ; Right # Lo LAO VOWEL SIGN A +0EB2..0EB3 ; Right # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +102B..102C ; Right # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +1056..1057 ; Right # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1062 ; Right # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Right # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1083 ; Right # Mc MYANMAR VOWEL SIGN SHAN AA +109C ; Right # Mc MYANMAR VOWEL SIGN AITON A +17B6 ; Right # Mc KHMER VOWEL SIGN AA +17C8 ; Right # Mc KHMER SIGN YUUKALEAPINTU +1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI +19B0..19B4 ; Right # Mc [5] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN UU +19B8..19B9 ; Right # Mc [2] NEW TAI LUE VOWEL SIGN OA..NEW TAI LUE VOWEL SIGN UE +19BB..19C0 ; Right # Mc [6] NEW TAI LUE VOWEL SIGN AAY..NEW TAI LUE VOWEL SIGN IY +1A1A ; Right # Mc BUGINESE VOWEL SIGN O +1A61 ; Right # Mc TAI THAM VOWEL SIGN A +1A63..1A64 ; Right # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A6D ; Right # Mc TAI THAM VOWEL SIGN OY +1B35 ; Right # Mc BALINESE VOWEL SIGN TEDUNG +1B44 ; Right # Mc BALINESE ADEG ADEG +1BA7 ; Right # Mc SUNDANESE VOWEL SIGN PANOLONG +1BAA ; Right # Mc SUNDANESE SIGN PAMAAEH +1BF2..1BF3 ; Right # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +1C26 ; 
Right # Mc LEPCHA VOWEL SIGN AA +1C2A..1C2B ; Right # Mc [2] LEPCHA VOWEL SIGN U..LEPCHA VOWEL SIGN UU +A823..A824 ; Right # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A827 ; Right # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Right # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A953 ; Right # Mc REJANG VIRAMA +A9B4..A9B5 ; Right # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +AAB1 ; Right # Lo TAI VIET VOWEL AA +AABA ; Right # Lo TAI VIET VOWEL UA +AABD ; Right # Lo TAI VIET VOWEL AN +AAEF ; Right # Mc MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE6..ABE7 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE9..ABEA ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +110B0 ; Right # Mc KAITHI VOWEL SIGN AA +110B2 ; Right # Mc KAITHI VOWEL SIGN II +110B7..110B8 ; Right # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +111B3 ; Right # Mc SHARADA VOWEL SIGN AA +111B5 ; Right # Mc SHARADA VOWEL SIGN II +111C0 ; Right # Mc SHARADA SIGN VIRAMA +116AF ; Right # Mc TAKRI VOWEL SIGN II + +# Indic_Matra_Category=Left + +093F ; Left # Mc DEVANAGARI VOWEL SIGN I +094E ; Left # Mc DEVANAGARI VOWEL SIGN PRISHTHAMATRA E +09BF ; Left # Mc BENGALI VOWEL SIGN I +09C7..09C8 ; Left # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +0A3F ; Left # Mc GURMUKHI VOWEL SIGN I +0ABF ; Left # Mc GUJARATI VOWEL SIGN I +0B47 ; Left # Mc ORIYA VOWEL SIGN E +0BC6..0BC8 ; Left # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0D46..0D48 ; Left # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0DD9 ; Left # Mc SINHALA VOWEL SIGN KOMBUVA +0DDB ; Left # Mc SINHALA VOWEL SIGN KOMBU DEKA +1031 ; Left # Mc MYANMAR VOWEL SIGN E +1084 ; Left # Mc MYANMAR VOWEL SIGN SHAN E +17C1..17C3 ; Left # Mc [3] KHMER VOWEL SIGN E..KHMER VOWEL SIGN AI +19B5..19B7 ; Left # Mc [3] NEW TAI LUE VOWEL SIGN E..NEW TAI LUE VOWEL SIGN 
O +19BA ; Left # Mc NEW TAI LUE VOWEL SIGN AY +1A19 ; Left # Mc BUGINESE VOWEL SIGN E +1A1B ; Left # Mc BUGINESE VOWEL SIGN AE +1A6E..1A72 ; Left # Mc [5] TAI THAM VOWEL SIGN E..TAI THAM VOWEL SIGN THAM AI +1B3E..1B3F ; Left # Mc [2] BALINESE VOWEL SIGN TALING..BALINESE VOWEL SIGN TALING REPA +1BA6 ; Left # Mc SUNDANESE VOWEL SIGN PANAELAENG +1C27..1C28 ; Left # Mc [2] LEPCHA VOWEL SIGN I..LEPCHA VOWEL SIGN O +A9BA..A9BB ; Left # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +AA2F..AA30 ; Left # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AAEB ; Left # Mc MEETEI MAYEK VOWEL SIGN II +AAEE ; Left # Mc MEETEI MAYEK VOWEL SIGN AU +110B1 ; Left # Mc KAITHI VOWEL SIGN I +1112C ; Left # Mc CHAKMA VOWEL SIGN E +111B4 ; Left # Mc SHARADA VOWEL SIGN I +116AE ; Left # Mc TAKRI VOWEL SIGN I + +# Indic_Matra_Category=Visual_Order_Left + +# These are dependent vowels that occur to the left of the consonant +# letter in a syllable, but which occur in scripts using the visual order +# model, instead of the logical order model. Because of the different +# model, these left-side vowels occur first in the backing store (before +# the consonant letter) and are not reordered during text rendering. 
+# +# [Derivation: Logical_Order_Exception=Yes] + +0E40..0E44 ; Visual_Order_Left # Lo [5] THAI CHARACTER SARA E..THAI CHARACTER SARA AI MAIMALAI +0EC0..0EC4 ; Visual_Order_Left # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +AAB5..AAB6 ; Visual_Order_Left # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB9 ; Visual_Order_Left # Lo TAI VIET VOWEL UEA +AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL AY + +# Indic_Matra_Category=Left_And_Right + +09CB..09CC ; Left_And_Right # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +0B4B ; Left_And_Right # Mc ORIYA VOWEL SIGN O +0BCA..0BCC ; Left_And_Right # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0D4A..0D4C ; Left_And_Right # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0DDC..0DDE ; Left_And_Right # Mc [3] SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA..SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA +17C0 ; Left_And_Right # Mc KHMER VOWEL SIGN IE +17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU +1B40..1B41 ; Left_And_Right # Mc [2] BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG + +# Indic_Matra_Category=Top + +093A ; Top # Mn DEVANAGARI VOWEL SIGN OE +0945..0948 ; Top # Mn [4] DEVANAGARI VOWEL SIGN CANDRA E..DEVANAGARI VOWEL SIGN AI +0955 ; Top # Mn DEVANAGARI VOWEL SIGN CANDRA LONG E +0A47..0A48 ; Top # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Top # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0AC5 ; Top # Mn GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Top # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0B3F ; Top # Mn ORIYA VOWEL SIGN I +0B56 ; Top # Mn ORIYA AI LENGTH MARK +0BC0 ; Top # Mn TAMIL VOWEL SIGN II +0BCD ; Top # Mn TAMIL SIGN VIRAMA +0C3E..0C40 ; Top # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C46..0C47 ; Top # Mn [2] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN EE +0C4A..0C4C ; Top # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C4D ; Top # Mn TELUGU SIGN VIRAMA 
+0C55 ; Top # Mn TELUGU LENGTH MARK +0CBF ; Top # Mn KANNADA VOWEL SIGN I +0CC6 ; Top # Mn KANNADA VOWEL SIGN E +0CCC ; Top # Mn KANNADA VOWEL SIGN AU +0CCD ; Top # Mn KANNADA SIGN VIRAMA +0D4D ; Top # Mn MALAYALAM SIGN VIRAMA +0DCA ; Top # Mn SINHALA SIGN AL-LAKUNA +0DD2..0DD3 ; Top # Mn [2] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN DIGA IS-PILLA +0E31 ; Top # Mn THAI CHARACTER MAI HAN-AKAT +0E34..0E37 ; Top # Mn [4] THAI CHARACTER SARA I..THAI CHARACTER SARA UEE +0E47 ; Top # Mn THAI CHARACTER MAITAIKHU +0E4E ; Top # Mn THAI CHARACTER YAMAKKAN +0EB1 ; Top # Mn LAO VOWEL SIGN MAI KAN +0EB4..0EB7 ; Top # Mn [4] LAO VOWEL SIGN I..LAO VOWEL SIGN YY +0EBB ; Top # Mn LAO VOWEL SIGN MAI KON +0F72 ; Top # Mn TIBETAN VOWEL SIGN I +0F7A..0F7D ; Top # Mn [4] TIBETAN VOWEL SIGN E..TIBETAN VOWEL SIGN OO +0F80 ; Top # Mn TIBETAN VOWEL SIGN REVERSED I +102D..102E ; Top # Mn [2] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN II +1032..1035 ; Top # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +103A ; Top # Mn MYANMAR SIGN ASAT +1071..1074 ; Top # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1085..1086 ; Top # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109D ; Top # Mn MYANMAR VOWEL SIGN AITON AI +1712 ; Top # Mn TAGALOG VOWEL SIGN I +1732 ; Top # Mn HANUNOO VOWEL SIGN I +1752 ; Top # Mn BUHID VOWEL SIGN I +1772 ; Top # Mn TAGBANWA VOWEL SIGN I +17B7..17BA ; Top # Mn [4] KHMER VOWEL SIGN I..KHMER VOWEL SIGN YY +17D1 ; Top # Mn KHMER SIGN VIRIAM +1920..1921 ; Top # Mn [2] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN I +1927..1928 ; Top # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +1A17 ; Top # Mn BUGINESE VOWEL SIGN I +1A62 ; Top # Mn TAI THAM VOWEL SIGN MAI SAT +1A65..1A68 ; Top # Mn [4] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN UUE +1A6B ; Top # Mn TAI THAM VOWEL SIGN O +1A73..1A74 ; Top # Mn [2] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN MAI KANG +1B36..1B37 ; Top # Mn [2] BALINESE VOWEL SIGN ULU..BALINESE VOWEL 
SIGN ULU SARI +1B42 ; Top # Mn BALINESE VOWEL SIGN PEPET +1BA4 ; Top # Mn SUNDANESE VOWEL SIGN PANGHULU +1BA8..1BA9 ; Top # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +A806 ; Top # Mn SYLOTI NAGRI SIGN HASANTA +A826 ; Top # Mn SYLOTI NAGRI VOWEL SIGN E +A94A ; Top # Mn REJANG VOWEL SIGN AI +A9B6..A9B7 ; Top # Mn [2] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN WULU MELIK +A9BC ; Top # Mn JAVANESE VOWEL SIGN PEPET +AA29..AA2C ; Top # Mn [4] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN EI +AA2E ; Top # Mn CHAM VOWEL SIGN OE +AA31 ; Top # Mn CHAM VOWEL SIGN AU +AAB0 ; Top # Mn TAI VIET MAI KANG +AAB2..AAB3 ; Top # Mn [2] TAI VIET VOWEL I..TAI VIET VOWEL UE +AAB7..AAB8 ; Top # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AABE ; Top # Mn TAI VIET VOWEL AM +AAED ; Top # Mn MEETEI MAYEK VOWEL SIGN AAI +ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP +10A05 ; Top # Mn KHAROSHTHI VOWEL SIGN E +11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II +11042..11045 ; Top # Mn [4] BRAHMI VOWEL SIGN E..BRAHMI VOWEL SIGN AU +11046 ; Top # Mn BRAHMI VIRAMA +110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI VOWEL SIGN AI +11127..11129 ; Top # Mn [3] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN II +1112D ; Top # Mn CHAKMA VOWEL SIGN AI +11130 ; Top # Mn CHAKMA VOWEL SIGN OI +11134 ; Top # Mn CHAKMA MAAYYAA +111BC..111BE ; Top # Mn [3] SHARADA VOWEL SIGN E..SHARADA VOWEL SIGN O +116AD ; Top # Mn TAKRI VOWEL SIGN AA +116B2..116B5 ; Top # Mn [4] TAKRI VOWEL SIGN E..TAKRI VOWEL SIGN AU +116B6 ; Top # Mn TAKRI SIGN VIRAMA + +# Indic_Matra_Category=Bottom + +0941..0944 ; Bottom # Mn [4] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN VOCALIC RR +094D ; Bottom # Mn DEVANAGARI SIGN VIRAMA +0956..0957 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN UE..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09C1..09C4 ; Bottom # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09CD ; Bottom # 
Mn BENGALI SIGN VIRAMA +09E2..09E3 ; Bottom # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A41..0A42 ; Bottom # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A4D ; Bottom # Mn GURMUKHI SIGN VIRAMA +0AC1..0AC4 ; Bottom # Mn [4] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN VOCALIC RR +0ACD ; Bottom # Mn GUJARATI SIGN VIRAMA +0AE2..0AE3 ; Bottom # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B4D ; Bottom # Mn ORIYA SIGN VIRAMA +0B62..0B63 ; Bottom # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BC1..0BC2 ; Bottom # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +# Note: U and UU have contextually variable placement in Tamil. +0C56 ; Bottom # Mn TELUGU AI LENGTH MARK +0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CE2..0CE3 ; Bottom # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D43..0D44 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC R..MALAYALAM VOWEL SIGN VOCALIC RR +0D62..0D63 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DD4 ; Bottom # Mn SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Bottom # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0E38..0E39 ; Bottom # Mn [2] THAI CHARACTER SARA U..THAI CHARACTER SARA UU +0E3A ; Bottom # Mn THAI CHARACTER PHINTHU +0EB8..0EB9 ; Bottom # Mn [2] LAO VOWEL SIGN U..LAO VOWEL SIGN UU +0F71 ; Bottom # Mn TIBETAN VOWEL SIGN AA +0F74..0F75 ; Bottom # Mn [2] TIBETAN VOWEL SIGN U..TIBETAN VOWEL SIGN UU +0F84 ; Bottom # Mn TIBETAN MARK HALANTA +102F..1030 ; Bottom # Mn [2] MYANMAR VOWEL SIGN U..MYANMAR VOWEL SIGN UU +1058..1059 ; Bottom # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1713 ; Bottom # Mn TAGALOG VOWEL SIGN U +1714 ; Bottom # Mn TAGALOG SIGN VIRAMA +1733 ; Bottom # Mn HANUNOO VOWEL SIGN U +1734 ; Bottom # Mn HANUNOO SIGN PAMUDPOD +1753 ; Bottom # Mn BUHID 
VOWEL SIGN U +1773 ; Bottom # Mn TAGBANWA VOWEL SIGN U +17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA +1922 ; Bottom # Mn LIMBU VOWEL SIGN U +1A18 ; Bottom # Mn BUGINESE VOWEL SIGN U +1A69..1A6A ; Bottom # Mn [2] TAI THAM VOWEL SIGN U..TAI THAM VOWEL SIGN UU +1A6C ; Bottom # Mn TAI THAM VOWEL SIGN OA BELOW +1B38..1B3A ; Bottom # Mn [3] BALINESE VOWEL SIGN SUKU..BALINESE VOWEL SIGN RA REPA +1BA5 ; Bottom # Mn SUNDANESE VOWEL SIGN PANYUKU +1C2C ; Bottom # Mn LEPCHA VOWEL SIGN E +A825 ; Bottom # Mn SYLOTI NAGRI VOWEL SIGN U +A8C4 ; Bottom # Mn SAURASHTRA SIGN VIRAMA +A947..A949 ; Bottom # Mn [3] REJANG VOWEL SIGN I..REJANG VOWEL SIGN E +A94B..A94E ; Bottom # Mn [4] REJANG VOWEL SIGN O..REJANG VOWEL SIGN EA +A9B8..A9B9 ; Bottom # Mn [2] JAVANESE VOWEL SIGN SUKU..JAVANESE VOWEL SIGN SUKU MENDUT +AA2D ; Bottom # Mn CHAM VOWEL SIGN U +AA32 ; Bottom # Mn CHAM VOWEL SIGN UE +AAB4 ; Bottom # Mn TAI VIET VOWEL U +AAEC ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UU +ABE8 ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK +10A02..10A03 ; Bottom # Mn [2] KHAROSHTHI VOWEL SIGN U..KHAROSHTHI VOWEL SIGN VOCALIC R +10A0C ; Bottom # Mn KHAROSHTHI VOWEL LENGTH MARK +1103C..11041 ; Bottom # Mn [6] BRAHMI VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL +110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU +110B9 ; Bottom # Mn KAITHI SIGN VIRAMA +1112A..1112B ; Bottom # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU +11131..11132 ; Bottom # Mn [2] CHAKMA O MARK..CHAKMA AU MARK +111B6..111BB ; Bottom # Mn [6] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN VOCALIC LL +116B0..116B1 ; Bottom # Mn [2] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN UU + +# Indic_Matra_Category=Top_And_Bottom + +0C48 ; Top_And_Bottom # Mn TELUGU VOWEL SIGN AI +0F73 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN II +0F76..0F79 ; Top_And_Bottom # Mn [4] TIBETAN VOWEL SIGN VOCALIC R..TIBETAN VOWEL SIGN VOCALIC LL +0F81 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN REVERSED 
II +1B3C ; Top_And_Bottom # Mn BALINESE VOWEL SIGN LA LENGA +1112E..1112F ; Top_And_Bottom # Mn [2] CHAKMA VOWEL SIGN O..CHAKMA VOWEL SIGN AU + +# Indic_Matra_Category=Top_And_Right + +0AC9 ; Top_And_Right # Mc GUJARATI VOWEL SIGN CANDRA O +0B57 ; Top_And_Right # Mc ORIYA AU LENGTH MARK +0CC0 ; Top_And_Right # Mc KANNADA VOWEL SIGN II +0CC7..0CC8 ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +1925..1926 ; Top_And_Right # Mc [2] LIMBU VOWEL SIGN OO..LIMBU VOWEL SIGN AU +1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG +111BF ; Top_And_Right # Mc SHARADA VOWEL SIGN AU + +# Indic_Matra_Category=Top_And_Left + +0B48 ; Top_And_Left # Mc ORIYA VOWEL SIGN AI +0DDA ; Top_And_Left # Mc SINHALA VOWEL SIGN DIGA KOMBUVA +17BE ; Top_And_Left # Mc KHMER VOWEL SIGN OE +1C29 ; Top_And_Left # Mc LEPCHA VOWEL SIGN OO + +# Indic_Matra_Category=Top_And_Left_And_Right + +0B4C ; Top_And_Left_And_Right # Mc ORIYA VOWEL SIGN AU +17BF ; Top_And_Left_And_Right # Mc KHMER VOWEL SIGN YA + +# Indic_Matra_Category=Bottom_And_Right + +1B3B ; Bottom_And_Right # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +A9C0 ; Bottom_And_Right # Mc JAVANESE PANGKON + +# Indic_Matra_Category=Top_And_Bottom_And_Right + +1B3D ; Top_And_Bottom_And_Right # Mc BALINESE VOWEL SIGN LA LENGA TEDUNG + +# Indic_Matra_Category=Overstruck + +10A01 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN I +10A06 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN O + +# Indic_Matra_Category=Invisible + +# The Invisible category refers to viramas for certain script +# which are used only to control consonant stacking or cluster +# formation, and which have no visible display on their own. 
+ +1039 ; Invisible # Mn MYANMAR SIGN VIRAMA +17D2 ; Invisible # Mn KHMER SIGN COENG +1A60 ; Invisible # Mn TAI THAM SIGN SAKOT +AAF6 ; Invisible # Mn MEETEI MAYEK VIRAMA +10A3F ; Invisible # Mn KHAROSHTHI VIRAMA +11133 ; Invisible # Mn CHAKMA VIRAMA + +# EOF diff --git a/data/6.3.0-indic-syllabic-category.txt b/data/6.3.0-indic-syllabic-category.txt new file mode 100644 index 0000000..31f2e4b --- /dev/null +++ b/data/6.3.0-indic-syllabic-category.txt @@ -0,0 +1,796 @@ +# IndicSyllabicCategory-6.3.0.txt +# Date: 2013-08-01, 21:17:00 GMT [KW, LI] +# +# Unicode Character Database +# Copyright (c) 1991-2013 Unicode, Inc. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# For documentation, see UAX #44, at http://www.unicode.org/reports/tr44/ +# +# This file defines the following provisional property: +# +# Indic_Syllabic_Category enumerated property +# +# NB: Provisional properties and data files have no associated stability +# guarantees. They are provided in part to determine the possible usefulness +# of a property or other data and to encourage analysis and further investigation +# which may result in their improvement. Provisional properties and +# data files may change arbitrarily, or may even be removed in a future version of the +# Unicode Character Database, if they prove not to be useful. +# +# Scope: This provisional property is aimed at two general problem +# areas involving the analysis and processing of Indic scripts: +# +# 1. Specification of syllabic structure. +# 2. Specification of segmentation rules. +# +# Both of these problem areas may benefit from having defined subtypes +# of Indic script characters which are relevant to how Indic +# syllables (or aksaras) are constructed. Note that rules for +# syllabic structure in Indic scripts may differ significantly +# from how phonological syllables are defined. 
+# +# Format: +# Field 0 Code Point or Code Point Range +# Field 1 Indic_Syllabic_Category +# +# A comment field shows General_Category property values and character names. +# +# The scripts assessed as Indic in the +# structural sense used for the Indic_Syllabic_Category are: +# +# Devanagari, Bengali, Gurmukhi, Gujarati, Oriya, Tamil, Telugu, +# Kannada, Malayalam, Sinhala, Thai, Lao, Tibetan, Myanmar, +# Tagalog, Hanunoo, Buhid, Tagbanwa, Khmer, Limbu, Tai Le, New Tai Lue, +# Buginese, Tai Tham, Balinese, Sundanese, Batak, Lepcha, +# Syloti Nagri, Phags-Pa, Saurashtra, Kayah Li, Rejang, Javanese, Cham, Tai Viet, +# Meetei Mayek, Kharoshthi, Brahmi, Kaithi, Chakma, Sharada, Takri +# +# All characters for all other scripts not in that list +# take the default value for this property, unless they +# are individually listed in this data file. +# + +# ================================================ + +# Property: Indic_Syllabic_Category +# +# All code points not explicitly listed for Indic_Syllabic_Category +# have the value Other. +# +# @missing: 0000..10FFFF; Other + +# ================================================ + +# Indic_Syllabic_Category=Bindu + +# Bindu/Anusvara (nasalization or -n) +# Excludes various Vedic nasalization signs. 
+ +# [Not derivable] + +0900..0902 ; Bindu # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +0981 ; Bindu # Mn BENGALI SIGN CANDRABINDU +0982 ; Bindu # Mc BENGALI SIGN ANUSVARA +0A01..0A02 ; Bindu # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A70 ; Bindu # Mn GURMUKHI TIPPI +0A81..0A82 ; Bindu # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0B01 ; Bindu # Mn ORIYA SIGN CANDRABINDU +0B02 ; Bindu # Mc ORIYA SIGN ANUSVARA +0B82 ; Bindu # Mn TAMIL SIGN ANUSVARA +0C01..0C02 ; Bindu # Mc [2] TELUGU SIGN CANDRABINDU..TELUGU SIGN ANUSVARA +0C82 ; Bindu # Mc KANNADA SIGN ANUSVARA +0D02 ; Bindu # Mc MALAYALAM SIGN ANUSVARA +0D82 ; Bindu # Mc SINHALA SIGN ANUSVARAYA +0E4D ; Bindu # Mn THAI CHARACTER NIKHAHIT +0ECD ; Bindu # Mn LAO NIGGAHITA +0F7E ; Bindu # Mn TIBETAN SIGN RJES SU NGA RO +0F82..0F83 ; Bindu # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +1036 ; Bindu # Mn MYANMAR SIGN ANUSVARA +17C6 ; Bindu # Mn KHMER SIGN NIKAHIT +1932 ; Bindu # Mn LIMBU SMALL LETTER ANUSVARA +1B00..1B02 ; Bindu # Mn [3] BALINESE SIGN ULU RICEM..BALINESE SIGN CECEK +1B80 ; Bindu # Mn SUNDANESE SIGN PANYECEK +1C34..1C35 ; Bindu # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A80B ; Bindu # Mn SYLOTI NAGRI SIGN ANUSVARA +A873 ; Bindu # Lo PHAGS-PA LETTER CANDRABINDU +A880 ; Bindu # Mc SAURASHTRA SIGN ANUSVARA +A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK +10A0E ; Bindu # Mn KHAROSHTHI SIGN ANUSVARA +11000 ; Bindu # Mc BRAHMI SIGN CANDRABINDU +11001 ; Bindu # Mn BRAHMI SIGN ANUSVARA +11080..11081 ; Bindu # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +11100..11101 ; Bindu # Mn [2] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN ANUSVARA +11180..11181 ; Bindu # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +116AB ; Bindu # Mn TAKRI SIGN ANUSVARA + +# ================================================ + +# Indic_Syllabic_Category=Visarga + +# Visarga (-h) +# Includes specialized case for 
Sanskrit: ardhavisarga +# Excludes letters for jihvamuliya and upadhmaniya, which are +# related, but structured somewhat differently. + +# [Not derivable] + +0903 ; Visarga # Mc DEVANAGARI SIGN VISARGA +0983 ; Visarga # Mc BENGALI SIGN VISARGA +0A03 ; Visarga # Mc GURMUKHI SIGN VISARGA +0A83 ; Visarga # Mc GUJARATI SIGN VISARGA +0B03 ; Visarga # Mc ORIYA SIGN VISARGA +0C03 ; Visarga # Mc TELUGU SIGN VISARGA +0C83 ; Visarga # Mc KANNADA SIGN VISARGA +0D03 ; Visarga # Mc MALAYALAM SIGN VISARGA +0D83 ; Visarga # Mc SINHALA SIGN VISARGAYA +0F7F ; Visarga # Mc TIBETAN SIGN RNAM BCAD +1038 ; Visarga # Mc MYANMAR SIGN VISARGA +17C7 ; Visarga # Mc KHMER SIGN REAHMUK +1B04 ; Visarga # Mc BALINESE SIGN BISAH +1B82 ; Visarga # Mc SUNDANESE SIGN PANGWISAD +1CF2 ; Visarga # Mc VEDIC SIGN ARDHAVISARGA +1CF3 ; Visarga # Mc VEDIC SIGN ROTATED ARDHAVISARGA +A881 ; Visarga # Mc SAURASHTRA SIGN VISARGA +A983 ; Visarga # Mc JAVANESE SIGN WIGNYAN +AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA +10A0F ; Visarga # Mn KHAROSHTHI SIGN VISARGA +11002 ; Visarga # Mc BRAHMI SIGN VISARGA +11082 ; Visarga # Mc KAITHI SIGN VISARGA +11102 ; Visarga # Mn CHAKMA SIGN VISARGA +11182 ; Visarga # Mn SHARADA SIGN VISARGA +116AC ; Visarga # Mc TAKRI SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Avagraha + +# Avagraha (elision of initial a- in sandhi) + +# [Not derivable] + +093D ; Avagraha # Lo DEVANAGARI SIGN AVAGRAHA +09BD ; Avagraha # Lo BENGALI SIGN AVAGRAHA +0ABD ; Avagraha # Lo GUJARATI SIGN AVAGRAHA +0B3D ; Avagraha # Lo ORIYA SIGN AVAGRAHA +0C3D ; Avagraha # Lo TELUGU SIGN AVAGRAHA +0CBD ; Avagraha # Lo KANNADA SIGN AVAGRAHA +0D3D ; Avagraha # Lo MALAYALAM SIGN AVAGRAHA +0F85 ; Avagraha # Po TIBETAN MARK PALUTA +17DC ; Avagraha # Lo KHMER SIGN AVAKRAHASANYA +1BBA ; Avagraha # Lo SUNDANESE AVAGRAHA +111C1 ; Avagraha # Lo SHARADA SIGN AVAGRAHA + +# ================================================ + +# Indic_Syllabic_Category=Nukta + +# Nukta 
(diacritic for borrowed consonants) + +# [Derivation: (ccc=7) - 1037] + +093C ; Nukta # Mn DEVANAGARI SIGN NUKTA +09BC ; Nukta # Mn BENGALI SIGN NUKTA +0A3C ; Nukta # Mn GURMUKHI SIGN NUKTA +0ABC ; Nukta # Mn GUJARATI SIGN NUKTA +0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0CBC ; Nukta # Mn KANNADA SIGN NUKTA +1B34 ; Nukta # Mn BALINESE SIGN REREKAN +1BE6 ; Nukta # Mn BATAK SIGN TOMPI +1C37 ; Nukta # Mn LEPCHA SIGN NUKTA +A9B3 ; Nukta # Mn JAVANESE SIGN CECAK TELU +110BA ; Nukta # Mn KAITHI SIGN NUKTA +116B7 ; Nukta # Mn TAKRI SIGN NUKTA + +# ================================================ + +# Indic_Syllabic_Category=Virama + +# Virama (killing of inherent vowel in consonant sequence, +# or consonant stacker, depending on model) +# Also includes pure killers. + +# [Derivation: (ccc=9) + 0E4E + 17D1] + +094D ; Virama # Mn DEVANAGARI SIGN VIRAMA +09CD ; Virama # Mn BENGALI SIGN VIRAMA +0A4D ; Virama # Mn GURMUKHI SIGN VIRAMA +0ACD ; Virama # Mn GUJARATI SIGN VIRAMA +0B4D ; Virama # Mn ORIYA SIGN VIRAMA +0BCD ; Virama # Mn TAMIL SIGN VIRAMA +0C4D ; Virama # Mn TELUGU SIGN VIRAMA +0CCD ; Virama # Mn KANNADA SIGN VIRAMA +0D4D ; Virama # Mn MALAYALAM SIGN VIRAMA +0DCA ; Virama # Mn SINHALA SIGN AL-LAKUNA +0E3A ; Virama # Mn THAI CHARACTER PHINTHU +0E4E ; Virama # Mn THAI CHARACTER YAMAKKAN +0F84 ; Virama # Mn TIBETAN MARK HALANTA +1039..103A ; Virama # Mn [2] MYANMAR SIGN VIRAMA..MYANMAR SIGN ASAT +1714 ; Virama # Mn TAGALOG SIGN VIRAMA +1734 ; Virama # Mn HANUNOO SIGN PAMUDPOD +17D1..17D2 ; Virama # Mn [2] KHMER SIGN VIRIAM..KHMER SIGN COENG +1A60 ; Virama # Mn TAI THAM SIGN SAKOT +1B44 ; Virama # Mc BALINESE ADEG ADEG +1BAA ; Virama # Mc SUNDANESE SIGN PAMAAEH +1BAB ; Virama # Mc SUNDANESE SIGN VIRAMA +1BF2..1BF3 ; Virama # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +A806 ; Virama # Mn SYLOTI NAGRI SIGN HASANTA +A8C4 ; Virama # Mn SAURASHTRA SIGN VIRAMA +A953 ; Virama # Mc REJANG VIRAMA +A9C0 ; Virama # Mc JAVANESE PANGKON +AAF6 ; Virama # Mn MEETEI MAYEK VIRAMA +ABED ; Virama 
# Mn MEETEI MAYEK APUN IYEK +10A3F ; Virama # Mn KHAROSHTHI VIRAMA +11046 ; Virama # Mn BRAHMI VIRAMA +110B9 ; Virama # Mn KAITHI SIGN VIRAMA +11133..11134 ; Virama # Mn [2] CHAKMA VIRAMA..CHAKMA MAAYYAA +111C0 ; Virama # Mc SHARADA SIGN VIRAMA +116B6 ; Virama # Mn TAKRI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Independent + +# Independent Vowels (contrasted with matras) + +# [Not derivable] + +0904..0914 ; Vowel_Independent # Lo [17] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER AU +0960..0961 ; Vowel_Independent # Lo [2] DEVANAGARI LETTER VOCALIC RR..DEVANAGARI LETTER VOCALIC LL +0972..0977 ; Vowel_Independent # Lo [6] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER UUE +0985..098C ; Vowel_Independent # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L +098F..0990 ; Vowel_Independent # Lo [2] BENGALI LETTER E..BENGALI LETTER AI +0993..0994 ; Vowel_Independent # Lo [2] BENGALI LETTER O..BENGALI LETTER AU +09E0..09E1 ; Vowel_Independent # Lo [2] BENGALI LETTER VOCALIC RR..BENGALI LETTER VOCALIC LL +0A05..0A0A ; Vowel_Independent # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU +0A0F..0A10 ; Vowel_Independent # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI +0A13..0A14 ; Vowel_Independent # Lo [2] GURMUKHI LETTER OO..GURMUKHI LETTER AU +0A85..0A8D ; Vowel_Independent # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E +0A8F..0A91 ; Vowel_Independent # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O +0A93..0A94 ; Vowel_Independent # Lo [2] GUJARATI LETTER O..GUJARATI LETTER AU +0AE0..0AE1 ; Vowel_Independent # Lo [2] GUJARATI LETTER VOCALIC RR..GUJARATI LETTER VOCALIC LL +0B05..0B0C ; Vowel_Independent # Lo [8] ORIYA LETTER A..ORIYA LETTER VOCALIC L +0B0F..0B10 ; Vowel_Independent # Lo [2] ORIYA LETTER E..ORIYA LETTER AI +0B13..0B14 ; Vowel_Independent # Lo [2] ORIYA LETTER O..ORIYA LETTER AU +0B60..0B61 ; Vowel_Independent # Lo [2] ORIYA LETTER VOCALIC RR..ORIYA LETTER VOCALIC LL +0B85..0B8A ; Vowel_Independent 
# Lo [6] TAMIL LETTER A..TAMIL LETTER UU +0B8E..0B90 ; Vowel_Independent # Lo [3] TAMIL LETTER E..TAMIL LETTER AI +0B92..0B94 ; Vowel_Independent # Lo [3] TAMIL LETTER O..TAMIL LETTER AU +0C05..0C0C ; Vowel_Independent # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L +0C0E..0C10 ; Vowel_Independent # Lo [3] TELUGU LETTER E..TELUGU LETTER AI +0C12..0C14 ; Vowel_Independent # Lo [3] TELUGU LETTER O..TELUGU LETTER AU +0C60..0C61 ; Vowel_Independent # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL +0C85..0C8C ; Vowel_Independent # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L +0C8E..0C90 ; Vowel_Independent # Lo [3] KANNADA LETTER E..KANNADA LETTER AI +0C92..0C94 ; Vowel_Independent # Lo [3] KANNADA LETTER O..KANNADA LETTER AU +0CE0..0CE1 ; Vowel_Independent # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL +0D05..0D0C ; Vowel_Independent # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L +0D0E..0D10 ; Vowel_Independent # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI +0D12..0D14 ; Vowel_Independent # Lo [3] MALAYALAM LETTER O..MALAYALAM LETTER AU +0D60..0D61 ; Vowel_Independent # Lo [2] MALAYALAM LETTER VOCALIC RR..MALAYALAM LETTER VOCALIC LL +0D85..0D96 ; Vowel_Independent # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA +1021..102A ; Vowel_Independent # Lo [10] MYANMAR LETTER A..MYANMAR LETTER AU +1052..1055 ; Vowel_Independent # Lo [4] MYANMAR LETTER VOCALIC R..MYANMAR LETTER VOCALIC LL +1700..1702 ; Vowel_Independent # Lo [3] TAGALOG LETTER A..TAGALOG LETTER U +1720..1722 ; Vowel_Independent # Lo [3] HANUNOO LETTER A..HANUNOO LETTER U +1740..1742 ; Vowel_Independent # Lo [3] BUHID LETTER A..BUHID LETTER U +1760..1762 ; Vowel_Independent # Lo [3] TAGBANWA LETTER A..TAGBANWA LETTER U +17A3..17B3 ; Vowel_Independent # Lo [17] KHMER INDEPENDENT VOWEL QAQ..KHMER INDEPENDENT VOWEL QAU +1A4D..1A52 ; Vowel_Independent # Lo [6] TAI THAM LETTER I..TAI THAM LETTER OO +1B05..1B12 ; Vowel_Independent # Lo [14] BALINESE LETTER 
AKARA..BALINESE LETTER OKARA TEDUNG +1B83..1B89 ; Vowel_Independent # Lo [7] SUNDANESE LETTER A..SUNDANESE LETTER EU +1BE4..1BE5 ; Vowel_Independent # Lo [2] BATAK LETTER I..BATAK LETTER U +A800..A801 ; Vowel_Independent # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I +A803..A805 ; Vowel_Independent # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O +A882..A891 ; Vowel_Independent # Lo [16] SAURASHTRA LETTER A..SAURASHTRA LETTER AU +A984..A988 ; Vowel_Independent # Lo [5] JAVANESE LETTER A..JAVANESE LETTER U +A98C..A98E ; Vowel_Independent # Lo [3] JAVANESE LETTER E..JAVANESE LETTER O +AA00..AA05 ; Vowel_Independent # Lo [6] CHAM LETTER A..CHAM LETTER O +AAE0..AAE1 ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER E..MEETEI MAYEK LETTER O +ABCE..ABCF ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER UN..MEETEI MAYEK LETTER I +ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA +11005..11012 ; Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU +11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER A..KAITHI LETTER AU +11103..11106 ; Vowel_Independent # Lo [4] CHAKMA LETTER AA..CHAKMA LETTER E +11183..11190 ; Vowel_Independent # Lo [14] SHARADA LETTER A..SHARADA LETTER AU +11680..11689 ; Vowel_Independent # Lo [10] TAKRI LETTER A..TAKRI LETTER AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Dependent + +# Dependent Vowels (contrasted with independent vowels and/or with complex placement) +# Matras (in Indic scripts) + +# [Not derivable] + +093A ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN OE +093B ; Vowel_Dependent # Mc DEVANAGARI VOWEL SIGN OOE +093E..0940 ; Vowel_Dependent # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II +0941..0948 ; Vowel_Dependent # Mn [8] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN AI +0949..094C ; Vowel_Dependent # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094E..094F ; Vowel_Dependent # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA 
E..DEVANAGARI VOWEL SIGN AW +0955..0957 ; Vowel_Dependent # Mn [3] DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Vowel_Dependent # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BE..09C0 ; Vowel_Dependent # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II +09C1..09C4 ; Vowel_Dependent # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09C7..09C8 ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +09CB..09CC ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +09D7 ; Vowel_Dependent # Mc BENGALI AU LENGTH MARK +09E2..09E3 ; Vowel_Dependent # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3E..0A40 ; Vowel_Dependent # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II +0A41..0A42 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A47..0A48 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0ABE..0AC0 ; Vowel_Dependent # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL SIGN II +0AC1..0AC5 ; Vowel_Dependent # Mn [5] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AC9 ; Vowel_Dependent # Mc GUJARATI VOWEL SIGN CANDRA O +0ACB..0ACC ; Vowel_Dependent # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0AE2..0AE3 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3E ; Vowel_Dependent # Mc ORIYA VOWEL SIGN AA +0B3F ; Vowel_Dependent # Mn ORIYA VOWEL SIGN I +0B40 ; Vowel_Dependent # Mc ORIYA VOWEL SIGN II +0B41..0B44 ; Vowel_Dependent # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B47..0B48 ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI +0B4B..0B4C ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU +0B56 ; Vowel_Dependent # Mn 
ORIYA AI LENGTH MARK +0B57 ; Vowel_Dependent # Mc ORIYA AU LENGTH MARK +0B62..0B63 ; Vowel_Dependent # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BBE..0BBF ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC0 ; Vowel_Dependent # Mn TAMIL VOWEL SIGN II +0BC1..0BC2 ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BC6..0BC8 ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0BCA..0BCC ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0BD7 ; Vowel_Dependent # Mc TAMIL AU LENGTH MARK +0C3E..0C40 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C41..0C44 ; Vowel_Dependent # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C46..0C48 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI +0C4A..0C4C ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C55..0C56 ; Vowel_Dependent # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK +0C62..0C63 ; Vowel_Dependent # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBE ; Vowel_Dependent # Mc KANNADA VOWEL SIGN AA +0CBF ; Vowel_Dependent # Mn KANNADA VOWEL SIGN I +0CC0..0CC4 ; Vowel_Dependent # Mc [5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN VOCALIC RR +0CC6 ; Vowel_Dependent # Mn KANNADA VOWEL SIGN E +0CC7..0CC8 ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +0CCC ; Vowel_Dependent # Mn KANNADA VOWEL SIGN AU +0CD5..0CD6 ; Vowel_Dependent # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CE2..0CE3 ; Vowel_Dependent # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D3E..0D40 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D44 ; Vowel_Dependent # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D46..0D48 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL 
SIGN AI +0D4A..0D4C ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0D57 ; Vowel_Dependent # Mc MALAYALAM AU LENGTH MARK +0D62..0D63 ; Vowel_Dependent # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DCF..0DD1 ; Vowel_Dependent # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD2..0DD4 ; Vowel_Dependent # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Vowel_Dependent # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0DD8..0DDF ; Vowel_Dependent # Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Vowel_Dependent # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Vowel_Dependent # Lo THAI CHARACTER SARA A +0E31 ; Vowel_Dependent # Mn THAI CHARACTER MAI HAN-AKAT +0E32..0E33 ; Vowel_Dependent # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E34..0E39 ; Vowel_Dependent # Mn [6] THAI CHARACTER SARA I..THAI CHARACTER SARA UU +0E40..0E45 ; Vowel_Dependent # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO +0E47 ; Vowel_Dependent # Mn THAI CHARACTER MAITAIKHU +0EB0 ; Vowel_Dependent # Lo LAO VOWEL SIGN A +0EB1 ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KAN +0EB2..0EB3 ; Vowel_Dependent # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0EB4..0EB9 ; Vowel_Dependent # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU +0EBB ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KON +0EC0..0EC4 ; Vowel_Dependent # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +0F71..0F7D ; Vowel_Dependent # Mn [13] TIBETAN VOWEL SIGN AA..TIBETAN VOWEL SIGN OO +0F80..0F81 ; Vowel_Dependent # Mn [2] TIBETAN VOWEL SIGN REVERSED I..TIBETAN VOWEL SIGN REVERSED II +102B..102C ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +102D..1030 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN UU +1031 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN E +1032..1035 ; Vowel_Dependent # Mn [4] MYANMAR 
VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +1056..1057 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1058..1059 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1062 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1071..1074 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1083..1084 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E +1085..1086 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109C ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN AITON A +109D ; Vowel_Dependent # Mn MYANMAR VOWEL SIGN AITON AI +1712..1713 ; Vowel_Dependent # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U +1732..1733 ; Vowel_Dependent # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1752..1753 ; Vowel_Dependent # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U +1772..1773 ; Vowel_Dependent # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U +17B6 ; Vowel_Dependent # Mc KHMER VOWEL SIGN AA +17B7..17BD ; Vowel_Dependent # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL SIGN UA +17BE..17C5 ; Vowel_Dependent # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU +17C8 ; Vowel_Dependent # Mc KHMER SIGN YUUKALEAPINTU +1920..1922 ; Vowel_Dependent # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U +1923..1926 ; Vowel_Dependent # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU +1927..1928 ; Vowel_Dependent # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +19B0..19C0 ; Vowel_Dependent # Mc [17] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN IY +1A17..1A18 ; Vowel_Dependent # Mn [2] BUGINESE VOWEL SIGN I..BUGINESE VOWEL SIGN U +1A19..1A1B ; Vowel_Dependent # Mc [3] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN AE +1A61 ; Vowel_Dependent # Mc TAI THAM VOWEL SIGN A +1A62 ; 
Vowel_Dependent # Mn TAI THAM VOWEL SIGN MAI SAT +1A63..1A64 ; Vowel_Dependent # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A65..1A6C ; Vowel_Dependent # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW +1A6D..1A72 ; Vowel_Dependent # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI +1A73..1A74 ; Vowel_Dependent # Mn [2] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN MAI KANG +1B35 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN TEDUNG +1B36..1B3A ; Vowel_Dependent # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA +1B3B ; Vowel_Dependent # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +1B3C ; Vowel_Dependent # Mn BALINESE VOWEL SIGN LA LENGA +1B3D..1B41 ; Vowel_Dependent # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1B42 ; Vowel_Dependent # Mn BALINESE VOWEL SIGN PEPET +1B43 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN PEPET TEDUNG +1BA4..1BA5 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PANGHULU..SUNDANESE VOWEL SIGN PANYUKU +1BA6..1BA7 ; Vowel_Dependent # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL SIGN PANOLONG +1BA8..1BA9 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE7 ; Vowel_Dependent # Mc BATAK VOWEL SIGN E +1BE8..1BE9 ; Vowel_Dependent # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BEA..1BEC ; Vowel_Dependent # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BED ; Vowel_Dependent # Mn BATAK VOWEL SIGN KARO O +1BEE ; Vowel_Dependent # Mc BATAK VOWEL SIGN U +1BEF ; Vowel_Dependent # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +1C26..1C2B ; Vowel_Dependent # Mc [6] LEPCHA VOWEL SIGN AA..LEPCHA VOWEL SIGN UU +1C2C ; Vowel_Dependent # Mn LEPCHA VOWEL SIGN E +A823..A824 ; Vowel_Dependent # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A825..A826 ; Vowel_Dependent # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E +A827 ; Vowel_Dependent # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Vowel_Dependent # 
Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A947..A94E ; Vowel_Dependent # Mn [8] REJANG VOWEL SIGN I..REJANG VOWEL SIGN EA +A9B4..A9B5 ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9B6..A9B9 ; Vowel_Dependent # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BA..A9BB ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +A9BC ; Vowel_Dependent # Mn JAVANESE VOWEL SIGN PEPET +AA29..AA2E ; Vowel_Dependent # Mn [6] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN OE +AA2F..AA30 ; Vowel_Dependent # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA31..AA32 ; Vowel_Dependent # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE +AAB0 ; Vowel_Dependent # Mn TAI VIET MAI KANG +AAB1 ; Vowel_Dependent # Lo TAI VIET VOWEL AA +AAB2..AAB4 ; Vowel_Dependent # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U +AAB5..AAB6 ; Vowel_Dependent # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB7..AAB8 ; Vowel_Dependent # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AAB9..AABD ; Vowel_Dependent # Lo [5] TAI VIET VOWEL UEA..TAI VIET VOWEL AN +AABE ; Vowel_Dependent # Mn TAI VIET VOWEL AM +AAEB..AAEF ; Vowel_Dependent # Mc [5] MEETEI MAYEK VOWEL SIGN II..MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE5 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN ANAP +ABE6..ABE7 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE8 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +10A01..10A03 ; Vowel_Dependent # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R +10A05..10A06 ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O +10A0C ; Vowel_Dependent # Mn KHAROSHTHI VOWEL LENGTH MARK +11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN 
AU +110B0..110B2 ; Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II +110B3..110B6 ; Vowel_Dependent # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI +110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11127..11132 ; Vowel_Dependent # Mn [12] CHAKMA VOWEL SIGN A..CHAKMA AU MARK +111B3..111BF ; Vowel_Dependent # Mn [13] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN AU +116AD..116B5 ; Vowel_Dependent # Mn [9] TAKRI VOWEL SIGN AA..TAKRI VOWEL SIGN AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel + +# (Other) Vowels (reanalyzed as ordinary alphabetic letters or marks) + +# [Not derivable] + +1963..196D ; Vowel # Lo [11] TAI LE LETTER A..TAI LE LETTER AI +A85E..A861 ; Vowel # Lo [4] PHAGS-PA LETTER I..PHAGS-PA LETTER O +A866 ; Vowel # Lo [1] PHAGS-PA LETTER EE +A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO +A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Placeholder + +# Consonant Placeholder +# This includes generic placeholders used for +# Indic script layout (NBSP and dotted circle), as well as a few script- +# specific vowel-holder characters which are not technically +# consonants, but serve instead as bases for placement of vowel marks. 
+ +# [Not derivable] + +00A0 ; Consonant_Placeholder # Zs NO-BREAK SPACE +0A72..0A73 ; Consonant_Placeholder # Lo [2] GURMUKHI IRI..GURMUKHI URA +1900 ; Consonant_Placeholder # Lo LIMBU VOWEL-CARRIER LETTER +25CC ; Consonant_Placeholder # So DOTTED CIRCLE + +# ================================================ + +# Indic_Syllabic_Category=Consonant + +# Consonant (ordinary abugida consonants, with inherent vowels) + +# [Not derivable] + +0915..0939 ; Consonant # Lo [37] DEVANAGARI LETTER KA..DEVANAGARI LETTER HA +0958..095F ; Consonant # Lo [8] DEVANAGARI LETTER QA..DEVANAGARI LETTER YYA +0979..097F ; Consonant # Lo [7] DEVANAGARI LETTER ZHA..DEVANAGARI LETTER BBA +0995..09A8 ; Consonant # Lo [20] BENGALI LETTER KA..BENGALI LETTER NA +09AA..09B0 ; Consonant # Lo [7] BENGALI LETTER PA..BENGALI LETTER RA +09B2 ; Consonant # Lo BENGALI LETTER LA +09B6..09B9 ; Consonant # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA +09DC..09DD ; Consonant # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA +09DF ; Consonant # Lo BENGALI LETTER YYA +09F0..09F1 ; Consonant # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH LOWER DIAGONAL +0A15..0A28 ; Consonant # Lo [20] GURMUKHI LETTER KA..GURMUKHI LETTER NA +0A2A..0A30 ; Consonant # Lo [7] GURMUKHI LETTER PA..GURMUKHI LETTER RA +0A32..0A33 ; Consonant # Lo [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA +0A35..0A36 ; Consonant # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA +0A38..0A39 ; Consonant # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA +0A59..0A5C ; Consonant # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA +0A5E ; Consonant # Lo GURMUKHI LETTER FA +0A95..0AA8 ; Consonant # Lo [20] GUJARATI LETTER KA..GUJARATI LETTER NA +0AAA..0AB0 ; Consonant # Lo [7] GUJARATI LETTER PA..GUJARATI LETTER RA +0AB2..0AB3 ; Consonant # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA +0AB5..0AB9 ; Consonant # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA +0B15..0B28 ; Consonant # Lo [20] ORIYA LETTER KA..ORIYA LETTER NA +0B2A..0B30 ; 
Consonant # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA +0B32..0B33 ; Consonant # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA +0B35..0B39 ; Consonant # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA +0B5C..0B5D ; Consonant # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA +0B5F ; Consonant # Lo ORIYA LETTER YYA +0B71 ; Consonant # Lo ORIYA LETTER WA +0B95 ; Consonant # Lo TAMIL LETTER KA +0B99..0B9A ; Consonant # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA +0B9C ; Consonant # Lo TAMIL LETTER JA +0B9E..0B9F ; Consonant # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA +0BA3..0BA4 ; Consonant # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA +0BA8..0BAA ; Consonant # Lo [3] TAMIL LETTER NA..TAMIL LETTER PA +0BAE..0BB9 ; Consonant # Lo [12] TAMIL LETTER MA..TAMIL LETTER HA +0C15..0C28 ; Consonant # Lo [20] TELUGU LETTER KA..TELUGU LETTER NA +0C2A..0C33 ; Consonant # Lo [10] TELUGU LETTER PA..TELUGU LETTER LLA +0C35..0C39 ; Consonant # Lo [5] TELUGU LETTER VA..TELUGU LETTER HA +0C58..0C59 ; Consonant # Lo [2] TELUGU LETTER TSA..TELUGU LETTER DZA +0C95..0CA8 ; Consonant # Lo [20] KANNADA LETTER KA..KANNADA LETTER NA +0CAA..0CB3 ; Consonant # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA +0CB5..0CB9 ; Consonant # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA +0CDE ; Consonant # Lo KANNADA LETTER FA +0D15..0D3A ; Consonant # Lo [38] MALAYALAM LETTER KA..MALAYALAM LETTER TTTA +0D9A..0DB1 ; Consonant # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA +0DB3..0DBB ; Consonant # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA +0DBD ; Consonant # Lo SINHALA LETTER DANTAJA LAYANNA +0DC0..0DC6 ; Consonant # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA +0E01..0E2E ; Consonant # Lo [46] THAI CHARACTER KO KAI..THAI CHARACTER NOKHUK +0E81..0E82 ; Consonant # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG +0E84 ; Consonant # Lo LAO LETTER KHO TAM +0E87..0E88 ; Consonant # Lo [2] LAO LETTER NGO..LAO LETTER CO +0E8A ; Consonant # Lo LAO LETTER SO TAM +0E8D ; Consonant # Lo LAO 
LETTER NYO +0E94..0E97 ; Consonant # Lo [4] LAO LETTER DO..LAO LETTER THO TAM +0E99..0E9F ; Consonant # Lo [7] LAO LETTER NO..LAO LETTER FO SUNG +0EA1..0EA3 ; Consonant # Lo [3] LAO LETTER MO..LAO LETTER LO LING +0EA5 ; Consonant # Lo LAO LETTER LO LOOT +0EA7 ; Consonant # Lo LAO LETTER WO +0EAA..0EAB ; Consonant # Lo [2] LAO LETTER SO SUNG..LAO LETTER HO SUNG +0EAD..0EAE ; Consonant # Lo [2] LAO LETTER O..LAO LETTER HO TAM +0EDC..0EDD ; Consonant # Lo [2] LAO HO NO..LAO HO MO +0F40..0F47 ; Consonant # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA +0F49..0F6C ; Consonant # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA +1000..1020 ; Consonant # Lo [33] MYANMAR LETTER KA..MYANMAR LETTER LLA +103F ; Consonant # Lo MYANMAR LETTER GREAT SA +1050..1051 ; Consonant # Lo [2] MYANMAR LETTER SHA..MYANMAR LETTER SSA +105A..105D ; Consonant # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE +1061 ; Consonant # Lo MYANMAR LETTER SGAW KAREN SHA +1065..1066 ; Consonant # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER WESTERN PWO KAREN PWA +106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA +1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA +108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA +1703..170C ; Consonant # Lo [10] TAGALOG LETTER KA..TAGALOG LETTER YA +170E..1711 ; Consonant # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1723..1731 ; Consonant # Lo [15] HANUNOO LETTER KA..HANUNOO LETTER HA +1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA +1763..176C ; Consonant # Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA +176E..1770 ; Consonant # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA +1780..17A2 ; Consonant # Lo [35] KHMER LETTER KA..KHMER LETTER QA +1901..191C ; Consonant # Lo [28] LIMBU LETTER KA..LIMBU LETTER HA +1950..1962 ; Consonant # Lo [19] TAI LE LETTER KA..TAI LE LETTER NA +1980..19AB ; Consonant # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI 
LUE LETTER LOW SUA +1A00..1A16 ; Consonant # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA +1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA +1A53..1A54 ; Consonant # Lo [2] TAI THAM LETTER LAE..TAI THAM LETTER GREAT SA +1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA +1B45..1B4B ; Consonant # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA +1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA +1BBB..1BBD ; Consonant # Lo [3] SUNDANESE LETTER REU..SUNDANESE LETTER BHA +1BC0..1BE3 ; Consonant # Lo [36] BATAK LETTER A..BATAK LETTER MBA +1C00..1C23 ; Consonant # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A +1C4D..1C4F ; Consonant # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA +A807..A80A ; Consonant # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO +A80C..A822 ; Consonant # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO +A840..A85D ; Consonant # Lo [30] PHAGS-PA LETTER KA..PHAGS-PA LETTER A +A862..A865 ; Consonant # Lo [4] PHAGS-PA LETTER QA..PHAGS-PA LETTER GGA +A869..A870 ; Consonant # Lo [8] PHAGS-PA LETTER TTA..PHAGS-PA LETTER ASPIRATED FA +A872 ; Consonant # Lo PHAGS-PA SUPERFIXED LETTER RA +A892..A8B3 ; Consonant # Lo [34] SAURASHTRA LETTER KA..SAURASHTRA LETTER LLA +A90A..A921 ; Consonant # Lo [24] KAYAH LI LETTER KA..KAYAH LI LETTER CA +A930..A946 ; Consonant # Lo [23] REJANG LETTER KA..REJANG LETTER A +A989..A98B ; Consonant # Lo [3] JAVANESE LETTER PA CEREK..JAVANESE LETTER NGA LELET RASWADI +A98F..A9B2 ; Consonant # Lo [36] JAVANESE LETTER KA..JAVANESE LETTER HA +AA06..AA28 ; Consonant # Lo [35] CHAM LETTER KA..CHAM LETTER HA +AA60..AA6F ; Consonant # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA +AA71..AA73 ; Consonant # Lo [3] MYANMAR LETTER KHAMTI XA..MYAMNAR LETTER KHAMTI RA +AA7A ; Consonant # Lo MYANMAR LETTER AITON RA +AA80..AAAF ; Consonant # Lo [48] TAI VIET 
LETTER LOW KO..TAI VIET LETTER HIGH O +AAE2..AAEA ; Consonant # Lo [9] MEETEI MAYEK LETTER CHA..MEETEI MAYEK LETTER SSA +ABC0..ABCD ; Consonant # Lo [14] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER HUK +ABD0 ; Consonant # Lo MEETEI MAYEK LETTER PHAM +ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTER BHAM +10A00 ; Consonant # Lo KHAROSHTHI LETTER A +10A10..10A13 ; Consonant # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA +10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA +10A19..10A33 ; Consonant # Lo [27] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER TTTHA +11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER OLD TAMIL NNNA +1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA +11107..11126 ; Consonant # Lo [32] CHAKMA LETTER KAA..CHAKMA LETTER HAA +11191..111B2 ; Consonant # Lo [34] SHARADA LETTER KA..SHARADA LETTER HA +1168A..116AA ; Consonant # Lo [34] TAKRI LETTER KA..TAKRI LETTER RRA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Dead + +# Dead Consonant (special consonant with killed vowel) + +# [Not derivable] + +09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Repha + +# Repha Form of RA (reanalyzed in some scripts) + +# [Not derivable] + +0D4E ; Consonant_Repha # Lo MALAYALAM LETTER DOT REPH +17CC ; Consonant_Repha # Mn KHMER SIGN ROBAT +1B03 ; Consonant_Repha # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Repha # Mn SUNDANESE SIGN PANGLAYAR +A982 ; Consonant_Repha # Mn JAVANESE SIGN LAYAR + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Subjoined + +# Subjoined Consonant (C2 form subtending a base consonant in Tibetan, etc.) 
+ +# [Not derivable] + +0F8D..0F97 ; Consonant_Subjoined # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Consonant_Subjoined # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +1929..192B ; Consonant_Subjoined # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1BA1 ; Consonant_Subjoined # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA2..1BA3 ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BAC..1BAD ; Consonant_Subjoined # Mc [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C24..1C25 ; Consonant_Subjoined # Mc [2] LEPCHA SUBJOINED LETTER YA..LEPCHA SUBJOINED LETTER RA +A867..A868 ; Consonant_Subjoined # Lo [2] PHAGS-PA SUBJOINED LETTER WA..PHAGS-PA SUBJOINED LETTER YA +A871 ; Consonant_Subjoined # Lo PHAGS-PA SUBJOINED LETTER RA +A9BD ; Consonant_Subjoined # Mc JAVANESE CONSONANT SIGN KERET + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Medial + +# Medial Consonant (medial liquid, occurring in clusters) + +# [Not derivable] + +0A75 ; Consonant_Medial # Mn GURMUKHI SIGN YAKASH +0EBC ; Consonant_Medial # Mn LAO SEMIVOWEL SIGN LO +0EBD ; Consonant_Medial # Lo LAO SEMIVOWEL SIGN NYO +103B..103C ; Consonant_Medial # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA +103D..103E ; Consonant_Medial # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +105E..1060 ; Consonant_Medial # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Consonant_Medial # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +1A55 ; Consonant_Medial # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A56 ; Consonant_Medial # Mn TAI THAM CONSONANT SIGN MEDIAL LA +A9BE..A9BF ; Consonant_Medial # Mc [2] JAVANESE CONSONANT SIGN PENGKAL..JAVANESE CONSONANT SIGN CAKRA +AA33..AA34 ; Consonant_Medial # Mc [2] CHAM CONSONANT SIGN YA..CHAM 
CONSONANT SIGN RA +AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Final + +# Final Consonant (special final forms which do not take vowels) + +# [Not derivable] + +1930..1931 ; Consonant_Final # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Consonant_Final # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B +1A57 ; Consonant_Final # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A58..1A5E ; Consonant_Final # Mn [7] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN SA +1BBE..1BBF ; Consonant_Final # Lo [2] SUNDANESE LETTER FINAL K..SUNDANESE LETTER FINAL M +1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H +1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +A8B4 ; Consonant_Final # Mc SAURASHTRA CONSONANT SIGN HAARU +A94F..A951 ; Consonant_Final # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A952 ; Consonant_Final # Mc REJANG CONSONANT SIGN H +AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG +AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG +AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS +AA4C ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL M +AA4D ; Consonant_Final # Mc CHAM CONSONANT SIGN FINAL H +ABDB..ABE2 ; Consonant_Final # Lo [8] MEETEI MAYEK LETTER KOK LONSUM..MEETEI MAYEK LETTER I LONSUM + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Head_Letter + +# Head Letter (Tibetan) + +# [Not derivable] + +0F88..0F8C ; Consonant_Head_Letter # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN + +# ================================================ + +# Indic_Syllabic_Category=Modifying_Letter + +# Reanalyzed 
letters not participating in the abugida structure, but +# serving to modify the sound of an adjacent vowel or consonant. +# Note that this is not the same as General_Category=Modifier_Letter. + +# [Not derivable] + +0B83 ; Modifying_Letter # Lo TAMIL SIGN VISARGA (aytham) + +# ================================================ + +# Indic_Syllabic_Category=Tone_Letter + +# Tone Letter (spacing lexical tone mark with status as a letter) + +# [Not derivable] + +1970..1974 ; Tone_Letter # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6 +AAC0 ; Tone_Letter # Lo TAI VIET TONE MAI NUENG +AAC2 ; Tone_Letter # Lo TAI VIET TONE MAI SONG + +# ================================================ + +# Indic_Syllabic_Category=Tone_Mark + +# Tone Mark (nonspacing or spacing lexical tone mark) +# Excludes Vedic tone marks, which are more akin to cantillation marks. + +# [Not derivable] + +0E48..0E4B ; Tone_Mark # Mn [4] THAI CHARACTER MAI EK..THAI CHARACTER MAI CHATTAWA +0EC8..0ECB ; Tone_Mark # Mn [4] LAO TONE MAI EK..LAO TONE MAI CATAWA +1037 ; Tone_Mark # Mn MYANMAR SIGN DOT BELOW +1063..1064 ; Tone_Mark # Mc [2] MYANMAR TONE MARK SGAW KAREN HATHI..MYANMAR TONE MARK SGAW KAREN KE PHO +1069..106D ; Tone_Mark # Mc [5] MYANMAR SIGN WESTERN PWO KAREN TONE-1..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1087..108C ; Tone_Mark # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108D ; Tone_Mark # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +108F ; Tone_Mark # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109B ; Tone_Mark # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 +19C8..19C9 ; Tone_Mark # Mc [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A75..1A79 ; Tone_Mark # Mn [5] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN TONE-5 +A92B..A92D ; Tone_Mark # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +AA7B ; Tone_Mark # Mc MYANMAR SIGN PAO KAREN TONE +AABF ; Tone_Mark # Mn TAI VIET TONE MAI EK +AAC1 ; Tone_Mark # Mn TAI VIET TONE MAI THO +ABEC ; 
Tone_Mark # Mc MEETEI MAYEK LUM IYEK + +# ================================================ + +# Indic_Syllabic_Category=Register_Shifter + +# Register Shifter (shifts register for consonants, akin to a tone mark) + +# [Not derivable] + +17C9..17CA ; Register_Shifter # Mn [2] KHMER SIGN MUUSIKATOAN..KHMER SIGN TRIISAP + +# EOF diff --git a/data/7.0.0-indic-positional-category.txt b/data/7.0.0-indic-positional-category.txt new file mode 100644 index 0000000..c3a0943 --- /dev/null +++ b/data/7.0.0-indic-positional-category.txt @@ -0,0 +1,501 @@ +# IndicMatraCategory-7.0.0.txt +# Date: 2014-06-03, 07:00:00 GMT [KW, LI, AG, RP] +# +# Unicode Character Database +# Copyright (c) 1991-2014 Unicode, Inc. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following provisional property: +# +# Indic_Matra_Category enumerated property +# +# NB: Provisional properties and data files have no associated stability +# guarantees. They are provided in part to determine the possible usefulness +# of a property or other data and to encourage analysis and further investigation +# which may result in their improvement. Provisional properties and data files +# may change arbitrarily, or may even be removed in a future version of the +# Unicode Character Database, if they prove not to be useful. +# +# Scope: This provisional property is aimed at the problem of +# the specification of syllabic structure for Indic scripts. +# Because dependent vowels (and visible viramas, where they occur) +# are placed in notional slots around the consonant (or consonant +# cluster) core of an Indic syllable, there may be cooccurrence +# constraints or other interactions. 
Also, it may be desirable, +# in cases where more than one dependent vowel may occur in +# sequence, as for example, in a top slot and a bottom slot, to +# specify preferred orders for spelling. As such, this property +# is designed primarily to supplement the Indic_Syllabic_Category +# property. +# +# Note that this provisional property is *not* intended as +# a prescriptive property regarding display or font design, +# for a number of reasons. Good font design requires information +# that is outside the context of a character encoding standard, +# and is best handled in other venues. For Indic dependent +# vowels, in particular: +# +# 1. Matra placement may vary somewhat based on typeface design. +# 2. Matra placement, even within a single script, may vary +# somewhat according to historic period or local conventions. +# 3. Matra placement may be changed by explicit orthographic reform +# decisions. +# 4. Matras may ligate in various ways with a consonant (or even +# other elements of a syllable) instead of occurring in a +# discrete location. +# 5. Matra display may be contextually determined. This is +# notable, for example, in the Tamil script, where the shape +# and placement of -u and -uu vowels depends strongly on +# which consonant they adjoin. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Matra_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. 
+# +# The scripts assessed as containing dependent vowels or viramas in the +# structural sense used for the Indic_Matra_Category are the following: +# +# Balinese, Batak, Bengali, Brahmi, Buginese, Buhid, Chakma, Cham, +# Devanagari, Grantha, Gujarati, Gurmukhi, Hanunoo, Javanese, Kaithi, +# Kannada, Kharoshthi, Khmer, Khojki, Khudawadi, Lao, Lepcha, Limbu, +# Malayalam, Meetei Mayek, Modi, Myanmar, New Tai Lue, Oriya, Rejang, +# Saurashtra, Sharada, Siddham, Sinhala, Sundanese, Syloti Nagri, +# Tagalog, Tagbanwa, Tai Tham, Tai Viet, Takri, Tamil, Telugu, Thai, +# Tibetan, and Tirhuta. +# +# All characters for all other scripts not in that list +# take the default value for this property. +# +# See IndicSyllabicCategory.txt for a slightly more extended +# list of Indic scripts, including those which do not have +# dependent vowel characters. Currently, those additional +# Indic scripts without dependent vowel characters are +# Kayah Li, Mahajani, Phags-pa, and Tai Le. +# + +# ================================================ + +# Property: Indic_Matra_Category +# +# All code points not explicitly listed for Indic_Matra_Category +# have the value NA (not applicable). 
+# +# @missing: 0000..10FFFF; NA + +# Only characters from the following syllabic categories have +# a non-default value for the Indic_Matra_Category property: +# - dependent vowels (Indic_Syllabic_Category=Vowel_Dependent) +# - viramas (Indic_Syllabic_Category=Virama) +# - pure killers (Indic_Syllabic_Category=Pure_Killer) +# - gemination marks (Indic_Syllabic_Category=Gemination_Mark) +# - left-reordrant instances of medial consonants +# (Indic_Syllabic_Category=Consonant_Medial) +# - bindi (Indic_Syllabic_Category=Bindu) in Lepcha +# - repha forms of ra succeeding the main consonant +# (Indic_Syllabic_Category=Consonant_Succeeding_Repha) +# - register shifters (Indic_Syllabic_Category=Register_Shifter) + +# ------------------------------------------------ + +# Indic_Matra_Category=Right + +093B ; Right # Mc DEVANAGARI VOWEL SIGN OOE +093E ; Right # Mc DEVANAGARI VOWEL SIGN AA +0940 ; Right # Mc DEVANAGARI VOWEL SIGN II +0949..094C ; Right # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094F ; Right # Mc DEVANAGARI VOWEL SIGN AW +09BE ; Right # Mc BENGALI VOWEL SIGN AA +09C0 ; Right # Mc BENGALI VOWEL SIGN II +09D7 ; Right # Mc BENGALI AU LENGTH MARK +0A3E ; Right # Mc GURMUKHI VOWEL SIGN AA +0A40 ; Right # Mc GURMUKHI VOWEL SIGN II +0ABE ; Right # Mc GUJARATI VOWEL SIGN AA +0AC0 ; Right # Mc GUJARATI VOWEL SIGN II +0ACB..0ACC ; Right # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0B3E ; Right # Mc ORIYA VOWEL SIGN AA +0B40 ; Right # Mc ORIYA VOWEL SIGN II +0BBE..0BBF ; Right # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BD7 ; Right # Mc TAMIL AU LENGTH MARK +0C41..0C44 ; Right # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0CBE ; Right # Mc KANNADA VOWEL SIGN AA +0CC1..0CC4 ; Right # Mc [4] KANNADA VOWEL SIGN U..KANNADA VOWEL SIGN VOCALIC RR +0CD5..0CD6 ; Right # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0D3E..0D40 ; Right # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D42 ; Right # Mn 
[2] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN UU +# Note: U and UU form complex ligatures with consonants in older Malayalam orthography. +0D57 ; Right # Mc MALAYALAM AU LENGTH MARK +0DCF..0DD1 ; Right # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD8 ; Right # Mc SINHALA VOWEL SIGN GAETTA-PILLA +0DDF ; Right # Mc SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Right # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Right # Lo THAI CHARACTER SARA A +0E32..0E33 ; Right # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E45 ; Right # Lo THAI CHARACTER LAKKHANGYAO +0EB0 ; Right # Lo LAO VOWEL SIGN A +0EB2..0EB3 ; Right # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +102B..102C ; Right # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +1056..1057 ; Right # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1062 ; Right # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Right # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1083 ; Right # Mc MYANMAR VOWEL SIGN SHAN AA +109C ; Right # Mc MYANMAR VOWEL SIGN AITON A +17B6 ; Right # Mc KHMER VOWEL SIGN AA +17C8 ; Right # Mc KHMER SIGN YUUKALEAPINTU +1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI +19B0..19B4 ; Right # Mc [5] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN UU +19B8..19B9 ; Right # Mc [2] NEW TAI LUE VOWEL SIGN OA..NEW TAI LUE VOWEL SIGN UE +19BB..19C0 ; Right # Mc [6] NEW TAI LUE VOWEL SIGN AAY..NEW TAI LUE VOWEL SIGN IY +1A1A ; Right # Mc BUGINESE VOWEL SIGN O +1A61 ; Right # Mc TAI THAM VOWEL SIGN A +1A63..1A64 ; Right # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A6D ; Right # Mc TAI THAM VOWEL SIGN OY +1B35 ; Right # Mc BALINESE VOWEL SIGN TEDUNG +1B44 ; Right # Mc BALINESE ADEG ADEG +1BA7 ; Right # Mc SUNDANESE VOWEL SIGN PANOLONG +1BAA ; Right # Mc SUNDANESE SIGN PAMAAEH +1BE7 ; Right # Mc BATAK VOWEL SIGN 
E +1BEA..1BEC ; Right # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BEE ; Right # Mc BATAK VOWEL SIGN U +1BF2..1BF3 ; Right # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +1C26 ; Right # Mc LEPCHA VOWEL SIGN AA +1C2A..1C2B ; Right # Mc [2] LEPCHA VOWEL SIGN U..LEPCHA VOWEL SIGN UU +A823..A824 ; Right # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A827 ; Right # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Right # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A953 ; Right # Mc REJANG VIRAMA +A9B4..A9B5 ; Right # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +AAB1 ; Right # Lo TAI VIET VOWEL AA +AABA ; Right # Lo TAI VIET VOWEL UA +AABD ; Right # Lo TAI VIET VOWEL AN +AAEF ; Right # Mc MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE6..ABE7 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE9..ABEA ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +110B0 ; Right # Mc KAITHI VOWEL SIGN AA +110B2 ; Right # Mc KAITHI VOWEL SIGN II +110B7..110B8 ; Right # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +111B3 ; Right # Mc SHARADA VOWEL SIGN AA +111B5 ; Right # Mc SHARADA VOWEL SIGN II +111C0 ; Right # Mc SHARADA SIGN VIRAMA +1122C..1122E ; Right # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +11235 ; Right # Mc KHOJKI SIGN VIRAMA +112E0 ; Right # Mc KHUDAWADI VOWEL SIGN AA +112E2 ; Right # Mc KHUDAWADI VOWEL SIGN II +1133E..1133F ; Right # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11341..11342 ; Right # Mc [2] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN UU +# Note: U and UU have contextually variable placement in Grantha. 
+11343..11344 ; Right # Mc [2] GRANTHA VOWEL SIGN VOCALIC R..GRANTHA VOWEL SIGN VOCALIC RR +1134D ; Right # Mc GRANTHA SIGN VIRAMA +11357 ; Right # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Right # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +114B0 ; Right # Mc TIRHUTA VOWEL SIGN AA +114B2 ; Right # Mc TIRHUTA VOWEL SIGN II +114BD ; Right # Mc TIRHUTA VOWEL SIGN SHORT O +115AF ; Right # Mc SIDDHAM VOWEL SIGN AA +115B1 ; Right # Mc SIDDHAM VOWEL SIGN II +11630..11632 ; Right # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +1163B..1163C ; Right # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +116AF ; Right # Mc TAKRI VOWEL SIGN II + +# Indic_Matra_Category=Left + +093F ; Left # Mc DEVANAGARI VOWEL SIGN I +094E ; Left # Mc DEVANAGARI VOWEL SIGN PRISHTHAMATRA E +09BF ; Left # Mc BENGALI VOWEL SIGN I +09C7..09C8 ; Left # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +0A3F ; Left # Mc GURMUKHI VOWEL SIGN I +0ABF ; Left # Mc GUJARATI VOWEL SIGN I +0B47 ; Left # Mc ORIYA VOWEL SIGN E +0BC6..0BC8 ; Left # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0D46..0D48 ; Left # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0DD9 ; Left # Mc SINHALA VOWEL SIGN KOMBUVA +0DDB ; Left # Mc SINHALA VOWEL SIGN KOMBU DEKA +1031 ; Left # Mc MYANMAR VOWEL SIGN E +1084 ; Left # Mc MYANMAR VOWEL SIGN SHAN E +17C1..17C3 ; Left # Mc [3] KHMER VOWEL SIGN E..KHMER VOWEL SIGN AI +19B5..19B7 ; Left # Mc [3] NEW TAI LUE VOWEL SIGN E..NEW TAI LUE VOWEL SIGN O +19BA ; Left # Mc NEW TAI LUE VOWEL SIGN AY +1A19 ; Left # Mc BUGINESE VOWEL SIGN E +1A55 ; Left # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A6E..1A72 ; Left # Mc [5] TAI THAM VOWEL SIGN E..TAI THAM VOWEL SIGN THAM AI +1B3E..1B3F ; Left # Mc [2] BALINESE VOWEL SIGN TALING..BALINESE VOWEL SIGN TALING REPA +1BA6 ; Left # Mc SUNDANESE VOWEL SIGN PANAELAENG +1C27..1C28 ; Left # Mc [2] LEPCHA VOWEL SIGN I..LEPCHA VOWEL SIGN O +1C34..1C35 ; Left # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG 
+A9BA..A9BB ; Left # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +AA2F..AA30 ; Left # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA34 ; Left # Mc CHAM CONSONANT SIGN RA +AAEB ; Left # Mc MEETEI MAYEK VOWEL SIGN II +AAEE ; Left # Mc MEETEI MAYEK VOWEL SIGN AU +110B1 ; Left # Mc KAITHI VOWEL SIGN I +1112C ; Left # Mc CHAKMA VOWEL SIGN E +111B4 ; Left # Mc SHARADA VOWEL SIGN I +112E1 ; Left # Mc KHUDAWADI VOWEL SIGN I +11347..11348 ; Left # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +114B1 ; Left # Mc TIRHUTA VOWEL SIGN I +114B9 ; Left # Mc TIRHUTA VOWEL SIGN E +115B0 ; Left # Mc SIDDHAM VOWEL SIGN I +115B8 ; Left # Mc SIDDHAM VOWEL SIGN E +116AE ; Left # Mc TAKRI VOWEL SIGN I + +# Indic_Matra_Category=Visual_Order_Left + +# These are dependent vowels that occur to the left of the consonant +# letter in a syllable, but which occur in scripts using the visual order +# model, instead of the logical order model. Because of the different +# model, these left-side vowels occur first in the backing store (before +# the consonant letter) and are not reordered during text rendering. 
+# +# [Derivation: Logical_Order_Exception=Yes] + +0E40..0E44 ; Visual_Order_Left # Lo [5] THAI CHARACTER SARA E..THAI CHARACTER SARA AI MAIMALAI +0EC0..0EC4 ; Visual_Order_Left # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +AAB5..AAB6 ; Visual_Order_Left # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB9 ; Visual_Order_Left # Lo TAI VIET VOWEL UEA +AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL AY + +# Indic_Matra_Category=Left_And_Right + +09CB..09CC ; Left_And_Right # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +0B4B ; Left_And_Right # Mc ORIYA VOWEL SIGN O +0BCA..0BCC ; Left_And_Right # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0D4A..0D4C ; Left_And_Right # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0DDC ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA +0DDE ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA +17C0 ; Left_And_Right # Mc KHMER VOWEL SIGN IE +17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU +1B40..1B41 ; Left_And_Right # Mc [2] BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1134B..1134C ; Left_And_Right # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +114BC ; Left_And_Right # Mc TIRHUTA VOWEL SIGN O +114BE ; Left_And_Right # Mc TIRHUTA VOWEL SIGN AU +115BA ; Left_And_Right # Mc SIDDHAM VOWEL SIGN O + +# Indic_Matra_Category=Top + +093A ; Top # Mn DEVANAGARI VOWEL SIGN OE +0945..0948 ; Top # Mn [4] DEVANAGARI VOWEL SIGN CANDRA E..DEVANAGARI VOWEL SIGN AI +0955 ; Top # Mn DEVANAGARI VOWEL SIGN CANDRA LONG E +0A47..0A48 ; Top # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Top # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0A71 ; Top # Mn GURMUKHI ADDAK +0AC5 ; Top # Mn GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Top # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0B3F ; Top # Mn ORIYA VOWEL SIGN I +0B56 ; Top # Mn ORIYA AI LENGTH MARK +0BC0 ; Top # Mn TAMIL VOWEL SIGN 
II +0BCD ; Top # Mn TAMIL SIGN VIRAMA +0C3E..0C40 ; Top # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C46..0C47 ; Top # Mn [2] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN EE +0C4A..0C4D ; Top # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA +0C55 ; Top # Mn TELUGU LENGTH MARK +0CBF ; Top # Mn KANNADA VOWEL SIGN I +0CC6 ; Top # Mn KANNADA VOWEL SIGN E +0CCC..0CCD ; Top # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA +0D4D ; Top # Mn MALAYALAM SIGN VIRAMA +0DCA ; Top # Mn SINHALA SIGN AL-LAKUNA +0DD2..0DD3 ; Top # Mn [2] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN DIGA IS-PILLA +0E31 ; Top # Mn THAI CHARACTER MAI HAN-AKAT +0E34..0E37 ; Top # Mn [4] THAI CHARACTER SARA I..THAI CHARACTER SARA UEE +0E47 ; Top # Mn THAI CHARACTER MAITAIKHU +0E4E ; Top # Mn THAI CHARACTER YAMAKKAN +0EB1 ; Top # Mn LAO VOWEL SIGN MAI KAN +0EB4..0EB7 ; Top # Mn [4] LAO VOWEL SIGN I..LAO VOWEL SIGN YY +0EBB ; Top # Mn LAO VOWEL SIGN MAI KON +0F72 ; Top # Mn TIBETAN VOWEL SIGN I +0F7A..0F7D ; Top # Mn [4] TIBETAN VOWEL SIGN E..TIBETAN VOWEL SIGN OO +0F80 ; Top # Mn TIBETAN VOWEL SIGN REVERSED I +102D..102E ; Top # Mn [2] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN II +1032..1035 ; Top # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +103A ; Top # Mn MYANMAR SIGN ASAT +1071..1074 ; Top # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1085..1086 ; Top # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109D ; Top # Mn MYANMAR VOWEL SIGN AITON AI +1712 ; Top # Mn TAGALOG VOWEL SIGN I +1732 ; Top # Mn HANUNOO VOWEL SIGN I +1752 ; Top # Mn BUHID VOWEL SIGN I +1772 ; Top # Mn TAGBANWA VOWEL SIGN I +17B7..17BA ; Top # Mn [4] KHMER VOWEL SIGN I..KHMER VOWEL SIGN YY +17C9..17D1 ; Top # Mn [9] KHMER SIGN MUUSIKATOAN..KHMER SIGN VIRIAM +17D3 ; Top # Mn KHMER SIGN BATHAMASAT +1920..1921 ; Top # Mn [2] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN I +1927..1928 ; Top # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +1A17 ; Top # Mn BUGINESE VOWEL 
SIGN I +1A1B ; Top # Mn BUGINESE VOWEL SIGN AE +1A62 ; Top # Mn TAI THAM VOWEL SIGN MAI SAT +1A65..1A68 ; Top # Mn [4] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN UUE +1A6B ; Top # Mn TAI THAM VOWEL SIGN O +1A73..1A74 ; Top # Mn [2] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN MAI KANG +1B36..1B37 ; Top # Mn [2] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN ULU SARI +1B42 ; Top # Mn BALINESE VOWEL SIGN PEPET +1BA4 ; Top # Mn SUNDANESE VOWEL SIGN PANGHULU +1BA8..1BA9 ; Top # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE8..1BE9 ; Top # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BED ; Top # Mn BATAK VOWEL SIGN KARO O +1BEF ; Top # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +A806 ; Top # Mn SYLOTI NAGRI SIGN HASANTA +A826 ; Top # Mn SYLOTI NAGRI VOWEL SIGN E +A94A ; Top # Mn REJANG VOWEL SIGN AI +A9B6..A9B7 ; Top # Mn [2] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN WULU MELIK +A9BC ; Top # Mn JAVANESE VOWEL SIGN PEPET +AA29..AA2C ; Top # Mn [4] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN EI +AA2E ; Top # Mn CHAM VOWEL SIGN OE +AA31 ; Top # Mn CHAM VOWEL SIGN AU +AAB0 ; Top # Mn TAI VIET MAI KANG +AAB2..AAB3 ; Top # Mn [2] TAI VIET VOWEL I..TAI VIET VOWEL UE +AAB7..AAB8 ; Top # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AABE ; Top # Mn TAI VIET VOWEL AM +AAED ; Top # Mn MEETEI MAYEK VOWEL SIGN AAI +ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP +10A05 ; Top # Mn KHAROSHTHI VOWEL SIGN E +11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II +11042..11046 ; Top # Mn [5] BRAHMI VOWEL SIGN E..BRAHMI VIRAMA +110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI VOWEL SIGN AI +11127..11129 ; Top # Mn [3] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN II +1112D ; Top # Mn CHAKMA VOWEL SIGN AI +11130 ; Top # Mn CHAKMA VOWEL SIGN OI +11134 ; Top # Mn CHAKMA MAAYYAA +111BC..111BE ; Top # Mn [3] SHARADA VOWEL SIGN E..SHARADA VOWEL SIGN O +11230..11231 ; Top # Mn [2] KHOJKI VOWEL SIGN E..KHOJKI VOWEL SIGN AI +11237 ; Top # Mn KHOJKI SIGN 
SHADDA +112E5..112E8 ; Top # Mn [4] KHUDAWADI VOWEL SIGN E..KHUDAWADI VOWEL SIGN AU +11340 ; Top # Mn GRANTHA VOWEL SIGN II +114BA ; Top # Mn TIRHUTA VOWEL SIGN SHORT E +11639..1163A ; Top # Mn [2] MODI VOWEL SIGN E..MODI VOWEL SIGN AI +116AD ; Top # Mn TAKRI VOWEL SIGN AA +116B2..116B5 ; Top # Mn [4] TAKRI VOWEL SIGN E..TAKRI VOWEL SIGN AU +116B6 ; Top # Mc TAKRI SIGN VIRAMA + +# Indic_Matra_Category=Bottom + +0941..0944 ; Bottom # Mn [4] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN VOCALIC RR +094D ; Bottom # Mn DEVANAGARI SIGN VIRAMA +0956..0957 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN UE..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09C1..09C4 ; Bottom # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09CD ; Bottom # Mn BENGALI SIGN VIRAMA +09E2..09E3 ; Bottom # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A41..0A42 ; Bottom # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A4D ; Bottom # Mn GURMUKHI SIGN VIRAMA +0AC1..0AC4 ; Bottom # Mn [4] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN VOCALIC RR +0ACD ; Bottom # Mn GUJARATI SIGN VIRAMA +0AE2..0AE3 ; Bottom # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B4D ; Bottom # Mn ORIYA SIGN VIRAMA +0B62..0B63 ; Bottom # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BC1..0BC2 ; Bottom # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +# Note: U and UU have contextually variable placement in Tamil. 
+0C56 ; Bottom # Mn TELUGU AI LENGTH MARK +0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CE2..0CE3 ; Bottom # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D43..0D44 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC R..MALAYALAM VOWEL SIGN VOCALIC RR +0D62..0D63 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DD4 ; Bottom # Mn SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Bottom # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0E38..0E3A ; Bottom # Mn [3] THAI CHARACTER SARA U..THAI CHARACTER PHINTHU +0EB8..0EB9 ; Bottom # Mn [2] LAO VOWEL SIGN U..LAO VOWEL SIGN UU +0F71 ; Bottom # Mn TIBETAN VOWEL SIGN AA +0F74..0F75 ; Bottom # Mn [2] TIBETAN VOWEL SIGN U..TIBETAN VOWEL SIGN UU +0F84 ; Bottom # Mn TIBETAN MARK HALANTA +102F..1030 ; Bottom # Mn [2] MYANMAR VOWEL SIGN U..MYANMAR VOWEL SIGN UU +1058..1059 ; Bottom # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1713..1714 ; Bottom # Mn [2] TAGALOG VOWEL SIGN U..TAGALOG SIGN VIRAMA +1733..1734 ; Bottom # Mn [2] HANUNOO VOWEL SIGN U..HANUNOO SIGN PAMUDPOD +1753 ; Bottom # Mn BUHID VOWEL SIGN U +1773 ; Bottom # Mn TAGBANWA VOWEL SIGN U +17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA +1922 ; Bottom # Mn LIMBU VOWEL SIGN U +1A18 ; Bottom # Mn BUGINESE VOWEL SIGN U +1A69..1A6A ; Bottom # Mn [2] TAI THAM VOWEL SIGN U..TAI THAM VOWEL SIGN UU +1A6C ; Bottom # Mn TAI THAM VOWEL SIGN OA BELOW +1B38..1B3A ; Bottom # Mn [3] BALINESE VOWEL SIGN SUKU..BALINESE VOWEL SIGN RA REPA +1BA5 ; Bottom # Mn SUNDANESE VOWEL SIGN PANYUKU +1C2C ; Bottom # Mn LEPCHA VOWEL SIGN E +A825 ; Bottom # Mn SYLOTI NAGRI VOWEL SIGN U +A8C4 ; Bottom # Mn SAURASHTRA SIGN VIRAMA +A947..A949 ; Bottom # Mn [3] REJANG VOWEL SIGN I..REJANG VOWEL SIGN E +A94B..A94E ; Bottom # Mn [4] REJANG VOWEL SIGN O..REJANG VOWEL SIGN EA +A9B8..A9B9 ; Bottom # Mn [2] JAVANESE VOWEL SIGN SUKU..JAVANESE VOWEL SIGN SUKU MENDUT +AA2D ; Bottom # Mn 
CHAM VOWEL SIGN U +AA32 ; Bottom # Mn CHAM VOWEL SIGN UE +AAB4 ; Bottom # Mn TAI VIET VOWEL U +AAEC ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UU +ABE8 ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK +10A02..10A03 ; Bottom # Mn [2] KHAROSHTHI VOWEL SIGN U..KHAROSHTHI VOWEL SIGN VOCALIC R +10A0C ; Bottom # Mn KHAROSHTHI VOWEL LENGTH MARK +1103C..11041 ; Bottom # Mn [6] BRAHMI VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL +110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU +110B9 ; Bottom # Mn KAITHI SIGN VIRAMA +1112A..1112B ; Bottom # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU +11131..11132 ; Bottom # Mn [2] CHAKMA O MARK..CHAKMA AU MARK +111B6..111BB ; Bottom # Mn [6] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN VOCALIC LL +1122F ; Bottom # Mn KHOJKI VOWEL SIGN U +112E3..112E4 ; Bottom # Mn [2] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN UU +112EA ; Bottom # Mn KHUDAWADI SIGN VIRAMA +114B3..114B8 ; Bottom # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114C2 ; Bottom # Mn TIRHUTA SIGN VIRAMA +115B2..115B5 ; Bottom # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115BF ; Bottom # Mn SIDDHAM SIGN VIRAMA +11633..11638 ; Bottom # Mn [6] MODI VOWEL SIGN U..MODI VOWEL SIGN VOCALIC LL +1163F ; Bottom # Mn MODI SIGN VIRAMA +116B0..116B1 ; Bottom # Mn [2] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN UU + +# Indic_Matra_Category=Top_And_Bottom + +0C48 ; Top_And_Bottom # Mn TELUGU VOWEL SIGN AI +0F73 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN II +0F76..0F79 ; Top_And_Bottom # Mn [4] TIBETAN VOWEL SIGN VOCALIC R..TIBETAN VOWEL SIGN VOCALIC LL +0F81 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN REVERSED II +1B3C ; Top_And_Bottom # Mn BALINESE VOWEL SIGN LA LENGA +1112E..1112F ; Top_And_Bottom # Mn [2] CHAKMA VOWEL SIGN O..CHAKMA VOWEL SIGN AU + +# Indic_Matra_Category=Top_And_Right + +0AC9 ; Top_And_Right # Mc GUJARATI VOWEL SIGN CANDRA O +0B57 ; Top_And_Right # Mc ORIYA AU LENGTH MARK +0CC0 ; Top_And_Right # 
Mc KANNADA VOWEL SIGN II +0CC7..0CC8 ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +1925..1926 ; Top_And_Right # Mc [2] LIMBU VOWEL SIGN OO..LIMBU VOWEL SIGN AU +1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG +111BF ; Top_And_Right # Mc SHARADA VOWEL SIGN AU +11232..11233 ; Top_And_Right # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU + +# Indic_Matra_Category=Top_And_Left + +0B48 ; Top_And_Left # Mc ORIYA VOWEL SIGN AI +0DDA ; Top_And_Left # Mc SINHALA VOWEL SIGN DIGA KOMBUVA +17BE ; Top_And_Left # Mc KHMER VOWEL SIGN OE +1C29 ; Top_And_Left # Mc LEPCHA VOWEL SIGN OO +114BB ; Top_And_Left # Mc TIRHUTA VOWEL SIGN AI +115B9 ; Top_And_Left # Mc SIDDHAM VOWEL SIGN AI + +# Indic_Matra_Category=Top_And_Left_And_Right + +0B4C ; Top_And_Left_And_Right # Mc ORIYA VOWEL SIGN AU +0DDD ; Top_And_Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA +17BF ; Top_And_Left_And_Right # Mc KHMER VOWEL SIGN YA +115BB ; Top_And_Left_And_Right # Mc SIDDHAM VOWEL SIGN AU + +# Indic_Matra_Category=Bottom_And_Right + +1B3B ; Bottom_And_Right # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +A9C0 ; Bottom_And_Right # Mc JAVANESE PANGKON + +# Indic_Matra_Category=Top_And_Bottom_And_Right + +1B3D ; Top_And_Bottom_And_Right # Mc BALINESE VOWEL SIGN LA LENGA TEDUNG + +# Indic_Matra_Category=Overstruck + +10A01 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN I +10A06 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN O + +# EOF diff --git a/data/7.0.0-indic-syllabic-category.txt b/data/7.0.0-indic-syllabic-category.txt new file mode 100644 index 0000000..7634798 --- /dev/null +++ b/data/7.0.0-indic-syllabic-category.txt @@ -0,0 +1,1042 @@ +# IndicSyllabicCategory-7.0.0.txt +# Date: 2014-06-03, 07:00:00 GMT [KW, LI, AG, RP] +# +# Unicode Character Database +# Copyright (c) 1991-2014 Unicode, Inc. 
+# For terms of use, see http://www.unicode.org/terms_of_use.html +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following provisional property: +# +# Indic_Syllabic_Category enumerated property +# +# NB: Provisional properties and data files have no associated stability +# guarantees. They are provided in part to determine the possible usefulness +# of a property or other data and to encourage analysis and further investigation +# which may result in their improvement. Provisional properties and data files +# may change arbitrarily, or may even be removed in a future version of the +# Unicode Character Database, if they prove not to be useful. +# +# Scope: This provisional property is aimed at two general problem +# areas involving the analysis and processing of Indic scripts: +# +# 1. Specification of syllabic structure. +# 2. Specification of segmentation rules. +# +# Both of these problem areas may benefit from having defined subtypes +# of Indic script characters which are relevant to how Indic +# syllables (or aksaras) are constructed. Note that rules for +# syllabic structure in Indic scripts may differ significantly +# from how phonological syllables are defined. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Syllabic_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. 
+# +# The scripts assessed as Indic in the structural sense used for the +# Indic_Syllabic_Category are the following: +# +# Balinese, Batak, Bengali, Brahmi, Buginese, Buhid, Chakma, Cham, +# Devanagari, Grantha, Gujarati, Gurmukhi, Hanunoo, Javanese, Kaithi, +# Kannada, Kayah Li, Kharoshthi, Khmer, Khojki, Khudawadi, Lao, Lepcha, +# Limbu, Mahajani, Malayalam, Meetei Mayek, Modi, Myanmar, New Tai Lue, +# Oriya, Phags-pa, Rejang, Saurashtra, Sharada, Siddham, Sinhala, +# Sundanese, Syloti Nagri, Tagalog, Tagbanwa, Tai Le, Tai Tham, Tai Viet, +# Takri, Tamil, Telugu, Thai, Tibetan, and Tirhuta. +# +# All characters for all other scripts not in that list +# take the default value for this property, unless they +# are individually listed in this data file. +# + +# ================================================ + +# Property: Indic_Syllabic_Category +# +# All code points not explicitly listed for Indic_Syllabic_Category +# have the value Other. +# +# @missing: 0000..10FFFF; Other + +# ================================================ + +# Indic_Syllabic_Category=Bindu + +# Bindu/Anusvara (nasalization or -n) +# Excludes various Vedic nasalization signs. 
+ +# [Not derivable] + +0900..0902 ; Bindu # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +0981 ; Bindu # Mn BENGALI SIGN CANDRABINDU +0982 ; Bindu # Mc BENGALI SIGN ANUSVARA +0A01..0A02 ; Bindu # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A70 ; Bindu # Mn GURMUKHI TIPPI +0A81..0A82 ; Bindu # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0B01 ; Bindu # Mn ORIYA SIGN CANDRABINDU +0B02 ; Bindu # Mc ORIYA SIGN ANUSVARA +0B82 ; Bindu # Mn TAMIL SIGN ANUSVARA +0C00 ; Bindu # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C01..0C02 ; Bindu # Mc [2] TELUGU SIGN CANDRABINDU..TELUGU SIGN ANUSVARA +0C81 ; Bindu # Mn KANNADA SIGN CANDRABINDU +0C82 ; Bindu # Mc KANNADA SIGN ANUSVARA +0D01 ; Bindu # Mn MALAYALAM SIGN CANDRABINDU +0D02 ; Bindu # Mc MALAYALAM SIGN ANUSVARA +0D82 ; Bindu # Mc SINHALA SIGN ANUSVARAYA +0E4D ; Bindu # Mn THAI CHARACTER NIKHAHIT +0ECD ; Bindu # Mn LAO NIGGAHITA +0F7E ; Bindu # Mn TIBETAN SIGN RJES SU NGA RO +0F82..0F83 ; Bindu # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +1036 ; Bindu # Mn MYANMAR SIGN ANUSVARA +17C6 ; Bindu # Mn KHMER SIGN NIKAHIT +1932 ; Bindu # Mn LIMBU SMALL LETTER ANUSVARA +1B00..1B02 ; Bindu # Mn [3] BALINESE SIGN ULU RICEM..BALINESE SIGN CECEK +1B80 ; Bindu # Mn SUNDANESE SIGN PANYECEK +1C34..1C35 ; Bindu # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A80B ; Bindu # Mn SYLOTI NAGRI SIGN ANUSVARA +A873 ; Bindu # Lo PHAGS-PA LETTER CANDRABINDU +A880 ; Bindu # Mc SAURASHTRA SIGN ANUSVARA +A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK +10A0E ; Bindu # Mn KHAROSHTHI SIGN ANUSVARA +11000 ; Bindu # Mc BRAHMI SIGN CANDRABINDU +11001 ; Bindu # Mn BRAHMI SIGN ANUSVARA +11080..11081 ; Bindu # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +11100..11101 ; Bindu # Mn [2] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN ANUSVARA +11180..11181 ; Bindu # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +11234 ; Bindu # Mn KHOJKI SIGN 
ANUSVARA +112DF ; Bindu # Mn KHUDAWADI SIGN ANUSVARA +11301 ; Bindu # Mn GRANTHA SIGN CANDRABINDU +11302 ; Bindu # Mc GRANTHA SIGN ANUSVARA +114BF..114C0 ; Bindu # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Bindu # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +1163D ; Bindu # Mn MODI SIGN ANUSVARA +116AB ; Bindu # Mn TAKRI SIGN ANUSVARA + +# ================================================ + +# Indic_Syllabic_Category=Visarga + +# Visarga (-h) +# Includes specialized case for Sanskrit: ardhavisarga +# Excludes letters for jihvamuliya and upadhmaniya, which are +# related, but structured somewhat differently. + +# [Not derivable] + +0903 ; Visarga # Mc DEVANAGARI SIGN VISARGA +0983 ; Visarga # Mc BENGALI SIGN VISARGA +0A03 ; Visarga # Mc GURMUKHI SIGN VISARGA +0A83 ; Visarga # Mc GUJARATI SIGN VISARGA +0B03 ; Visarga # Mc ORIYA SIGN VISARGA +0C03 ; Visarga # Mc TELUGU SIGN VISARGA +0C83 ; Visarga # Mc KANNADA SIGN VISARGA +0D03 ; Visarga # Mc MALAYALAM SIGN VISARGA +0D83 ; Visarga # Mc SINHALA SIGN VISARGAYA +0F7F ; Visarga # Mc TIBETAN SIGN RNAM BCAD +1038 ; Visarga # Mc MYANMAR SIGN VISARGA +17C7 ; Visarga # Mc KHMER SIGN REAHMUK +1B04 ; Visarga # Mc BALINESE SIGN BISAH +1B82 ; Visarga # Mc SUNDANESE SIGN PANGWISAD +1CF2..1CF3 ; Visarga # Mc [2] VEDIC SIGN ARDHAVISARGA..VEDIC SIGN ROTATED ARDHAVISARGA +A881 ; Visarga # Mc SAURASHTRA SIGN VISARGA +A983 ; Visarga # Mc JAVANESE SIGN WIGNYAN +AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA +10A0F ; Visarga # Mn KHAROSHTHI SIGN VISARGA +11002 ; Visarga # Mc BRAHMI SIGN VISARGA +11082 ; Visarga # Mc KAITHI SIGN VISARGA +11102 ; Visarga # Mn CHAKMA SIGN VISARGA +11182 ; Visarga # Mc SHARADA SIGN VISARGA +11303 ; Visarga # Mc GRANTHA SIGN VISARGA +114C1 ; Visarga # Mc TIRHUTA SIGN VISARGA +115BE ; Visarga # Mc SIDDHAM SIGN VISARGA +1163E ; Visarga # Mc MODI SIGN VISARGA +116AC ; Visarga # Mc TAKRI SIGN VISARGA + +# ================================================ + +# 
Indic_Syllabic_Category=Avagraha + +# Avagraha (elision of initial a- in sandhi) + +# [Not derivable] + +093D ; Avagraha # Lo DEVANAGARI SIGN AVAGRAHA +09BD ; Avagraha # Lo BENGALI SIGN AVAGRAHA +0ABD ; Avagraha # Lo GUJARATI SIGN AVAGRAHA +0B3D ; Avagraha # Lo ORIYA SIGN AVAGRAHA +0C3D ; Avagraha # Lo TELUGU SIGN AVAGRAHA +0CBD ; Avagraha # Lo KANNADA SIGN AVAGRAHA +0D3D ; Avagraha # Lo MALAYALAM SIGN AVAGRAHA +0F85 ; Avagraha # Po TIBETAN MARK PALUTA +17DC ; Avagraha # Lo KHMER SIGN AVAKRAHASANYA +1BBA ; Avagraha # Lo SUNDANESE AVAGRAHA +111C1 ; Avagraha # Lo SHARADA SIGN AVAGRAHA +1133D ; Avagraha # Lo GRANTHA SIGN AVAGRAHA +114C4 ; Avagraha # Lo TIRHUTA SIGN AVAGRAHA + +# ================================================ + +# Indic_Syllabic_Category=Nukta + +# Nukta (diacritic for borrowed consonants) + +# [Derivation: (ccc=7) - 1037] + +093C ; Nukta # Mn DEVANAGARI SIGN NUKTA +09BC ; Nukta # Mn BENGALI SIGN NUKTA +0A3C ; Nukta # Mn GURMUKHI SIGN NUKTA +0ABC ; Nukta # Mn GUJARATI SIGN NUKTA +0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0CBC ; Nukta # Mn KANNADA SIGN NUKTA +1B34 ; Nukta # Mn BALINESE SIGN REREKAN +1BE6 ; Nukta # Mn BATAK SIGN TOMPI +1C37 ; Nukta # Mn LEPCHA SIGN NUKTA +A9B3 ; Nukta # Mn JAVANESE SIGN CECAK TELU +110BA ; Nukta # Mn KAITHI SIGN NUKTA +11173 ; Nukta # Mn MAHAJANI SIGN NUKTA +11236 ; Nukta # Mn KHOJKI SIGN NUKTA +112E9 ; Nukta # Mn KHUDAWADI SIGN NUKTA +1133C ; Nukta # Mn GRANTHA SIGN NUKTA +114C3 ; Nukta # Mn TIRHUTA SIGN NUKTA +115C0 ; Nukta # Mn SIDDHAM SIGN NUKTA +116B7 ; Nukta # Mn TAKRI SIGN NUKTA + +# ================================================ + +# Indic_Syllabic_Category=Virama + +# Virama (killing of inherent vowel in consonant sequence +# or consonant stacker) +# Only includes characters that can act both as visible killer viramas +# and consonant stackers. Separate property values exist for characters +# that can only act as pure killers or only as consonant stackers. 
+ +# [Derivation: (ccc=9) - (InSC=Pure_Killer) - (InSC=Invisible_Stacker) - 2D7F - 1107F] + +094D ; Virama # Mn DEVANAGARI SIGN VIRAMA +09CD ; Virama # Mn BENGALI SIGN VIRAMA +0A4D ; Virama # Mn GURMUKHI SIGN VIRAMA +0ACD ; Virama # Mn GUJARATI SIGN VIRAMA +0B4D ; Virama # Mn ORIYA SIGN VIRAMA +0BCD ; Virama # Mn TAMIL SIGN VIRAMA +0C4D ; Virama # Mn TELUGU SIGN VIRAMA +0CCD ; Virama # Mn KANNADA SIGN VIRAMA +0D4D ; Virama # Mn MALAYALAM SIGN VIRAMA +0DCA ; Virama # Mn SINHALA SIGN AL-LAKUNA +1B44 ; Virama # Mc BALINESE ADEG ADEG +A8C4 ; Virama # Mn SAURASHTRA SIGN VIRAMA +A9C0 ; Virama # Mc JAVANESE PANGKON +11046 ; Virama # Mn BRAHMI VIRAMA +110B9 ; Virama # Mn KAITHI SIGN VIRAMA +111C0 ; Virama # Mc SHARADA SIGN VIRAMA +11235 ; Virama # Mc KHOJKI SIGN VIRAMA +1134D ; Virama # Mc GRANTHA SIGN VIRAMA +114C2 ; Virama # Mn TIRHUTA SIGN VIRAMA +115BF ; Virama # Mn SIDDHAM SIGN VIRAMA +1163F ; Virama # Mn MODI SIGN VIRAMA +116B6 ; Virama # Mc TAKRI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Pure_Killer + +# Pure killer (killing of inherent vowel in consonant sequence, +# with no consonant stacking behavior) + +# [Not derivable] + +0E3A ; Pure_Killer # Mn THAI CHARACTER PHINTHU +0E4E ; Pure_Killer # Mn THAI CHARACTER YAMAKKAN +0F84 ; Pure_Killer # Mn TIBETAN MARK HALANTA +103A ; Pure_Killer # Mn MYANMAR SIGN ASAT +1714 ; Pure_Killer # Mn TAGALOG SIGN VIRAMA +1734 ; Pure_Killer # Mn HANUNOO SIGN PAMUDPOD +17D1 ; Pure_Killer # Mn KHMER SIGN VIRIAM +1BAA ; Pure_Killer # Mc SUNDANESE SIGN PAMAAEH +1BF2..1BF3 ; Pure_Killer # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +A806 ; Pure_Killer # Mn SYLOTI NAGRI SIGN HASANTA +A953 ; Pure_Killer # Mc REJANG VIRAMA +ABED ; Pure_Killer # Mn MEETEI MAYEK APUN IYEK +11134 ; Pure_Killer # Mn CHAKMA MAAYYAA +112EA ; Pure_Killer # Mn KHUDAWADI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Invisible_Stacker + +# Invisible stacker (invisible 
consonant stacker virama) + +# [Not derivable] + +1039 ; Invisible_Stacker # Mn MYANMAR SIGN VIRAMA +17D2 ; Invisible_Stacker # Mn KHMER SIGN COENG +1A60 ; Invisible_Stacker # Mn TAI THAM SIGN SAKOT +1BAB ; Invisible_Stacker # Mn SUNDANESE SIGN VIRAMA +AAF6 ; Invisible_Stacker # Mn MEETEI MAYEK VIRAMA +10A3F ; Invisible_Stacker # Mn KHAROSHTHI VIRAMA +11133 ; Invisible_Stacker # Mn CHAKMA VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Independent + +# Independent Vowels (contrasted with matras) + +# [Not derivable] + +0904..0914 ; Vowel_Independent # Lo [17] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER AU +0960..0961 ; Vowel_Independent # Lo [2] DEVANAGARI LETTER VOCALIC RR..DEVANAGARI LETTER VOCALIC LL +0972..0977 ; Vowel_Independent # Lo [6] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER UUE +0985..098C ; Vowel_Independent # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L +098F..0990 ; Vowel_Independent # Lo [2] BENGALI LETTER E..BENGALI LETTER AI +0993..0994 ; Vowel_Independent # Lo [2] BENGALI LETTER O..BENGALI LETTER AU +09E0..09E1 ; Vowel_Independent # Lo [2] BENGALI LETTER VOCALIC RR..BENGALI LETTER VOCALIC LL +0A05..0A0A ; Vowel_Independent # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU +0A0F..0A10 ; Vowel_Independent # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI +0A13..0A14 ; Vowel_Independent # Lo [2] GURMUKHI LETTER OO..GURMUKHI LETTER AU +0A85..0A8D ; Vowel_Independent # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E +0A8F..0A91 ; Vowel_Independent # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O +0A93..0A94 ; Vowel_Independent # Lo [2] GUJARATI LETTER O..GUJARATI LETTER AU +0AE0..0AE1 ; Vowel_Independent # Lo [2] GUJARATI LETTER VOCALIC RR..GUJARATI LETTER VOCALIC LL +0B05..0B0C ; Vowel_Independent # Lo [8] ORIYA LETTER A..ORIYA LETTER VOCALIC L +0B0F..0B10 ; Vowel_Independent # Lo [2] ORIYA LETTER E..ORIYA LETTER AI +0B13..0B14 ; Vowel_Independent # Lo [2] ORIYA LETTER O..ORIYA LETTER AU 
+0B60..0B61 ; Vowel_Independent # Lo [2] ORIYA LETTER VOCALIC RR..ORIYA LETTER VOCALIC LL +0B85..0B8A ; Vowel_Independent # Lo [6] TAMIL LETTER A..TAMIL LETTER UU +0B8E..0B90 ; Vowel_Independent # Lo [3] TAMIL LETTER E..TAMIL LETTER AI +0B92..0B94 ; Vowel_Independent # Lo [3] TAMIL LETTER O..TAMIL LETTER AU +0C05..0C0C ; Vowel_Independent # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L +0C0E..0C10 ; Vowel_Independent # Lo [3] TELUGU LETTER E..TELUGU LETTER AI +0C12..0C14 ; Vowel_Independent # Lo [3] TELUGU LETTER O..TELUGU LETTER AU +0C60..0C61 ; Vowel_Independent # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL +0C85..0C8C ; Vowel_Independent # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L +0C8E..0C90 ; Vowel_Independent # Lo [3] KANNADA LETTER E..KANNADA LETTER AI +0C92..0C94 ; Vowel_Independent # Lo [3] KANNADA LETTER O..KANNADA LETTER AU +0CE0..0CE1 ; Vowel_Independent # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL +0D05..0D0C ; Vowel_Independent # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L +0D0E..0D10 ; Vowel_Independent # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI +0D12..0D14 ; Vowel_Independent # Lo [3] MALAYALAM LETTER O..MALAYALAM LETTER AU +0D60..0D61 ; Vowel_Independent # Lo [2] MALAYALAM LETTER VOCALIC RR..MALAYALAM LETTER VOCALIC LL +0D85..0D96 ; Vowel_Independent # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA +1021..102A ; Vowel_Independent # Lo [10] MYANMAR LETTER A..MYANMAR LETTER AU +1052..1055 ; Vowel_Independent # Lo [4] MYANMAR LETTER VOCALIC R..MYANMAR LETTER VOCALIC LL +1700..1702 ; Vowel_Independent # Lo [3] TAGALOG LETTER A..TAGALOG LETTER U +1720..1722 ; Vowel_Independent # Lo [3] HANUNOO LETTER A..HANUNOO LETTER U +1740..1742 ; Vowel_Independent # Lo [3] BUHID LETTER A..BUHID LETTER U +1760..1762 ; Vowel_Independent # Lo [3] TAGBANWA LETTER A..TAGBANWA LETTER U +17A3..17B3 ; Vowel_Independent # Lo [17] KHMER INDEPENDENT VOWEL QAQ..KHMER INDEPENDENT VOWEL QAU +1A4D..1A52 ; 
Vowel_Independent # Lo [6] TAI THAM LETTER I..TAI THAM LETTER OO +1B05..1B12 ; Vowel_Independent # Lo [14] BALINESE LETTER AKARA..BALINESE LETTER OKARA TEDUNG +1B83..1B89 ; Vowel_Independent # Lo [7] SUNDANESE LETTER A..SUNDANESE LETTER EU +1BE4..1BE5 ; Vowel_Independent # Lo [2] BATAK LETTER I..BATAK LETTER U +A800..A801 ; Vowel_Independent # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I +A803..A805 ; Vowel_Independent # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O +A882..A891 ; Vowel_Independent # Lo [16] SAURASHTRA LETTER A..SAURASHTRA LETTER AU +A984..A988 ; Vowel_Independent # Lo [5] JAVANESE LETTER A..JAVANESE LETTER U +A98C..A98E ; Vowel_Independent # Lo [3] JAVANESE LETTER E..JAVANESE LETTER O +AA00..AA05 ; Vowel_Independent # Lo [6] CHAM LETTER A..CHAM LETTER O +AAE0..AAE1 ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER E..MEETEI MAYEK LETTER O +ABCE..ABCF ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER UN..MEETEI MAYEK LETTER I +ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA +11005..11012 ; Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU +11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER A..KAITHI LETTER AU +11103..11106 ; Vowel_Independent # Lo [4] CHAKMA LETTER AA..CHAKMA LETTER E +11183..11190 ; Vowel_Independent # Lo [14] SHARADA LETTER A..SHARADA LETTER AU +11200..11207 ; Vowel_Independent # Lo [8] KHOJKI LETTER A..KHOJKI LETTER AU +112B0..112B9 ; Vowel_Independent # Lo [10] KHUDAWADI LETTER A..KHUDAWADI LETTER AU +11305..1130C ; Vowel_Independent # Lo [8] GRANTHA LETTER A..GRANTHA LETTER VOCALIC L +1130F..11310 ; Vowel_Independent # Lo [2] GRANTHA LETTER EE..GRANTHA LETTER AI +11313..11314 ; Vowel_Independent # Lo [2] GRANTHA LETTER OO..GRANTHA LETTER AU +11360..11361 ; Vowel_Independent # Lo [2] GRANTHA LETTER VOCALIC RR..GRANTHA LETTER VOCALIC LL +11481..1148E ; Vowel_Independent # Lo [14] TIRHUTA LETTER A..TIRHUTA LETTER AU +11580..1158D ; Vowel_Independent # Lo [14] SIDDHAM LETTER A..SIDDHAM LETTER AU 
+11600..1160D ; Vowel_Independent # Lo [14] MODI LETTER A..MODI LETTER AU +11680..11689 ; Vowel_Independent # Lo [10] TAKRI LETTER A..TAKRI LETTER AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Dependent + +# Dependent Vowels (contrasted with independent vowels and/or with complex placement) +# Matras (in Indic scripts) + +# [Not derivable] + +093A ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN OE +093B ; Vowel_Dependent # Mc DEVANAGARI VOWEL SIGN OOE +093E..0940 ; Vowel_Dependent # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II +0941..0948 ; Vowel_Dependent # Mn [8] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN AI +0949..094C ; Vowel_Dependent # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094E..094F ; Vowel_Dependent # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA E..DEVANAGARI VOWEL SIGN AW +0955..0957 ; Vowel_Dependent # Mn [3] DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Vowel_Dependent # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BE..09C0 ; Vowel_Dependent # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II +09C1..09C4 ; Vowel_Dependent # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09C7..09C8 ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +09CB..09CC ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +09D7 ; Vowel_Dependent # Mc BENGALI AU LENGTH MARK +09E2..09E3 ; Vowel_Dependent # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3E..0A40 ; Vowel_Dependent # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II +0A41..0A42 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A47..0A48 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0ABE..0AC0 ; Vowel_Dependent # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL 
SIGN II +0AC1..0AC5 ; Vowel_Dependent # Mn [5] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AC9 ; Vowel_Dependent # Mc GUJARATI VOWEL SIGN CANDRA O +0ACB..0ACC ; Vowel_Dependent # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0AE2..0AE3 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3E ; Vowel_Dependent # Mc ORIYA VOWEL SIGN AA +0B3F ; Vowel_Dependent # Mn ORIYA VOWEL SIGN I +0B40 ; Vowel_Dependent # Mc ORIYA VOWEL SIGN II +0B41..0B44 ; Vowel_Dependent # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B47..0B48 ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI +0B4B..0B4C ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU +0B56 ; Vowel_Dependent # Mn ORIYA AI LENGTH MARK +0B57 ; Vowel_Dependent # Mc ORIYA AU LENGTH MARK +0B62..0B63 ; Vowel_Dependent # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BBE..0BBF ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC0 ; Vowel_Dependent # Mn TAMIL VOWEL SIGN II +0BC1..0BC2 ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BC6..0BC8 ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0BCA..0BCC ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0BD7 ; Vowel_Dependent # Mc TAMIL AU LENGTH MARK +0C3E..0C40 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C41..0C44 ; Vowel_Dependent # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C46..0C48 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI +0C4A..0C4C ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C55..0C56 ; Vowel_Dependent # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK +0C62..0C63 ; Vowel_Dependent # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBE ; Vowel_Dependent # Mc KANNADA VOWEL SIGN AA +0CBF ; 
Vowel_Dependent # Mn KANNADA VOWEL SIGN I +0CC0..0CC4 ; Vowel_Dependent # Mc [5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN VOCALIC RR +0CC6 ; Vowel_Dependent # Mn KANNADA VOWEL SIGN E +0CC7..0CC8 ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +0CCC ; Vowel_Dependent # Mn KANNADA VOWEL SIGN AU +0CD5..0CD6 ; Vowel_Dependent # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CE2..0CE3 ; Vowel_Dependent # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D3E..0D40 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D44 ; Vowel_Dependent # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D46..0D48 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0D4A..0D4C ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0D57 ; Vowel_Dependent # Mc MALAYALAM AU LENGTH MARK +0D62..0D63 ; Vowel_Dependent # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DCF..0DD1 ; Vowel_Dependent # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD2..0DD4 ; Vowel_Dependent # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Vowel_Dependent # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0DD8..0DDF ; Vowel_Dependent # Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Vowel_Dependent # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Vowel_Dependent # Lo THAI CHARACTER SARA A +0E31 ; Vowel_Dependent # Mn THAI CHARACTER MAI HAN-AKAT +0E32..0E33 ; Vowel_Dependent # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E34..0E39 ; Vowel_Dependent # Mn [6] THAI CHARACTER SARA I..THAI CHARACTER SARA UU +0E40..0E45 ; Vowel_Dependent # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO +0E47 ; Vowel_Dependent # Mn THAI 
CHARACTER MAITAIKHU +0EB0 ; Vowel_Dependent # Lo LAO VOWEL SIGN A +0EB1 ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KAN +0EB2..0EB3 ; Vowel_Dependent # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0EB4..0EB9 ; Vowel_Dependent # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU +0EBB ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KON +0EC0..0EC4 ; Vowel_Dependent # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +0F71..0F7D ; Vowel_Dependent # Mn [13] TIBETAN VOWEL SIGN AA..TIBETAN VOWEL SIGN OO +0F80..0F81 ; Vowel_Dependent # Mn [2] TIBETAN VOWEL SIGN REVERSED I..TIBETAN VOWEL SIGN REVERSED II +102B..102C ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +102D..1030 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN UU +1031 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN E +1032..1035 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +1056..1057 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1058..1059 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1062 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1071..1074 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1083..1084 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E +1085..1086 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109C ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN AITON A +109D ; Vowel_Dependent # Mn MYANMAR VOWEL SIGN AITON AI +1712..1713 ; Vowel_Dependent # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U +1732..1733 ; Vowel_Dependent # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1752..1753 ; Vowel_Dependent # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U +1772..1773 ; Vowel_Dependent # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA 
VOWEL SIGN U +17B6 ; Vowel_Dependent # Mc KHMER VOWEL SIGN AA +17B7..17BD ; Vowel_Dependent # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL SIGN UA +17BE..17C5 ; Vowel_Dependent # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU +17C8 ; Vowel_Dependent # Mc KHMER SIGN YUUKALEAPINTU +1920..1922 ; Vowel_Dependent # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U +1923..1926 ; Vowel_Dependent # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU +1927..1928 ; Vowel_Dependent # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +19B0..19C0 ; Vowel_Dependent # Mc [17] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN IY +1A17..1A18 ; Vowel_Dependent # Mn [2] BUGINESE VOWEL SIGN I..BUGINESE VOWEL SIGN U +1A19..1A1A ; Vowel_Dependent # Mc [2] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN O +1A1B ; Vowel_Dependent # Mn BUGINESE VOWEL SIGN AE +1A61 ; Vowel_Dependent # Mc TAI THAM VOWEL SIGN A +1A62 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN MAI SAT +1A63..1A64 ; Vowel_Dependent # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A65..1A6C ; Vowel_Dependent # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW +1A6D..1A72 ; Vowel_Dependent # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI +1A73..1A74 ; Vowel_Dependent # Mn [2] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN MAI KANG +1B35 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN TEDUNG +1B36..1B3A ; Vowel_Dependent # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA +1B3B ; Vowel_Dependent # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +1B3C ; Vowel_Dependent # Mn BALINESE VOWEL SIGN LA LENGA +1B3D..1B41 ; Vowel_Dependent # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1B42 ; Vowel_Dependent # Mn BALINESE VOWEL SIGN PEPET +1B43 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN PEPET TEDUNG +1BA4..1BA5 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PANGHULU..SUNDANESE VOWEL SIGN PANYUKU +1BA6..1BA7 ; Vowel_Dependent # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL 
SIGN PANOLONG +1BA8..1BA9 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE7 ; Vowel_Dependent # Mc BATAK VOWEL SIGN E +1BE8..1BE9 ; Vowel_Dependent # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BEA..1BEC ; Vowel_Dependent # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BED ; Vowel_Dependent # Mn BATAK VOWEL SIGN KARO O +1BEE ; Vowel_Dependent # Mc BATAK VOWEL SIGN U +1BEF ; Vowel_Dependent # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +1C26..1C2B ; Vowel_Dependent # Mc [6] LEPCHA VOWEL SIGN AA..LEPCHA VOWEL SIGN UU +1C2C ; Vowel_Dependent # Mn LEPCHA VOWEL SIGN E +A823..A824 ; Vowel_Dependent # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A825..A826 ; Vowel_Dependent # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E +A827 ; Vowel_Dependent # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Vowel_Dependent # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A947..A94E ; Vowel_Dependent # Mn [8] REJANG VOWEL SIGN I..REJANG VOWEL SIGN EA +A9B4..A9B5 ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9B6..A9B9 ; Vowel_Dependent # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BA..A9BB ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +A9BC ; Vowel_Dependent # Mn JAVANESE VOWEL SIGN PEPET +AA29..AA2E ; Vowel_Dependent # Mn [6] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN OE +AA2F..AA30 ; Vowel_Dependent # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA31..AA32 ; Vowel_Dependent # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE +AAB0 ; Vowel_Dependent # Mn TAI VIET MAI KANG +AAB1 ; Vowel_Dependent # Lo TAI VIET VOWEL AA +AAB2..AAB4 ; Vowel_Dependent # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U +AAB5..AAB6 ; Vowel_Dependent # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB7..AAB8 ; Vowel_Dependent # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AAB9..AABD ; Vowel_Dependent # Lo [5] TAI VIET VOWEL UEA..TAI VIET 
VOWEL AN +AABE ; Vowel_Dependent # Mn TAI VIET VOWEL AM +AAEB ; Vowel_Dependent # Mc MEETEI MAYEK VOWEL SIGN II +AAEC..AAED ; Vowel_Dependent # Mn [2] MEETEI MAYEK VOWEL SIGN UU..MEETEI MAYEK VOWEL SIGN AAI +AAEE..AAEF ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN AU..MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE5 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN ANAP +ABE6..ABE7 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE8 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +10A01..10A03 ; Vowel_Dependent # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R +10A05..10A06 ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O +10A0C ; Vowel_Dependent # Mn KHAROSHTHI VOWEL LENGTH MARK +11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +110B0..110B2 ; Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II +110B3..110B6 ; Vowel_Dependent # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI +110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11127..1112B ; Vowel_Dependent # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU +1112C ; Vowel_Dependent # Mc CHAKMA VOWEL SIGN E +1112D..11132 ; Vowel_Dependent # Mn [6] CHAKMA VOWEL SIGN AI..CHAKMA AU MARK +111B3..111B5 ; Vowel_Dependent # Mc [3] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN II +111B6..111BE ; Vowel_Dependent # Mn [9] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN O +111BF ; Vowel_Dependent # Mc SHARADA VOWEL SIGN AU +1122C..1122E ; Vowel_Dependent # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +1122F..11231 ; Vowel_Dependent # Mn [3] KHOJKI VOWEL SIGN U..KHOJKI VOWEL SIGN AI +11232..11233 ; Vowel_Dependent # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU +112E0..112E2 ; 
Vowel_Dependent # Mc [3] KHUDAWADI VOWEL SIGN AA..KHUDAWADI VOWEL SIGN II +112E3..112E8 ; Vowel_Dependent # Mn [6] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN AU +1133E..1133F ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11340 ; Vowel_Dependent # Mn GRANTHA VOWEL SIGN II +11341..11344 ; Vowel_Dependent # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +11347..11348 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +1134B..1134C ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +11357 ; Vowel_Dependent # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +114B0..114B2 ; Vowel_Dependent # Mc [3] TIRHUTA VOWEL SIGN AA..TIRHUTA VOWEL SIGN II +114B3..114B8 ; Vowel_Dependent # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114B9 ; Vowel_Dependent # Mc TIRHUTA VOWEL SIGN E +114BA ; Vowel_Dependent # Mn TIRHUTA VOWEL SIGN SHORT E +114BB..114BE ; Vowel_Dependent # Mc [4] TIRHUTA VOWEL SIGN AI..TIRHUTA VOWEL SIGN AU +115AF..115B1 ; Vowel_Dependent # Mc [3] SIDDHAM VOWEL SIGN AA..SIDDHAM VOWEL SIGN II +115B2..115B5 ; Vowel_Dependent # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115B8..115BB ; Vowel_Dependent # Mc [4] SIDDHAM VOWEL SIGN E..SIDDHAM VOWEL SIGN AU +11630..11632 ; Vowel_Dependent # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +11633..1163A ; Vowel_Dependent # Mn [8] MODI VOWEL SIGN U..MODI VOWEL SIGN AI +1163B..1163C ; Vowel_Dependent # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +116AD ; Vowel_Dependent # Mn TAKRI VOWEL SIGN AA +116AE..116AF ; Vowel_Dependent # Mc [2] TAKRI VOWEL SIGN I..TAKRI VOWEL SIGN II +116B0..116B5 ; Vowel_Dependent # Mn [6] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel + +# (Other) Vowels (reanalyzed as ordinary alphabetic letters or marks) + +# [Not derivable] + 
+1963..196D ; Vowel # Lo [11] TAI LE LETTER A..TAI LE LETTER AI +A85E..A861 ; Vowel # Lo [4] PHAGS-PA LETTER I..PHAGS-PA LETTER O +A866 ; Vowel # Lo PHAGS-PA LETTER EE +A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO +A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O +11150..11154 ; Vowel # Lo [5] MAHAJANI LETTER A..MAHAJANI LETTER O + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Placeholder + +# Consonant Placeholder +# This includes generic placeholders used for +# Indic script layout (NBSP and dotted circle), as well as a few script- +# specific vowel-holder characters which are not technically +# consonants, but serve instead as bases for placement of vowel marks. + +# [Not derivable] + +002D ; Consonant_Placeholder # Pd HYPHEN-MINUS +00A0 ; Consonant_Placeholder # Zs NO-BREAK SPACE +00D7 ; Consonant_Placeholder # Sm MULTIPLICATION SIGN +0A72..0A73 ; Consonant_Placeholder # Lo [2] GURMUKHI IRI..GURMUKHI URA +104E ; Consonant_Placeholder # Po MYANMAR SYMBOL AFOREMENTIONED +1900 ; Consonant_Placeholder # Lo LIMBU VOWEL-CARRIER LETTER +2012..2014 ; Consonant_Placeholder # Pd [3] FIGURE DASH..EM DASH +25CC ; Consonant_Placeholder # So DOTTED CIRCLE + +# ================================================ + +# Indic_Syllabic_Category=Consonant + +# Consonant (ordinary abugida consonants, with inherent vowels) + +# [Not derivable] + +0915..0939 ; Consonant # Lo [37] DEVANAGARI LETTER KA..DEVANAGARI LETTER HA +0958..095F ; Consonant # Lo [8] DEVANAGARI LETTER QA..DEVANAGARI LETTER YYA +0978..097F ; Consonant # Lo [8] DEVANAGARI LETTER MARWARI DDA..DEVANAGARI LETTER BBA +0995..09A8 ; Consonant # Lo [20] BENGALI LETTER KA..BENGALI LETTER NA +09AA..09B0 ; Consonant # Lo [7] BENGALI LETTER PA..BENGALI LETTER RA +09B2 ; Consonant # Lo BENGALI LETTER LA +09B6..09B9 ; Consonant # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA +09DC..09DD ; Consonant # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA +09DF 
; Consonant # Lo BENGALI LETTER YYA +09F0..09F1 ; Consonant # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH LOWER DIAGONAL +0A15..0A28 ; Consonant # Lo [20] GURMUKHI LETTER KA..GURMUKHI LETTER NA +0A2A..0A30 ; Consonant # Lo [7] GURMUKHI LETTER PA..GURMUKHI LETTER RA +0A32..0A33 ; Consonant # Lo [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA +0A35..0A36 ; Consonant # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA +0A38..0A39 ; Consonant # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA +0A59..0A5C ; Consonant # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA +0A5E ; Consonant # Lo GURMUKHI LETTER FA +0A95..0AA8 ; Consonant # Lo [20] GUJARATI LETTER KA..GUJARATI LETTER NA +0AAA..0AB0 ; Consonant # Lo [7] GUJARATI LETTER PA..GUJARATI LETTER RA +0AB2..0AB3 ; Consonant # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA +0AB5..0AB9 ; Consonant # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA +0B15..0B28 ; Consonant # Lo [20] ORIYA LETTER KA..ORIYA LETTER NA +0B2A..0B30 ; Consonant # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA +0B32..0B33 ; Consonant # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA +0B35..0B39 ; Consonant # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA +0B5C..0B5D ; Consonant # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA +0B5F ; Consonant # Lo ORIYA LETTER YYA +0B71 ; Consonant # Lo ORIYA LETTER WA +0B95 ; Consonant # Lo TAMIL LETTER KA +0B99..0B9A ; Consonant # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA +0B9C ; Consonant # Lo TAMIL LETTER JA +0B9E..0B9F ; Consonant # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA +0BA3..0BA4 ; Consonant # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA +0BA8..0BAA ; Consonant # Lo [3] TAMIL LETTER NA..TAMIL LETTER PA +0BAE..0BB9 ; Consonant # Lo [12] TAMIL LETTER MA..TAMIL LETTER HA +0C15..0C28 ; Consonant # Lo [20] TELUGU LETTER KA..TELUGU LETTER NA +0C2A..0C39 ; Consonant # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C58..0C59 ; Consonant # Lo [2] TELUGU LETTER TSA..TELUGU LETTER DZA +0C95..0CA8 ; Consonant # Lo [20] KANNADA LETTER 
KA..KANNADA LETTER NA +0CAA..0CB3 ; Consonant # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA +0CB5..0CB9 ; Consonant # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA +0CDE ; Consonant # Lo KANNADA LETTER FA +0D15..0D3A ; Consonant # Lo [38] MALAYALAM LETTER KA..MALAYALAM LETTER TTTA +0D9A..0DB1 ; Consonant # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA +0DB3..0DBB ; Consonant # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA +0DBD ; Consonant # Lo SINHALA LETTER DANTAJA LAYANNA +0DC0..0DC6 ; Consonant # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA +0E01..0E2E ; Consonant # Lo [46] THAI CHARACTER KO KAI..THAI CHARACTER HO NOKHUK +0E81..0E82 ; Consonant # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG +0E84 ; Consonant # Lo LAO LETTER KHO TAM +0E87..0E88 ; Consonant # Lo [2] LAO LETTER NGO..LAO LETTER CO +0E8A ; Consonant # Lo LAO LETTER SO TAM +0E8D ; Consonant # Lo LAO LETTER NYO +0E94..0E97 ; Consonant # Lo [4] LAO LETTER DO..LAO LETTER THO TAM +0E99..0E9F ; Consonant # Lo [7] LAO LETTER NO..LAO LETTER FO SUNG +0EA1..0EA3 ; Consonant # Lo [3] LAO LETTER MO..LAO LETTER LO LING +0EA5 ; Consonant # Lo LAO LETTER LO LOOT +0EA7 ; Consonant # Lo LAO LETTER WO +0EAA..0EAB ; Consonant # Lo [2] LAO LETTER SO SUNG..LAO LETTER HO SUNG +0EAD..0EAE ; Consonant # Lo [2] LAO LETTER O..LAO LETTER HO TAM +0EDC..0EDF ; Consonant # Lo [4] LAO HO NO..LAO LETTER KHMU NYO +0F40..0F47 ; Consonant # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA +0F49..0F6C ; Consonant # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA +1000..1020 ; Consonant # Lo [33] MYANMAR LETTER KA..MYANMAR LETTER LLA +103F ; Consonant # Lo MYANMAR LETTER GREAT SA +1050..1051 ; Consonant # Lo [2] MYANMAR LETTER SHA..MYANMAR LETTER SSA +105A..105D ; Consonant # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE +1061 ; Consonant # Lo MYANMAR LETTER SGAW KAREN SHA +1065..1066 ; Consonant # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER WESTERN PWO KAREN PWA 
+106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA +1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA +108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA +1703..170C ; Consonant # Lo [10] TAGALOG LETTER KA..TAGALOG LETTER YA +170E..1711 ; Consonant # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1723..1731 ; Consonant # Lo [15] HANUNOO LETTER KA..HANUNOO LETTER HA +1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA +1763..176C ; Consonant # Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA +176E..1770 ; Consonant # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA +1780..17A2 ; Consonant # Lo [35] KHMER LETTER KA..KHMER LETTER QA +1901..191E ; Consonant # Lo [30] LIMBU LETTER KA..LIMBU LETTER TRA +1950..1962 ; Consonant # Lo [19] TAI LE LETTER KA..TAI LE LETTER NA +1980..19AB ; Consonant # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI LUE LETTER LOW SUA +1A00..1A16 ; Consonant # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA +1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA +1A53..1A54 ; Consonant # Lo [2] TAI THAM LETTER LAE..TAI THAM LETTER GREAT SA +1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA +1B45..1B4B ; Consonant # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA +1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA +1BBB..1BBD ; Consonant # Lo [3] SUNDANESE LETTER REU..SUNDANESE LETTER BHA +1BC0..1BE3 ; Consonant # Lo [36] BATAK LETTER A..BATAK LETTER MBA +1C00..1C23 ; Consonant # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A +1C4D..1C4F ; Consonant # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA +A807..A80A ; Consonant # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO +A80C..A822 ; Consonant # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO +A840..A85D ; Consonant # Lo [30] PHAGS-PA 
LETTER KA..PHAGS-PA LETTER A +A862..A865 ; Consonant # Lo [4] PHAGS-PA LETTER QA..PHAGS-PA LETTER GGA +A869..A870 ; Consonant # Lo [8] PHAGS-PA LETTER TTA..PHAGS-PA LETTER ASPIRATED FA +A872 ; Consonant # Lo PHAGS-PA SUPERFIXED LETTER RA +A892..A8B3 ; Consonant # Lo [34] SAURASHTRA LETTER KA..SAURASHTRA LETTER LLA +A90A..A921 ; Consonant # Lo [24] KAYAH LI LETTER KA..KAYAH LI LETTER CA +A930..A946 ; Consonant # Lo [23] REJANG LETTER KA..REJANG LETTER A +A989..A98B ; Consonant # Lo [3] JAVANESE LETTER PA CEREK..JAVANESE LETTER NGA LELET RASWADI +A98F..A9B2 ; Consonant # Lo [36] JAVANESE LETTER KA..JAVANESE LETTER HA +A9E0..A9E4 ; Consonant # Lo [5] MYANMAR LETTER SHAN GHA..MYANMAR LETTER SHAN BHA +A9E7..A9EF ; Consonant # Lo [9] MYANMAR LETTER TAI LAING NYA..MYANMAR LETTER TAI LAING NNA +A9FA..A9FE ; Consonant # Lo [5] MYANMAR LETTER TAI LAING LLA..MYANMAR LETTER TAI LAING BHA +AA06..AA28 ; Consonant # Lo [35] CHAM LETTER KA..CHAM LETTER HA +AA60..AA6F ; Consonant # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA +AA71..AA73 ; Consonant # Lo [3] MYANMAR LETTER KHAMTI XA..MYANMAR LETTER KHAMTI RA +AA7A ; Consonant # Lo MYANMAR LETTER AITON RA +AA7E..AA7F ; Consonant # Lo [2] MYANMAR LETTER SHWE PALAUNG CHA..MYANMAR LETTER SHWE PALAUNG SHA +AA80..AAAF ; Consonant # Lo [48] TAI VIET LETTER LOW KO..TAI VIET LETTER HIGH O +AAE2..AAEA ; Consonant # Lo [9] MEETEI MAYEK LETTER CHA..MEETEI MAYEK LETTER SSA +ABC0..ABCD ; Consonant # Lo [14] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER HUK +ABD0 ; Consonant # Lo MEETEI MAYEK LETTER PHAM +ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTER BHAM +10A00 ; Consonant # Lo KHAROSHTHI LETTER A +10A10..10A13 ; Consonant # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA +10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA +10A19..10A33 ; Consonant # Lo [27] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER TTTHA +11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER 
OLD TAMIL NNNA +1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA +11107..11126 ; Consonant # Lo [32] CHAKMA LETTER KAA..CHAKMA LETTER HAA +11155..11172 ; Consonant # Lo [30] MAHAJANI LETTER KA..MAHAJANI LETTER RRA +11191..111B2 ; Consonant # Lo [34] SHARADA LETTER KA..SHARADA LETTER HA +11208..11211 ; Consonant # Lo [10] KHOJKI LETTER KA..KHOJKI LETTER JJA +11213..1122B ; Consonant # Lo [25] KHOJKI LETTER NYA..KHOJKI LETTER LLA +112BA..112DE ; Consonant # Lo [37] KHUDAWADI LETTER KA..KHUDAWADI LETTER HA +11315..11328 ; Consonant # Lo [20] GRANTHA LETTER KA..GRANTHA LETTER NA +1132A..11330 ; Consonant # Lo [7] GRANTHA LETTER PA..GRANTHA LETTER RA +11332..11333 ; Consonant # Lo [2] GRANTHA LETTER LA..GRANTHA LETTER LLA +11335..11339 ; Consonant # Lo [5] GRANTHA LETTER VA..GRANTHA LETTER HA +1148F..114AF ; Consonant # Lo [33] TIRHUTA LETTER KA..TIRHUTA LETTER HA +1158E..115AE ; Consonant # Lo [33] SIDDHAM LETTER KA..SIDDHAM LETTER HA +1160E..1162F ; Consonant # Lo [34] MODI LETTER KA..MODI LETTER LLA +1168A..116AA ; Consonant # Lo [33] TAKRI LETTER KA..TAKRI LETTER RRA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Dead + +# Dead Consonant (special consonant with killed vowel) + +# [Not derivable] + +09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Preceding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when preceding the main consonant + +# [Not derivable] + +0D4E ; Consonant_Preceding_Repha # Lo MALAYALAM LETTER DOT REPH + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Succeeding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when succeeding the main consonant + +# [Not derivable] + +17CC ; Consonant_Succeeding_Repha # Mn KHMER SIGN ROBAT +1B03 ; 
Consonant_Succeeding_Repha # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Succeeding_Repha # Mn SUNDANESE SIGN PANGLAYAR +A982 ; Consonant_Succeeding_Repha # Mn JAVANESE SIGN LAYAR + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Subjoined + +# Subjoined Consonant (C2 form subtending a base consonant in Tibetan, etc.) + +# [Not derivable] + +0F8D..0F97 ; Consonant_Subjoined # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Consonant_Subjoined # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +1929..192B ; Consonant_Subjoined # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1BA1 ; Consonant_Subjoined # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA2..1BA3 ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BAC..1BAD ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C24..1C25 ; Consonant_Subjoined # Mc [2] LEPCHA SUBJOINED LETTER YA..LEPCHA SUBJOINED LETTER RA +A867..A868 ; Consonant_Subjoined # Lo [2] PHAGS-PA SUBJOINED LETTER WA..PHAGS-PA SUBJOINED LETTER YA +A871 ; Consonant_Subjoined # Lo PHAGS-PA SUBJOINED LETTER RA +A9BD ; Consonant_Subjoined # Mc JAVANESE CONSONANT SIGN KERET + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Medial + +# Medial Consonant (medial liquid, occurring in clusters) + +# [Not derivable] + +0A75 ; Consonant_Medial # Mn GURMUKHI SIGN YAKASH +0EBC ; Consonant_Medial # Mn LAO SEMIVOWEL SIGN LO +0EBD ; Consonant_Medial # Lo LAO SEMIVOWEL SIGN NYO +103B..103C ; Consonant_Medial # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA +103D..103E ; Consonant_Medial # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +105E..1060 ; Consonant_Medial # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; 
Consonant_Medial # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +1A55 ; Consonant_Medial # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A56 ; Consonant_Medial # Mn TAI THAM CONSONANT SIGN MEDIAL LA +A9BE..A9BF ; Consonant_Medial # Mc [2] JAVANESE CONSONANT SIGN PENGKAL..JAVANESE CONSONANT SIGN CAKRA +AA33..AA34 ; Consonant_Medial # Mc [2] CHAM CONSONANT SIGN YA..CHAM CONSONANT SIGN RA +AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Final + +# Final Consonant (special final forms which do not take vowels) + +# [Not derivable] + +1930..1931 ; Consonant_Final # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Consonant_Final # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B +1A57 ; Consonant_Final # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A58..1A5E ; Consonant_Final # Mn [7] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN SA +1BBE..1BBF ; Consonant_Final # Lo [2] SUNDANESE LETTER FINAL K..SUNDANESE LETTER FINAL M +1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H +1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +A8B4 ; Consonant_Final # Mc SAURASHTRA CONSONANT SIGN HAARU +A94F..A951 ; Consonant_Final # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A952 ; Consonant_Final # Mc REJANG CONSONANT SIGN H +AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG +AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG +AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS +AA4C ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL M +AA4D ; Consonant_Final # Mc CHAM CONSONANT SIGN FINAL H +ABDB..ABE2 ; Consonant_Final # Lo [8] MEETEI MAYEK LETTER KOK LONSUM..MEETEI MAYEK LETTER I LONSUM + +# 
================================================ + +# Indic_Syllabic_Category=Consonant_Head_Letter + +# Head Letter (Tibetan) + +# [Not derivable] + +0F88..0F8C ; Consonant_Head_Letter # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN + +# ================================================ + +# Indic_Syllabic_Category=Modifying_Letter + +# Reanalyzed letters not participating in the abugida structure, but +# serving to modify the sound of an adjacent vowel or consonant. +# Note that this is not the same as General_Category=Modifier_Letter. + +# [Not derivable] + +0B83 ; Modifying_Letter # Lo TAMIL SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Tone_Letter + +# Tone Letter (spacing lexical tone mark with status as a letter) + +# [Not derivable] + +1970..1974 ; Tone_Letter # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6 +AAC0 ; Tone_Letter # Lo TAI VIET TONE MAI NUENG +AAC2 ; Tone_Letter # Lo TAI VIET TONE MAI SONG + +# ================================================ + +# Indic_Syllabic_Category=Tone_Mark + +# Tone Mark (nonspacing or spacing lexical tone mark) + +# [Not derivable] + +0951..0952 ; Tone_Mark # Mn [2] DEVANAGARI STRESS SIGN UDATTA..DEVANAGARI STRESS SIGN ANUDATTA +0E48..0E4B ; Tone_Mark # Mn [4] THAI CHARACTER MAI EK..THAI CHARACTER MAI CHATTAWA +0EC8..0ECB ; Tone_Mark # Mn [4] LAO TONE MAI EK..LAO TONE MAI CATAWA +1037 ; Tone_Mark # Mn MYANMAR SIGN DOT BELOW +1063..1064 ; Tone_Mark # Mc [2] MYANMAR TONE MARK SGAW KAREN HATHI..MYANMAR TONE MARK SGAW KAREN KE PHO +1069..106D ; Tone_Mark # Mc [5] MYANMAR SIGN WESTERN PWO KAREN TONE-1..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1087..108C ; Tone_Mark # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108D ; Tone_Mark # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +108F ; Tone_Mark # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109B ; Tone_Mark # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 +19C8..19C9 ; 
Tone_Mark # Mc [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A75..1A79 ; Tone_Mark # Mn [5] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN TONE-5 +1CD0..1CD2 ; Tone_Mark # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CD4..1CE0 ; Tone_Mark # Mn [13] VEDIC SIGN YAJURVEDIC MIDLINE SVARITA..VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CE1 ; Tone_Mark # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF4 ; Tone_Mark # Mn VEDIC TONE CANDRA ABOVE +A92B..A92D ; Tone_Mark # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +AA7B ; Tone_Mark # Mc MYANMAR SIGN PAO KAREN TONE +AA7C ; Tone_Mark # Mn MYANMAR SIGN TAI LAING TONE-2 +AA7D ; Tone_Mark # Mc MYANMAR SIGN TAI LAING TONE-5 +AABF ; Tone_Mark # Mn TAI VIET TONE MAI EK +AAC1 ; Tone_Mark # Mn TAI VIET TONE MAI THO +ABEC ; Tone_Mark # Mc MEETEI MAYEK LUM IYEK + +# ================================================ + +# Indic_Syllabic_Category=Gemination_Mark + +# Gemination Mark (doubling of the preceding or following consonant) + +# [Not derivable] + +0A71 ; Gemination_Mark # Mn GURMUKHI ADDAK +11237 ; Gemination_Mark # Mn KHOJKI SIGN SHADDA + +# ================================================ + +# Indic_Syllabic_Category=Cantillation_Mark + +# Cantillation Mark (recitation marks, such as svara markers for the Samaveda) + +# [Not derivable] + +A8E0..A8F1 ; Cantillation_Mark # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +11366..1136C ; Cantillation_Mark # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Cantillation_Mark # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA + +# ================================================ + +# Indic_Syllabic_Category=Register_Shifter + +# Register Shifter (shifts register for consonants, akin to a tone mark) + +# [Not derivable] + +17C9..17CB ; Register_Shifter # Mn [3] KHMER SIGN MUUSIKATOAN..KHMER SIGN BANTOC + +# ================================================ + +# 
Indic_Syllabic_Category=Non_Joiner + +# Non_Joiner (Zero Width Non-Joiner) + +# [Not derivable] + +200C ; Non_Joiner # Cf ZERO WIDTH NON-JOINER + +# ================================================ + +# Indic_Syllabic_Category=Joiner + +# Joiner (Zero Width Joiner) + +# [Not derivable] + +200D ; Joiner # Cf ZERO WIDTH JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number_Joiner + +# Number_Joiner (forms ligatures between numbers for multiplication) + +# [Not derivable] + +1107F ; Number_Joiner # Mn BRAHMI NUMBER JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number + +# Number (can be used a vowel-holders like consonant placeholders) + +# [Not derivable] + +0030..0039 ; Number # Nd [10] DIGIT ZERO..DIGIT NINE +0966..096F ; Number # Nd [10] DEVANAGARI DIGIT ZERO..DEVANAGARI DIGIT NINE +09E6..09EF ; Number # Nd [10] BENGALI DIGIT ZERO..BENGALI DIGIT NINE +0A66..0A6F ; Number # Nd [10] GURMUKHI DIGIT ZERO..GURMUKHI DIGIT NINE +0AE6..0AEF ; Number # Nd [10] GUJARATI DIGIT ZERO..GUJARATI DIGIT NINE +0B66..0B6F ; Number # Nd [10] ORIYA DIGIT ZERO..ORIYA DIGIT NINE +0BE6..0BEF ; Number # Nd [10] TAMIL DIGIT ZERO..TAMIL DIGIT NINE +0C66..0C6F ; Number # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE +0CE6..0CEF ; Number # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE +0D66..0D6F ; Number # Nd [10] MALAYALAM DIGIT ZERO..MALAYALAM DIGIT NINE +0DE6..0DEF ; Number # Nd [10] SINHALA LITH DIGIT ZERO..SINHALA LITH DIGIT NINE +0E50..0E59 ; Number # Nd [10] THAI DIGIT ZERO..THAI DIGIT NINE +0ED0..0ED9 ; Number # Nd [10] LAO DIGIT ZERO..LAO DIGIT NINE +0F20..0F29 ; Number # Nd [10] TIBETAN DIGIT ZERO..TIBETAN DIGIT NINE +0F2A..0F33 ; Number # No [10] TIBETAN DIGIT HALF ONE..TIBETAN DIGIT HALF ZERO +1040..1049 ; Number # Nd [10] MYANMAR DIGIT ZERO..MYANMAR DIGIT NINE +1090..1099 ; Number # Nd [10] MYANMAR SHAN DIGIT ZERO..MYANMAR SHAN DIGIT NINE +17E0..17E9 ; Number # Nd [10] KHMER DIGIT ZERO..KHMER 
DIGIT NINE +1946..194F ; Number # Nd [10] LIMBU DIGIT ZERO..LIMBU DIGIT NINE +19D0..19D9 ; Number # Nd [10] NEW TAI LUE DIGIT ZERO..NEW TAI LUE DIGIT NINE +1A80..1A89 ; Number # Nd [10] TAI THAM HORA DIGIT ZERO..TAI THAM HORA DIGIT NINE +1A90..1A99 ; Number # Nd [10] TAI THAM THAM DIGIT ZERO..TAI THAM THAM DIGIT NINE +1B50..1B59 ; Number # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE +1BB0..1BB9 ; Number # Nd [10] SUNDANESE DIGIT ZERO..SUNDANESE DIGIT NINE +1C40..1C49 ; Number # Nd [10] LEPCHA DIGIT ZERO..LEPCHA DIGIT NINE +A8D0..A8D9 ; Number # Nd [10] SAURASHTRA DIGIT ZERO..SAURASHTRA DIGIT NINE +A900..A909 ; Number # Nd [10] KAYAH LI DIGIT ZERO..KAYAH LI DIGIT NINE +A9D0..A9D9 ; Number # Nd [10] JAVANESE DIGIT ZERO..JAVANESE DIGIT NINE +A9F0..A9F9 ; Number # Nd [10] MYANMAR TAI LAING DIGIT ZERO..MYANMAR TAI LAING DIGIT NINE +AA50..AA59 ; Number # Nd [10] CHAM DIGIT ZERO..CHAM DIGIT NINE +ABF0..ABF9 ; Number # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE +10A40..10A47 ; Number # No [8] KHAROSHTHI DIGIT ONE..KHAROSHTHI NUMBER ONE THOUSAND +11066..1106F ; Number # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11136..1113F ; Number # Nd [10] CHAKMA DIGIT ZERO..CHAKMA DIGIT NINE +111D0..111D9 ; Number # Nd [10] SHARADA DIGIT ZERO..SHARADA DIGIT NINE +111E1..111F4 ; Number # No [20] SINHALA ARCHAIC DIGIT ONE..SINHALA ARCHAIC NUMBER ONE THOUSAND +112F0..112F9 ; Number # Nd [10] KHUDAWADI DIGIT ZERO..KHUDAWADI DIGIT NINE +114D0..114D9 ; Number # Nd [10] TIRHUTA DIGIT ZERO..TIRHUTA DIGIT NINE +11650..11659 ; Number # Nd [10] MODI DIGIT ZERO..MODI DIGIT NINE +116C0..116C9 ; Number # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE + +# ================================================ + +# Indic_Syllabic_Category=Brahmi_Joining_Number + +# Brahmi Joining Number +# Similar to Numbers, can be used as vowel-holders like consonant placeholders, +# but may also be joined by a Number_Joiner of the same script (e.g. 
in +# Brahmi) + +# [Not derivable] + +11052..11065 ; Brahmi_Joining_Number # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND + +# EOF diff --git a/data/8.0.0-indic-positional-category.txt b/data/8.0.0-indic-positional-category.txt new file mode 100644 index 0000000..92cca55 --- /dev/null +++ b/data/8.0.0-indic-positional-category.txt @@ -0,0 +1,632 @@ +# IndicPositionalCategory-8.0.0.txt +# Date: 2015-05-12, 10:00:00 GMT [RP, KW, LI] +# +# Unicode Character Database +# Copyright (c) 1991-2015 Unicode, Inc. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Positional_Category enumerated property +# +# Scope: This property is aimed at the problem of +# the specification of syllabic structure for Indic scripts. +# Because dependent vowels (matras), visible viramas, and other +# characters are placed in notional slots around the consonant (or +# consonant cluster) core of an Indic syllable, there may be +# cooccurrence constraints or other interactions. Also, it may be +# desirable, in cases where more than one such character may occur in +# sequence, as for example, in a top slot and a bottom slot, to +# specify preferred orders for spelling. As such, this property +# is designed primarily to supplement the Indic_Syllabic_Category +# property. +# +# Note that this property is *not* intended as +# a prescriptive property regarding display or font design, +# for a number of reasons. Good font design requires information +# that is outside the context of a character encoding standard, +# and is best handled in other venues. For Indic dependent +# vowels and similar characters, in particular: +# +# 1. Matra placement may vary somewhat based on typeface design. +# 2. Matra placement, even within a single script, may vary +# somewhat according to historic period or local conventions. +# 3. 
Matra placement may be changed by explicit orthographic reform +# decisions. +# 4. Matras may ligate in various ways with a consonant (or even +# other elements of a syllable) instead of occurring in a +# discrete location. +# 5. Matra display may be contextually determined. This is +# notable, for example, in the Tamil script, where the shape +# and placement of -u and -uu vowels depends strongly on +# which consonant they adjoin. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Positional_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. +# +# The scripts assessed as containing dependent vowels or similar characters +# in the structural sense used for the Indic_Positional_Category are the +# following: +# +# Ahom, Balinese, Batak, Bengali, Brahmi, Buginese, Buhid, Chakma, +# Cham, Devanagari, Grantha, Gujarati, Gurmukhi, Hanunoo, Javanese, +# Kaithi, Kannada, Kharoshthi, Khmer, Khojki, Khudawadi, Lao, Lepcha, +# Limbu, Malayalam, Meetei Mayek, Modi, Myanmar, New Tai Lue, Oriya, +# Rejang, Saurashtra, Sharada, Siddham, Sinhala, Sundanese, Syloti +# Nagri, Tagalog, Tagbanwa, Tai Tham, Tai Viet, Takri, Tamil, Telugu, +# Thai, Tibetan, and Tirhuta. +# +# All characters for all other scripts not in that list +# take the default value for this property. +# +# See IndicSyllabicCategory.txt for a slightly more extended +# list of Indic scripts, including those which do not have +# positional characters. Currently, those additional +# Indic scripts without positional characters are +# Kayah Li, Mahajani, Multani, Phags-pa, and Tai Le. 
+# + +# ================================================ + +# Property: Indic_Positional_Category +# +# All code points not explicitly listed for Indic_Positional_Category +# have the value NA (not applicable). +# +# @missing: 0000..10FFFF; NA + +# ------------------------------------------------ + +# Indic_Positional_Category=Right + +0903 ; Right # Mc DEVANAGARI SIGN VISARGA +093B ; Right # Mc DEVANAGARI VOWEL SIGN OOE +093E ; Right # Mc DEVANAGARI VOWEL SIGN AA +0940 ; Right # Mc DEVANAGARI VOWEL SIGN II +0949..094C ; Right # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094F ; Right # Mc DEVANAGARI VOWEL SIGN AW +0982..0983 ; Right # Mc [2] BENGALI SIGN ANUSVARA..BENGALI SIGN VISARGA +09BE ; Right # Mc BENGALI VOWEL SIGN AA +09C0 ; Right # Mc BENGALI VOWEL SIGN II +09D7 ; Right # Mc BENGALI AU LENGTH MARK +0A03 ; Right # Mc GURMUKHI SIGN VISARGA +0A3E ; Right # Mc GURMUKHI VOWEL SIGN AA +0A40 ; Right # Mc GURMUKHI VOWEL SIGN II +0A83 ; Right # Mc GUJARATI SIGN VISARGA +0ABE ; Right # Mc GUJARATI VOWEL SIGN AA +0AC0 ; Right # Mc GUJARATI VOWEL SIGN II +0ACB..0ACC ; Right # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0B02..0B03 ; Right # Mc [2] ORIYA SIGN ANUSVARA..ORIYA SIGN VISARGA +0B3E ; Right # Mc ORIYA VOWEL SIGN AA +0B40 ; Right # Mc ORIYA VOWEL SIGN II +0BBE..0BBF ; Right # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC1..0BC2 ; Right # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +# Note: U and UU have contextually variable placement in Tamil. 
+0BD7 ; Right # Mc TAMIL AU LENGTH MARK +0C01..0C03 ; Right # Mc [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN VISARGA +0C41..0C44 ; Right # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C82..0C83 ; Right # Mc [2] KANNADA SIGN ANUSVARA..KANNADA SIGN VISARGA +0CBE ; Right # Mc KANNADA VOWEL SIGN AA +0CC1..0CC4 ; Right # Mc [4] KANNADA VOWEL SIGN U..KANNADA VOWEL SIGN VOCALIC RR +0CD5..0CD6 ; Right # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0D02..0D03 ; Right # Mc [2] MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA +0D3E..0D40 ; Right # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D42 ; Right # Mn [2] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN UU +# Note: U and UU form complex ligatures with consonants in older Malayalam orthography. +0D57 ; Right # Mc MALAYALAM AU LENGTH MARK +0D82..0D83 ; Right # Mc [2] SINHALA SIGN ANUSVARAYA..SINHALA SIGN VISARGAYA +0DCF..0DD1 ; Right # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD8 ; Right # Mc SINHALA VOWEL SIGN GAETTA-PILLA +0DDF ; Right # Mc SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Right # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Right # Lo THAI CHARACTER SARA A +0E32..0E33 ; Right # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E45 ; Right # Lo THAI CHARACTER LAKKHANGYAO +0EB0 ; Right # Lo LAO VOWEL SIGN A +0EB2..0EB3 ; Right # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0F3E ; Right # Mc TIBETAN SIGN YAR TSHES +0F7F ; Right # Mc TIBETAN SIGN RNAM BCAD +102B..102C ; Right # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +1038 ; Right # Mc MYANMAR SIGN VISARGA +103B ; Right # Mc MYANMAR CONSONANT SIGN MEDIAL YA +1056..1057 ; Right # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1062..1064 ; Right # Mc [3] MYANMAR VOWEL SIGN SGAW KAREN EU..MYANMAR TONE MARK SGAW KAREN KE PHO +1067..106D ; Right # Mc [7] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR SIGN 
WESTERN PWO KAREN TONE-5 +1083 ; Right # Mc MYANMAR VOWEL SIGN SHAN AA +1087..108C ; Right # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108F ; Right # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109C ; Right # Mc [3] MYANMAR SIGN KHAMTI TONE-1..MYANMAR VOWEL SIGN AITON A +17B6 ; Right # Mc KHMER VOWEL SIGN AA +17C7..17C8 ; Right # Mc [2] KHMER SIGN REAHMUK..KHMER SIGN YUUKALEAPINTU +1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI +1929..192B ; Right # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1930..1931 ; Right # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Right # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +19B0..19B4 ; Right # Lo [5] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN UU +19B8..19B9 ; Right # Lo [2] NEW TAI LUE VOWEL SIGN OA..NEW TAI LUE VOWEL SIGN UE +19BB..19C0 ; Right # Lo [6] NEW TAI LUE VOWEL SIGN AAY..NEW TAI LUE VOWEL SIGN IY +19C8..19C9 ; Right # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A1A ; Right # Mc BUGINESE VOWEL SIGN O +1A57 ; Right # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A61 ; Right # Mc TAI THAM VOWEL SIGN A +1A63..1A64 ; Right # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A6D ; Right # Mc TAI THAM VOWEL SIGN OY +1B04 ; Right # Mc BALINESE SIGN BISAH +1B35 ; Right # Mc BALINESE VOWEL SIGN TEDUNG +1B44 ; Right # Mc BALINESE ADEG ADEG +1B82 ; Right # Mc SUNDANESE SIGN PANGWISAD +1BA1 ; Right # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA7 ; Right # Mc SUNDANESE VOWEL SIGN PANOLONG +1BAA ; Right # Mc SUNDANESE SIGN PAMAAEH +1BE7 ; Right # Mc BATAK VOWEL SIGN E +1BEA..1BEC ; Right # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BEE ; Right # Mc BATAK VOWEL SIGN U +1BF2..1BF3 ; Right # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +1C24..1C26 ; Right # Mc [3] LEPCHA SUBJOINED LETTER YA..LEPCHA VOWEL SIGN AA +1C2A..1C2B ; Right # Mc [2] LEPCHA VOWEL SIGN U..LEPCHA VOWEL SIGN UU +1CE1 ; Right # Mc VEDIC 
TONE ATHARVAVEDIC INDEPENDENT SVARITA +A823..A824 ; Right # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A827 ; Right # Mc SYLOTI NAGRI VOWEL SIGN OO +A880..A881 ; Right # Mc [2] SAURASHTRA SIGN ANUSVARA..SAURASHTRA SIGN VISARGA +A8B4..A8C3 ; Right # Mc [16] SAURASHTRA CONSONANT SIGN HAARU..SAURASHTRA VOWEL SIGN AU +A952..A953 ; Right # Mc [2] REJANG CONSONANT SIGN H..REJANG VIRAMA +A983 ; Right # Mc JAVANESE SIGN WIGNYAN +A9B4..A9B5 ; Right # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9BD..A9BF ; Right # Mc [3] JAVANESE CONSONANT SIGN KERET..JAVANESE CONSONANT SIGN CAKRA +AA33 ; Right # Mc CHAM CONSONANT SIGN YA +AA4D ; Right # Mc CHAM CONSONANT SIGN FINAL H +AA7B ; Right # Mc MYANMAR SIGN PAO KAREN TONE +AA7D ; Right # Mc MYANMAR SIGN TAI LAING TONE-5 +AAB1 ; Right # Lo TAI VIET VOWEL AA +AABA ; Right # Lo TAI VIET VOWEL UA +AABD ; Right # Lo TAI VIET VOWEL AN +AAEF ; Right # Mc MEETEI MAYEK VOWEL SIGN AAU +AAF5 ; Right # Mc MEETEI MAYEK VOWEL SIGN VISARGA +ABE3..ABE4 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE6..ABE7 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE9..ABEA ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +ABEC ; Right # Mc MEETEI MAYEK LUM IYEK +11000 ; Right # Mc BRAHMI SIGN CANDRABINDU +11002 ; Right # Mc BRAHMI SIGN VISARGA +11082 ; Right # Mc KAITHI SIGN VISARGA +110B0 ; Right # Mc KAITHI VOWEL SIGN AA +110B2 ; Right # Mc KAITHI VOWEL SIGN II +110B7..110B8 ; Right # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11182 ; Right # Mc SHARADA SIGN VISARGA +111B3 ; Right # Mc SHARADA VOWEL SIGN AA +111B5 ; Right # Mc SHARADA VOWEL SIGN II +111C0 ; Right # Mc SHARADA SIGN VIRAMA +1122C..1122E ; Right # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +11235 ; Right # Mc KHOJKI SIGN VIRAMA +112E0 ; Right # Mc KHUDAWADI VOWEL SIGN AA +112E2 ; Right # Mc KHUDAWADI VOWEL SIGN II +11302..11303 ; Right # Mc [2] 
GRANTHA SIGN ANUSVARA..GRANTHA SIGN VISARGA +1133E..1133F ; Right # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11341..11342 ; Right # Mc [2] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN UU +# Note: U and UU have contextually variable placement in Grantha. +11343..11344 ; Right # Mc [2] GRANTHA VOWEL SIGN VOCALIC R..GRANTHA VOWEL SIGN VOCALIC RR +1134D ; Right # Mc GRANTHA SIGN VIRAMA +11357 ; Right # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Right # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +114B0 ; Right # Mc TIRHUTA VOWEL SIGN AA +114B2 ; Right # Mc TIRHUTA VOWEL SIGN II +114BD ; Right # Mc TIRHUTA VOWEL SIGN SHORT O +114C1 ; Right # Mc TIRHUTA SIGN VISARGA +115AF ; Right # Mc SIDDHAM VOWEL SIGN AA +115B1 ; Right # Mc SIDDHAM VOWEL SIGN II +115BE ; Right # Mc SIDDHAM SIGN VISARGA +11630..11632 ; Right # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +1163B..1163C ; Right # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +1163E ; Right # Mc MODI SIGN VISARGA +116AC ; Right # Mc TAKRI SIGN VISARGA +116AF ; Right # Mc TAKRI VOWEL SIGN II +116B6 ; Right # Mc TAKRI SIGN VIRAMA +11720..11721 ; Right # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA + +# Indic_Positional_Category=Left + +093F ; Left # Mc DEVANAGARI VOWEL SIGN I +094E ; Left # Mc DEVANAGARI VOWEL SIGN PRISHTHAMATRA E +09BF ; Left # Mc BENGALI VOWEL SIGN I +09C7..09C8 ; Left # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +0A3F ; Left # Mc GURMUKHI VOWEL SIGN I +0ABF ; Left # Mc GUJARATI VOWEL SIGN I +0B47 ; Left # Mc ORIYA VOWEL SIGN E +0BC6..0BC8 ; Left # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0D46..0D48 ; Left # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0DD9 ; Left # Mc SINHALA VOWEL SIGN KOMBUVA +0DDB ; Left # Mc SINHALA VOWEL SIGN KOMBU DEKA +0F3F ; Left # Mc TIBETAN SIGN MAR TSHES +1031 ; Left # Mc MYANMAR VOWEL SIGN E +1084 ; Left # Mc MYANMAR VOWEL SIGN SHAN E +17C1..17C3 ; Left # Mc [3] KHMER VOWEL SIGN E..KHMER VOWEL SIGN AI +1A19 ; Left # Mc 
BUGINESE VOWEL SIGN E +1A55 ; Left # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A6E..1A72 ; Left # Mc [5] TAI THAM VOWEL SIGN E..TAI THAM VOWEL SIGN THAM AI +1B3E..1B3F ; Left # Mc [2] BALINESE VOWEL SIGN TALING..BALINESE VOWEL SIGN TALING REPA +1BA6 ; Left # Mc SUNDANESE VOWEL SIGN PANAELAENG +1C27..1C28 ; Left # Mc [2] LEPCHA VOWEL SIGN I..LEPCHA VOWEL SIGN O +1C34..1C35 ; Left # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A9BA..A9BB ; Left # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +AA2F..AA30 ; Left # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA34 ; Left # Mc CHAM CONSONANT SIGN RA +AAEB ; Left # Mc MEETEI MAYEK VOWEL SIGN II +AAEE ; Left # Mc MEETEI MAYEK VOWEL SIGN AU +110B1 ; Left # Mc KAITHI VOWEL SIGN I +1112C ; Left # Mc CHAKMA VOWEL SIGN E +111B4 ; Left # Mc SHARADA VOWEL SIGN I +112E1 ; Left # Mc KHUDAWADI VOWEL SIGN I +11347..11348 ; Left # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +114B1 ; Left # Mc TIRHUTA VOWEL SIGN I +114B9 ; Left # Mc TIRHUTA VOWEL SIGN E +115B0 ; Left # Mc SIDDHAM VOWEL SIGN I +115B8 ; Left # Mc SIDDHAM VOWEL SIGN E +116AE ; Left # Mc TAKRI VOWEL SIGN I +11726 ; Left # Mc AHOM VOWEL SIGN E + +# Indic_Positional_Category=Visual_Order_Left + +# These are dependent vowels that occur to the left of the consonant +# letter in a syllable, but which occur in scripts using the visual order +# model, instead of the logical order model. Because of the different +# model, these left-side vowels occur first in the backing store (before +# the consonant letter) and are not reordered during text rendering. 
+# +# [Derivation: Logical_Order_Exception=Yes] + +0E40..0E44 ; Visual_Order_Left # Lo [5] THAI CHARACTER SARA E..THAI CHARACTER SARA AI MAIMALAI +0EC0..0EC4 ; Visual_Order_Left # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +19B5..19B7 ; Visual_Order_Left # Lo [3] NEW TAI LUE VOWEL SIGN E..NEW TAI LUE VOWEL SIGN O +19BA ; Visual_Order_Left # Lo NEW TAI LUE VOWEL SIGN AY +AAB5..AAB6 ; Visual_Order_Left # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB9 ; Visual_Order_Left # Lo TAI VIET VOWEL UEA +AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL AY + +# Indic_Positional_Category=Left_And_Right + +09CB..09CC ; Left_And_Right # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +0B4B ; Left_And_Right # Mc ORIYA VOWEL SIGN O +0BCA..0BCC ; Left_And_Right # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0D4A..0D4C ; Left_And_Right # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0DDC ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA +0DDE ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA +17C0 ; Left_And_Right # Mc KHMER VOWEL SIGN IE +17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU +1B40..1B41 ; Left_And_Right # Mc [2] BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1134B..1134C ; Left_And_Right # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +114BC ; Left_And_Right # Mc TIRHUTA VOWEL SIGN O +114BE ; Left_And_Right # Mc TIRHUTA VOWEL SIGN AU +115BA ; Left_And_Right # Mc SIDDHAM VOWEL SIGN O + +# Indic_Positional_Category=Top + +0900..0902 ; Top # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +093A ; Top # Mn DEVANAGARI VOWEL SIGN OE +0945..0948 ; Top # Mn [4] DEVANAGARI VOWEL SIGN CANDRA E..DEVANAGARI VOWEL SIGN AI +0951 ; Top # Mn DEVANAGARI STRESS SIGN UDATTA +0953..0955 ; Top # Mn [3] DEVANAGARI GRAVE ACCENT..DEVANAGARI VOWEL SIGN CANDRA LONG E +0981 ; Top # Mn BENGALI SIGN CANDRABINDU +0A01..0A02 ; Top # Mn [2] GURMUKHI 
SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A47..0A48 ; Top # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Top # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0A70..0A71 ; Top # Mn [2] GURMUKHI TIPPI..GURMUKHI ADDAK +0A81..0A82 ; Top # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0AC5 ; Top # Mn GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Top # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0B01 ; Top # Mn ORIYA SIGN CANDRABINDU +0B3F ; Top # Mn ORIYA VOWEL SIGN I +0B56 ; Top # Mn ORIYA AI LENGTH MARK +0B82 ; Top # Mn TAMIL SIGN ANUSVARA +0BC0 ; Top # Mn TAMIL VOWEL SIGN II +0BCD ; Top # Mn TAMIL SIGN VIRAMA +0C00 ; Top # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C3E..0C40 ; Top # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C46..0C47 ; Top # Mn [2] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN EE +0C4A..0C4D ; Top # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA +0C55 ; Top # Mn TELUGU LENGTH MARK +0C81 ; Top # Mn KANNADA SIGN CANDRABINDU +0CBF ; Top # Mn KANNADA VOWEL SIGN I +0CC6 ; Top # Mn KANNADA VOWEL SIGN E +0CCC..0CCD ; Top # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA +0D01 ; Top # Mn MALAYALAM SIGN CANDRABINDU +0D4D ; Top # Mn MALAYALAM SIGN VIRAMA +0DCA ; Top # Mn SINHALA SIGN AL-LAKUNA +0DD2..0DD3 ; Top # Mn [2] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN DIGA IS-PILLA +0E31 ; Top # Mn THAI CHARACTER MAI HAN-AKAT +0E34..0E37 ; Top # Mn [4] THAI CHARACTER SARA I..THAI CHARACTER SARA UEE +0E47..0E4E ; Top # Mn [8] THAI CHARACTER MAITAIKHU..THAI CHARACTER YAMAKKAN +0EB1 ; Top # Mn LAO VOWEL SIGN MAI KAN +0EB4..0EB7 ; Top # Mn [4] LAO VOWEL SIGN I..LAO VOWEL SIGN YY +0EBB ; Top # Mn LAO VOWEL SIGN MAI KON +0EC8..0ECD ; Top # Mn [6] LAO TONE MAI EK..LAO NIGGAHITA +0F39 ; Top # Mn TIBETAN MARK TSA -PHRU +0F72 ; Top # Mn TIBETAN VOWEL SIGN I +0F7A..0F7E ; Top # Mn [5] TIBETAN VOWEL SIGN E..TIBETAN SIGN RJES SU NGA RO +0F80 ; Top # Mn TIBETAN VOWEL SIGN REVERSED I +0F82..0F83 ; Top # Mn [2] 
TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +0F86..0F87 ; Top # Mn [2] TIBETAN SIGN LCI RTAGS..TIBETAN SIGN YANG RTAGS +102D..102E ; Top # Mn [2] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN II +1032..1036 ; Top # Mn [5] MYANMAR VOWEL SIGN AI..MYANMAR SIGN ANUSVARA +103A ; Top # Mn MYANMAR SIGN ASAT +1071..1074 ; Top # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1085..1086 ; Top # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109D ; Top # Mn MYANMAR VOWEL SIGN AITON AI +1712 ; Top # Mn TAGALOG VOWEL SIGN I +1732 ; Top # Mn HANUNOO VOWEL SIGN I +1752 ; Top # Mn BUHID VOWEL SIGN I +1772 ; Top # Mn TAGBANWA VOWEL SIGN I +17B7..17BA ; Top # Mn [4] KHMER VOWEL SIGN I..KHMER VOWEL SIGN YY +17C6 ; Top # Mn KHMER SIGN NIKAHIT +17C9..17D1 ; Top # Mn [9] KHMER SIGN MUUSIKATOAN..KHMER SIGN VIRIAM +17D3 ; Top # Mn KHMER SIGN BATHAMASAT +17DD ; Top # Mn KHMER SIGN ATTHACAN +1920..1921 ; Top # Mn [2] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN I +1927..1928 ; Top # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Top # Mn LIMBU SIGN KEMPHRENG +1A17 ; Top # Mn BUGINESE VOWEL SIGN I +1A1B ; Top # Mn BUGINESE VOWEL SIGN AE +1A58..1A5A ; Top # Mn [3] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN LOW PA +1A62 ; Top # Mn TAI THAM VOWEL SIGN MAI SAT +1A65..1A68 ; Top # Mn [4] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN UUE +1A6B ; Top # Mn TAI THAM VOWEL SIGN O +1A73..1A7C ; Top # Mn [10] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN KHUEN-LUE KARAN +1B00..1B03 ; Top # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG +1B34 ; Top # Mn BALINESE SIGN REREKAN +1B36..1B37 ; Top # Mn [2] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN ULU SARI +1B42 ; Top # Mn BALINESE VOWEL SIGN PEPET +1B6B ; Top # Mn BALINESE MUSICAL SYMBOL COMBINING TEGEH +1B6D..1B73 ; Top # Mn [7] BALINESE MUSICAL SYMBOL COMBINING KEMPUL..BALINESE MUSICAL SYMBOL COMBINING GONG +1B80..1B81 ; Top # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR +1BA4 ; Top 
# Mn SUNDANESE VOWEL SIGN PANGHULU +1BA8..1BA9 ; Top # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE6 ; Top # Mn BATAK SIGN TOMPI +1BE8..1BE9 ; Top # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BED ; Top # Mn BATAK VOWEL SIGN KARO O +1BEF..1BF1 ; Top # Mn [3] BATAK VOWEL SIGN U FOR SIMALUNGUN SA..BATAK CONSONANT SIGN H +1C2D..1C33 ; Top # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +1C36 ; Top # Mn LEPCHA SIGN RAN +1CD0..1CD2 ; Top # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CDA..1CDB ; Top # Mn [2] VEDIC TONE DOUBLE SVARITA..VEDIC TONE TRIPLE SVARITA +1CE0 ; Top # Mn VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CF4 ; Top # Mn VEDIC TONE CANDRA ABOVE +A806 ; Top # Mn SYLOTI NAGRI SIGN HASANTA +A80B ; Top # Mn SYLOTI NAGRI SIGN ANUSVARA +A826 ; Top # Mn SYLOTI NAGRI VOWEL SIGN E +A8E0..A8F1 ; Top # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +A94A ; Top # Mn REJANG VOWEL SIGN AI +A94F..A951 ; Top # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A980..A982 ; Top # Mn [3] JAVANESE SIGN PANYANGGA..JAVANESE SIGN LAYAR +A9B3 ; Top # Mn JAVANESE SIGN CECAK TELU +A9B6..A9B7 ; Top # Mn [2] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN WULU MELIK +A9BC ; Top # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Top # Mn MYANMAR SIGN SHAN SAW +AA29..AA2C ; Top # Mn [4] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN EI +AA2E ; Top # Mn CHAM VOWEL SIGN OE +AA31 ; Top # Mn CHAM VOWEL SIGN AU +AA43 ; Top # Mn CHAM CONSONANT SIGN FINAL NG +AA4C ; Top # Mn CHAM CONSONANT SIGN FINAL M +AA7C ; Top # Mn MYANMAR SIGN TAI LAING TONE-2 +AAB0 ; Top # Mn TAI VIET MAI KANG +AAB2..AAB3 ; Top # Mn [2] TAI VIET VOWEL I..TAI VIET VOWEL UE +AAB7..AAB8 ; Top # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AABE..AABF ; Top # Mn [2] TAI VIET VOWEL AM..TAI VIET TONE MAI EK +AAC1 ; Top # Mn TAI VIET TONE MAI THO +AAED ; Top # Mn MEETEI MAYEK VOWEL SIGN AAI +ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP +10A05 ; Top # Mn 
KHAROSHTHI VOWEL SIGN E +10A0F ; Top # Mn KHAROSHTHI SIGN VISARGA +10A38 ; Top # Mn KHAROSHTHI SIGN BAR ABOVE +11001 ; Top # Mn BRAHMI SIGN ANUSVARA +11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II +11042..11046 ; Top # Mn [5] BRAHMI VOWEL SIGN E..BRAHMI VIRAMA +11080..11081 ; Top # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI VOWEL SIGN AI +11100..11102 ; Top # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA +11127..11129 ; Top # Mn [3] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN II +1112D ; Top # Mn CHAKMA VOWEL SIGN AI +11130 ; Top # Mn CHAKMA VOWEL SIGN OI +11134 ; Top # Mn CHAKMA MAAYYAA +11180..11181 ; Top # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +111BC..111BE ; Top # Mn [3] SHARADA VOWEL SIGN E..SHARADA VOWEL SIGN O +111CB ; Top # Mn SHARADA VOWEL MODIFIER MARK +11230..11231 ; Top # Mn [2] KHOJKI VOWEL SIGN E..KHOJKI VOWEL SIGN AI +11234 ; Top # Mn KHOJKI SIGN ANUSVARA +11236..11237 ; Top # Mn [2] KHOJKI SIGN NUKTA..KHOJKI SIGN SHADDA +112DF ; Top # Mn KHUDAWADI SIGN ANUSVARA +112E5..112E8 ; Top # Mn [4] KHUDAWADI VOWEL SIGN E..KHUDAWADI VOWEL SIGN AU +11301 ; Top # Mn GRANTHA SIGN CANDRABINDU +11340 ; Top # Mn GRANTHA VOWEL SIGN II +11366..1136C ; Top # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Top # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA +114BA ; Top # Mn TIRHUTA VOWEL SIGN SHORT E +114BF..114C0 ; Top # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Top # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +11639..1163A ; Top # Mn [2] MODI VOWEL SIGN E..MODI VOWEL SIGN AI +1163D ; Top # Mn MODI SIGN ANUSVARA +11640 ; Top # Mn MODI SIGN ARDHACANDRA +116AB ; Top # Mn TAKRI SIGN ANUSVARA +116AD ; Top # Mn TAKRI VOWEL SIGN AA +116B2..116B5 ; Top # Mn [4] TAKRI VOWEL SIGN E..TAKRI VOWEL SIGN AU +1171F ; Top # Mn AHOM CONSONANT SIGN MEDIAL LIGATING RA +11722..11723 ; Top # 
Mn [2] AHOM VOWEL SIGN I..AHOM VOWEL SIGN II +11727 ; Top # Mn AHOM VOWEL SIGN AW +11729..1172B ; Top # Mn [3] AHOM VOWEL SIGN AI..AHOM SIGN KILLER + +# Indic_Positional_Category=Bottom + +093C ; Bottom # Mn DEVANAGARI SIGN NUKTA +0941..0944 ; Bottom # Mn [4] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN VOCALIC RR +094D ; Bottom # Mn DEVANAGARI SIGN VIRAMA +0952 ; Bottom # Mn DEVANAGARI STRESS SIGN ANUDATTA +0956..0957 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN UE..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BC ; Bottom # Mn BENGALI SIGN NUKTA +09C1..09C4 ; Bottom # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09CD ; Bottom # Mn BENGALI SIGN VIRAMA +09E2..09E3 ; Bottom # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3C ; Bottom # Mn GURMUKHI SIGN NUKTA +0A41..0A42 ; Bottom # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A4D ; Bottom # Mn GURMUKHI SIGN VIRAMA +0A75 ; Bottom # Mn GURMUKHI SIGN YAKASH +0ABC ; Bottom # Mn GUJARATI SIGN NUKTA +0AC1..0AC4 ; Bottom # Mn [4] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN VOCALIC RR +0ACD ; Bottom # Mn GUJARATI SIGN VIRAMA +0AE2..0AE3 ; Bottom # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3C ; Bottom # Mn ORIYA SIGN NUKTA +0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B4D ; Bottom # Mn ORIYA SIGN VIRAMA +0B62..0B63 ; Bottom # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0C56 ; Bottom # Mn TELUGU AI LENGTH MARK +0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBC ; Bottom # Mn KANNADA SIGN NUKTA +0CE2..0CE3 ; Bottom # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D43..0D44 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC R..MALAYALAM VOWEL SIGN VOCALIC RR +0D62..0D63 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DD4 ; Bottom # 
Mn SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Bottom # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0E38..0E3A ; Bottom # Mn [3] THAI CHARACTER SARA U..THAI CHARACTER PHINTHU +0EB8..0EB9 ; Bottom # Mn [2] LAO VOWEL SIGN U..LAO VOWEL SIGN UU +0EBC ; Bottom # Mn LAO SEMIVOWEL SIGN LO +0F18..0F19 ; Bottom # Mn [2] TIBETAN ASTROLOGICAL SIGN -KHYUD PA..TIBETAN ASTROLOGICAL SIGN SDONG TSHUGS +0F35 ; Bottom # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Bottom # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0F71 ; Bottom # Mn TIBETAN VOWEL SIGN AA +0F74..0F75 ; Bottom # Mn [2] TIBETAN VOWEL SIGN U..TIBETAN VOWEL SIGN UU +0F84 ; Bottom # Mn TIBETAN MARK HALANTA +0F8D..0F97 ; Bottom # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Bottom # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +0FC6 ; Bottom # Mn TIBETAN SYMBOL PADMA GDAN +102F..1030 ; Bottom # Mn [2] MYANMAR VOWEL SIGN U..MYANMAR VOWEL SIGN UU +1037 ; Bottom # Mn MYANMAR SIGN DOT BELOW +103D..103E ; Bottom # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +1058..1059 ; Bottom # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +105E..1060 ; Bottom # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Bottom # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +108D ; Bottom # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +1713..1714 ; Bottom # Mn [2] TAGALOG VOWEL SIGN U..TAGALOG SIGN VIRAMA +1733..1734 ; Bottom # Mn [2] HANUNOO VOWEL SIGN U..HANUNOO SIGN PAMUDPOD +1753 ; Bottom # Mn BUHID VOWEL SIGN U +1773 ; Bottom # Mn TAGBANWA VOWEL SIGN U +17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA +1922 ; Bottom # Mn LIMBU VOWEL SIGN U +1932 ; Bottom # Mn LIMBU SMALL LETTER ANUSVARA +1939 ; Bottom # Mn LIMBU SIGN MUKPHRENG +193B ; Bottom # Mn LIMBU SIGN SA-I +1A18 ; Bottom # Mn BUGINESE VOWEL SIGN U +1A56 ; Bottom # Mn TAI THAM CONSONANT SIGN MEDIAL LA +1A5B..1A5E ; Bottom # Mn 
[4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1A69..1A6A ; Bottom # Mn [2] TAI THAM VOWEL SIGN U..TAI THAM VOWEL SIGN UU +1A6C ; Bottom # Mn TAI THAM VOWEL SIGN OA BELOW +1A7F ; Bottom # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1B38..1B3A ; Bottom # Mn [3] BALINESE VOWEL SIGN SUKU..BALINESE VOWEL SIGN RA REPA +1B6C ; Bottom # Mn BALINESE MUSICAL SYMBOL COMBINING ENDEP +1BA2..1BA3 ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BA5 ; Bottom # Mn SUNDANESE VOWEL SIGN PANYUKU +1BAC..1BAD ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C2C ; Bottom # Mn LEPCHA VOWEL SIGN E +1C37 ; Bottom # Mn LEPCHA SIGN NUKTA +1CD5..1CD9 ; Bottom # Mn [5] VEDIC TONE YAJURVEDIC AGGRAVATED INDEPENDENT SVARITA..VEDIC TONE YAJURVEDIC KATHAKA INDEPENDENT SVARITA SCHROEDER +1CDC..1CDF ; Bottom # Mn [4] VEDIC TONE KATHAKA ANUDATTA..VEDIC TONE THREE DOTS BELOW +1CED ; Bottom # Mn VEDIC SIGN TIRYAK +A825 ; Bottom # Mn SYLOTI NAGRI VOWEL SIGN U +A8C4 ; Bottom # Mn SAURASHTRA SIGN VIRAMA +A92B..A92D ; Bottom # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +A947..A949 ; Bottom # Mn [3] REJANG VOWEL SIGN I..REJANG VOWEL SIGN E +A94B..A94E ; Bottom # Mn [4] REJANG VOWEL SIGN O..REJANG VOWEL SIGN EA +A9B8..A9B9 ; Bottom # Mn [2] JAVANESE VOWEL SIGN SUKU..JAVANESE VOWEL SIGN SUKU MENDUT +AA2D ; Bottom # Mn CHAM VOWEL SIGN U +AA32 ; Bottom # Mn CHAM VOWEL SIGN UE +AA35..AA36 ; Bottom # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +AAB4 ; Bottom # Mn TAI VIET VOWEL U +AAEC ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UU +ABE8 ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK +10A02..10A03 ; Bottom # Mn [2] KHAROSHTHI VOWEL SIGN U..KHAROSHTHI VOWEL SIGN VOCALIC R +10A0C..10A0E ; Bottom # Mn [3] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN ANUSVARA +10A39..10A3A ; Bottom # Mn [2] KHAROSHTHI SIGN CAUDA..KHAROSHTHI SIGN DOT BELOW 
+1103C..11041 ; Bottom # Mn [6] BRAHMI VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL +110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU +110B9..110BA ; Bottom # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +1112A..1112B ; Bottom # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU +11131..11132 ; Bottom # Mn [2] CHAKMA O MARK..CHAKMA AU MARK +11173 ; Bottom # Mn MAHAJANI SIGN NUKTA +111B6..111BB ; Bottom # Mn [6] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN VOCALIC LL +111CC ; Bottom # Mn SHARADA EXTRA SHORT VOWEL MARK +1122F ; Bottom # Mn KHOJKI VOWEL SIGN U +112E3..112E4 ; Bottom # Mn [2] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN UU +112E9..112EA ; Bottom # Mn [2] KHUDAWADI SIGN NUKTA..KHUDAWADI SIGN VIRAMA +114B3..114B8 ; Bottom # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114C2..114C3 ; Bottom # Mn [2] TIRHUTA SIGN VIRAMA..TIRHUTA SIGN NUKTA +115B2..115B5 ; Bottom # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115BF..115C0 ; Bottom # Mn [2] SIDDHAM SIGN VIRAMA..SIDDHAM SIGN NUKTA +115DC..115DD ; Bottom # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11633..11638 ; Bottom # Mn [6] MODI VOWEL SIGN U..MODI VOWEL SIGN VOCALIC LL +1163F ; Bottom # Mn MODI SIGN VIRAMA +116B0..116B1 ; Bottom # Mn [2] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN UU +116B7 ; Bottom # Mn TAKRI SIGN NUKTA +1171D ; Bottom # Mn AHOM CONSONANT SIGN MEDIAL LA +11724..11725 ; Bottom # Mn [2] AHOM VOWEL SIGN U..AHOM VOWEL SIGN UU +11728 ; Bottom # Mn AHOM VOWEL SIGN O + +# Indic_Positional_Category=Top_And_Bottom + +0C48 ; Top_And_Bottom # Mn TELUGU VOWEL SIGN AI +0F73 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN II +0F76..0F79 ; Top_And_Bottom # Mn [4] TIBETAN VOWEL SIGN VOCALIC R..TIBETAN VOWEL SIGN VOCALIC LL +0F81 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN REVERSED II +1B3C ; Top_And_Bottom # Mn BALINESE VOWEL SIGN LA LENGA +1112E..1112F ; Top_And_Bottom # Mn [2] CHAKMA VOWEL SIGN O..CHAKMA VOWEL SIGN AU + +# 
Indic_Positional_Category=Top_And_Right + +0AC9 ; Top_And_Right # Mc GUJARATI VOWEL SIGN CANDRA O +0B57 ; Top_And_Right # Mc ORIYA AU LENGTH MARK +0CC0 ; Top_And_Right # Mc KANNADA VOWEL SIGN II +0CC7..0CC8 ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +1925..1926 ; Top_And_Right # Mc [2] LIMBU VOWEL SIGN OO..LIMBU VOWEL SIGN AU +1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG +111BF ; Top_And_Right # Mc SHARADA VOWEL SIGN AU +11232..11233 ; Top_And_Right # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Left + +0B48 ; Top_And_Left # Mc ORIYA VOWEL SIGN AI +0DDA ; Top_And_Left # Mc SINHALA VOWEL SIGN DIGA KOMBUVA +17BE ; Top_And_Left # Mc KHMER VOWEL SIGN OE +1C29 ; Top_And_Left # Mc LEPCHA VOWEL SIGN OO +114BB ; Top_And_Left # Mc TIRHUTA VOWEL SIGN AI +115B9 ; Top_And_Left # Mc SIDDHAM VOWEL SIGN AI + +# Indic_Positional_Category=Top_And_Left_And_Right + +0B4C ; Top_And_Left_And_Right # Mc ORIYA VOWEL SIGN AU +0DDD ; Top_And_Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA +17BF ; Top_And_Left_And_Right # Mc KHMER VOWEL SIGN YA +115BB ; Top_And_Left_And_Right # Mc SIDDHAM VOWEL SIGN AU + +# Indic_Positional_Category=Bottom_And_Right + +1B3B ; Bottom_And_Right # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +A9C0 ; Bottom_And_Right # Mc JAVANESE PANGKON + +# Indic_Positional_Category=Top_And_Bottom_And_Right + +1B3D ; Top_And_Bottom_And_Right # Mc BALINESE VOWEL SIGN LA LENGA TEDUNG + +# Indic_Positional_Category=Overstruck + +1CD4 ; Overstruck # Mn VEDIC SIGN YAJURVEDIC MIDLINE SVARITA +1CE2..1CE8 ; Overstruck # Mn [7] VEDIC SIGN VISARGA SVARITA..VEDIC SIGN VISARGA ANUDATTA WITH TAIL +10A01 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN I +10A06 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN O + +# EOF diff --git a/data/8.0.0-indic-syllabic-category.txt b/data/8.0.0-indic-syllabic-category.txt new file mode 100644 
index 0000000..d7834f3 --- /dev/null +++ b/data/8.0.0-indic-syllabic-category.txt @@ -0,0 +1,1121 @@ +# IndicSyllabicCategory-8.0.0.txt +# Date: 2015-05-12, 10:00:00 GMT [RP, KW, LI] +# +# Unicode Character Database +# Copyright (c) 1991-2015 Unicode, Inc. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Syllabic_Category enumerated property +# +# Scope: This property is aimed at two general problem +# areas involving the analysis and processing of Indic scripts: +# +# 1. Specification of syllabic structure. +# 2. Specification of segmentation rules. +# +# Both of these problem areas may benefit from having defined subtypes +# of Indic script characters which are relevant to how Indic +# syllables (or aksaras) are constructed. Note that rules for +# syllabic structure in Indic scripts may differ significantly +# from how phonological syllables are defined. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Syllabic_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. 
+# +# The scripts assessed as Indic in the structural sense used for the +# Indic_Syllabic_Category are the following: +# +# Ahom, Balinese, Batak, Bengali, Brahmi, Buginese, Buhid, Chakma, +# Cham, Devanagari, Grantha, Gujarati, Gurmukhi, Hanunoo, Javanese, +# Kaithi, Kannada, Kayah Li, Kharoshthi, Khmer, Khojki, Khudawadi, +# Lao, Lepcha, Limbu, Mahajani, Malayalam, Meetei Mayek, Modi, +# Multani, Myanmar, New Tai Lue, Oriya, Phags-pa, Rejang, Saurashtra, +# Sharada, Siddham, Sinhala, Sundanese, Syloti Nagri, Tagalog, +# Tagbanwa, Tai Le, Tai Tham, Tai Viet, Takri, Tamil, Telugu, Thai, +# Tibetan, and Tirhuta. +# +# All characters for all other scripts not in that list +# take the default value for this property, unless they +# are individually listed in this data file. +# + +# ================================================ + +# Property: Indic_Syllabic_Category +# +# All code points not explicitly listed for Indic_Syllabic_Category +# have the value Other. +# +# @missing: 0000..10FFFF; Other + +# ================================================ + +# Indic_Syllabic_Category=Bindu + +# Bindu/Anusvara (nasalization or -n) +# Excludes various Vedic nasalization signs. 
+ +# [Not derivable] + +0900..0902 ; Bindu # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +0981 ; Bindu # Mn BENGALI SIGN CANDRABINDU +0982 ; Bindu # Mc BENGALI SIGN ANUSVARA +0A01..0A02 ; Bindu # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A70 ; Bindu # Mn GURMUKHI TIPPI +0A81..0A82 ; Bindu # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0B01 ; Bindu # Mn ORIYA SIGN CANDRABINDU +0B02 ; Bindu # Mc ORIYA SIGN ANUSVARA +0B82 ; Bindu # Mn TAMIL SIGN ANUSVARA +0C00 ; Bindu # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C01..0C02 ; Bindu # Mc [2] TELUGU SIGN CANDRABINDU..TELUGU SIGN ANUSVARA +0C81 ; Bindu # Mn KANNADA SIGN CANDRABINDU +0C82 ; Bindu # Mc KANNADA SIGN ANUSVARA +0D01 ; Bindu # Mn MALAYALAM SIGN CANDRABINDU +0D02 ; Bindu # Mc MALAYALAM SIGN ANUSVARA +0D82 ; Bindu # Mc SINHALA SIGN ANUSVARAYA +0E4D ; Bindu # Mn THAI CHARACTER NIKHAHIT +0ECD ; Bindu # Mn LAO NIGGAHITA +0F7E ; Bindu # Mn TIBETAN SIGN RJES SU NGA RO +0F82..0F83 ; Bindu # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +1036 ; Bindu # Mn MYANMAR SIGN ANUSVARA +17C6 ; Bindu # Mn KHMER SIGN NIKAHIT +1932 ; Bindu # Mn LIMBU SMALL LETTER ANUSVARA +1B00..1B02 ; Bindu # Mn [3] BALINESE SIGN ULU RICEM..BALINESE SIGN CECEK +1B80 ; Bindu # Mn SUNDANESE SIGN PANYECEK +1C34..1C35 ; Bindu # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A80B ; Bindu # Mn SYLOTI NAGRI SIGN ANUSVARA +A873 ; Bindu # Lo PHAGS-PA LETTER CANDRABINDU +A880 ; Bindu # Mc SAURASHTRA SIGN ANUSVARA +A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK +10A0E ; Bindu # Mn KHAROSHTHI SIGN ANUSVARA +11000 ; Bindu # Mc BRAHMI SIGN CANDRABINDU +11001 ; Bindu # Mn BRAHMI SIGN ANUSVARA +11080..11081 ; Bindu # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +11100..11101 ; Bindu # Mn [2] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN ANUSVARA +11180..11181 ; Bindu # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +11234 ; Bindu # Mn KHOJKI SIGN 
ANUSVARA +112DF ; Bindu # Mn KHUDAWADI SIGN ANUSVARA +11300..11301 ; Bindu # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11302 ; Bindu # Mc GRANTHA SIGN ANUSVARA +114BF..114C0 ; Bindu # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Bindu # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +1163D ; Bindu # Mn MODI SIGN ANUSVARA +116AB ; Bindu # Mn TAKRI SIGN ANUSVARA + +# ================================================ + +# Indic_Syllabic_Category=Visarga + +# Visarga (-h) +# Includes specialized case for Sanskrit: ardhavisarga +# Excludes letters for jihvamuliya and upadhmaniya, which are +# related, but structured somewhat differently. + +# [Not derivable] + +0903 ; Visarga # Mc DEVANAGARI SIGN VISARGA +0983 ; Visarga # Mc BENGALI SIGN VISARGA +0A03 ; Visarga # Mc GURMUKHI SIGN VISARGA +0A83 ; Visarga # Mc GUJARATI SIGN VISARGA +0B03 ; Visarga # Mc ORIYA SIGN VISARGA +0C03 ; Visarga # Mc TELUGU SIGN VISARGA +0C83 ; Visarga # Mc KANNADA SIGN VISARGA +0D03 ; Visarga # Mc MALAYALAM SIGN VISARGA +0D83 ; Visarga # Mc SINHALA SIGN VISARGAYA +0F7F ; Visarga # Mc TIBETAN SIGN RNAM BCAD +1038 ; Visarga # Mc MYANMAR SIGN VISARGA +17C7 ; Visarga # Mc KHMER SIGN REAHMUK +1B04 ; Visarga # Mc BALINESE SIGN BISAH +1B82 ; Visarga # Mc SUNDANESE SIGN PANGWISAD +1CF2..1CF3 ; Visarga # Mc [2] VEDIC SIGN ARDHAVISARGA..VEDIC SIGN ROTATED ARDHAVISARGA +A881 ; Visarga # Mc SAURASHTRA SIGN VISARGA +A983 ; Visarga # Mc JAVANESE SIGN WIGNYAN +AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA +10A0F ; Visarga # Mn KHAROSHTHI SIGN VISARGA +11002 ; Visarga # Mc BRAHMI SIGN VISARGA +11082 ; Visarga # Mc KAITHI SIGN VISARGA +11102 ; Visarga # Mn CHAKMA SIGN VISARGA +11182 ; Visarga # Mc SHARADA SIGN VISARGA +11303 ; Visarga # Mc GRANTHA SIGN VISARGA +114C1 ; Visarga # Mc TIRHUTA SIGN VISARGA +115BE ; Visarga # Mc SIDDHAM SIGN VISARGA +1163E ; Visarga # Mc MODI SIGN VISARGA +116AC ; Visarga # Mc TAKRI SIGN VISARGA + +# 
================================================ + +# Indic_Syllabic_Category=Avagraha + +# Avagraha (elision of initial a- in sandhi) + +# [Not derivable] + +093D ; Avagraha # Lo DEVANAGARI SIGN AVAGRAHA +09BD ; Avagraha # Lo BENGALI SIGN AVAGRAHA +0ABD ; Avagraha # Lo GUJARATI SIGN AVAGRAHA +0B3D ; Avagraha # Lo ORIYA SIGN AVAGRAHA +0C3D ; Avagraha # Lo TELUGU SIGN AVAGRAHA +0CBD ; Avagraha # Lo KANNADA SIGN AVAGRAHA +0D3D ; Avagraha # Lo MALAYALAM SIGN AVAGRAHA +0F85 ; Avagraha # Po TIBETAN MARK PALUTA +17DC ; Avagraha # Lo KHMER SIGN AVAKRAHASANYA +1BBA ; Avagraha # Lo SUNDANESE AVAGRAHA +111C1 ; Avagraha # Lo SHARADA SIGN AVAGRAHA +1133D ; Avagraha # Lo GRANTHA SIGN AVAGRAHA +114C4 ; Avagraha # Lo TIRHUTA SIGN AVAGRAHA + +# ================================================ + +# Indic_Syllabic_Category=Nukta + +# Nukta (diacritic for borrowed consonants or other consonant +# modifications) + +# [Derivation: (ccc=7) + 0F39 + 10A38..10A3A - 1037] + +093C ; Nukta # Mn DEVANAGARI SIGN NUKTA +09BC ; Nukta # Mn BENGALI SIGN NUKTA +0A3C ; Nukta # Mn GURMUKHI SIGN NUKTA +0ABC ; Nukta # Mn GUJARATI SIGN NUKTA +0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0CBC ; Nukta # Mn KANNADA SIGN NUKTA +0F39 ; Nukta # Mn TIBETAN MARK TSA -PHRU +1B34 ; Nukta # Mn BALINESE SIGN REREKAN +1BE6 ; Nukta # Mn BATAK SIGN TOMPI +1C37 ; Nukta # Mn LEPCHA SIGN NUKTA +A9B3 ; Nukta # Mn JAVANESE SIGN CECAK TELU +10A38..10A3A ; Nukta # Mn [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW +110BA ; Nukta # Mn KAITHI SIGN NUKTA +11173 ; Nukta # Mn MAHAJANI SIGN NUKTA +111CA ; Nukta # Mn SHARADA SIGN NUKTA +11236 ; Nukta # Mn KHOJKI SIGN NUKTA +112E9 ; Nukta # Mn KHUDAWADI SIGN NUKTA +1133C ; Nukta # Mn GRANTHA SIGN NUKTA +114C3 ; Nukta # Mn TIRHUTA SIGN NUKTA +115C0 ; Nukta # Mn SIDDHAM SIGN NUKTA +116B7 ; Nukta # Mn TAKRI SIGN NUKTA + +# ================================================ + +# Indic_Syllabic_Category=Virama + +# Virama (killing of inherent vowel in consonant sequence +# or consonant 
stacker) +# Only includes characters that can act both as visible killer viramas +# and consonant stackers. Separate property values exist for characters +# that can only act as pure killers or only as consonant stackers. + +# [Derivation: (ccc=9) - (InSC=Pure_Killer) - (InSC=Invisible_Stacker) +# - (InSC=Number_Joiner) - 2D7F] + +094D ; Virama # Mn DEVANAGARI SIGN VIRAMA +09CD ; Virama # Mn BENGALI SIGN VIRAMA +0A4D ; Virama # Mn GURMUKHI SIGN VIRAMA +0ACD ; Virama # Mn GUJARATI SIGN VIRAMA +0B4D ; Virama # Mn ORIYA SIGN VIRAMA +0BCD ; Virama # Mn TAMIL SIGN VIRAMA +0C4D ; Virama # Mn TELUGU SIGN VIRAMA +0CCD ; Virama # Mn KANNADA SIGN VIRAMA +0D4D ; Virama # Mn MALAYALAM SIGN VIRAMA +0DCA ; Virama # Mn SINHALA SIGN AL-LAKUNA +1B44 ; Virama # Mc BALINESE ADEG ADEG +A8C4 ; Virama # Mn SAURASHTRA SIGN VIRAMA +A9C0 ; Virama # Mc JAVANESE PANGKON +11046 ; Virama # Mn BRAHMI VIRAMA +110B9 ; Virama # Mn KAITHI SIGN VIRAMA +111C0 ; Virama # Mc SHARADA SIGN VIRAMA +11235 ; Virama # Mc KHOJKI SIGN VIRAMA +1134D ; Virama # Mc GRANTHA SIGN VIRAMA +114C2 ; Virama # Mn TIRHUTA SIGN VIRAMA +115BF ; Virama # Mn SIDDHAM SIGN VIRAMA +1163F ; Virama # Mn MODI SIGN VIRAMA +116B6 ; Virama # Mc TAKRI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Pure_Killer + +# Pure killer (killing of inherent vowel in consonant sequence, +# with no consonant stacking behavior) + +# [Not derivable] + +0E3A ; Pure_Killer # Mn THAI CHARACTER PHINTHU +0E4E ; Pure_Killer # Mn THAI CHARACTER YAMAKKAN +0F84 ; Pure_Killer # Mn TIBETAN MARK HALANTA +103A ; Pure_Killer # Mn MYANMAR SIGN ASAT +1714 ; Pure_Killer # Mn TAGALOG SIGN VIRAMA +1734 ; Pure_Killer # Mn HANUNOO SIGN PAMUDPOD +17D1 ; Pure_Killer # Mn KHMER SIGN VIRIAM +1BAA ; Pure_Killer # Mc SUNDANESE SIGN PAMAAEH +1BF2..1BF3 ; Pure_Killer # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +A806 ; Pure_Killer # Mn SYLOTI NAGRI SIGN HASANTA +A953 ; Pure_Killer # Mc REJANG VIRAMA +ABED ; Pure_Killer # Mn MEETEI 
MAYEK APUN IYEK +11134 ; Pure_Killer # Mn CHAKMA MAAYYAA +112EA ; Pure_Killer # Mn KHUDAWADI SIGN VIRAMA +1172B ; Pure_Killer # Mn AHOM SIGN KILLER + +# ================================================ + +# Indic_Syllabic_Category=Invisible_Stacker + +# Invisible stacker (invisible consonant stacker virama) + +# [Not derivable] + +1039 ; Invisible_Stacker # Mn MYANMAR SIGN VIRAMA +17D2 ; Invisible_Stacker # Mn KHMER SIGN COENG +1A60 ; Invisible_Stacker # Mn TAI THAM SIGN SAKOT +1BAB ; Invisible_Stacker # Mn SUNDANESE SIGN VIRAMA +AAF6 ; Invisible_Stacker # Mn MEETEI MAYEK VIRAMA +10A3F ; Invisible_Stacker # Mn KHAROSHTHI VIRAMA +11133 ; Invisible_Stacker # Mn CHAKMA VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Independent + +# Independent Vowels (contrasted with matras) + +# [Not derivable] + +0904..0914 ; Vowel_Independent # Lo [17] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER AU +0960..0961 ; Vowel_Independent # Lo [2] DEVANAGARI LETTER VOCALIC RR..DEVANAGARI LETTER VOCALIC LL +0972..0977 ; Vowel_Independent # Lo [6] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER UUE +0985..098C ; Vowel_Independent # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L +098F..0990 ; Vowel_Independent # Lo [2] BENGALI LETTER E..BENGALI LETTER AI +0993..0994 ; Vowel_Independent # Lo [2] BENGALI LETTER O..BENGALI LETTER AU +09E0..09E1 ; Vowel_Independent # Lo [2] BENGALI LETTER VOCALIC RR..BENGALI LETTER VOCALIC LL +0A05..0A0A ; Vowel_Independent # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU +0A0F..0A10 ; Vowel_Independent # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI +0A13..0A14 ; Vowel_Independent # Lo [2] GURMUKHI LETTER OO..GURMUKHI LETTER AU +0A85..0A8D ; Vowel_Independent # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E +0A8F..0A91 ; Vowel_Independent # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O +0A93..0A94 ; Vowel_Independent # Lo [2] GUJARATI LETTER O..GUJARATI LETTER AU +0AE0..0AE1 ; Vowel_Independent # Lo [2] 
GUJARATI LETTER VOCALIC RR..GUJARATI LETTER VOCALIC LL +0B05..0B0C ; Vowel_Independent # Lo [8] ORIYA LETTER A..ORIYA LETTER VOCALIC L +0B0F..0B10 ; Vowel_Independent # Lo [2] ORIYA LETTER E..ORIYA LETTER AI +0B13..0B14 ; Vowel_Independent # Lo [2] ORIYA LETTER O..ORIYA LETTER AU +0B60..0B61 ; Vowel_Independent # Lo [2] ORIYA LETTER VOCALIC RR..ORIYA LETTER VOCALIC LL +0B85..0B8A ; Vowel_Independent # Lo [6] TAMIL LETTER A..TAMIL LETTER UU +0B8E..0B90 ; Vowel_Independent # Lo [3] TAMIL LETTER E..TAMIL LETTER AI +0B92..0B94 ; Vowel_Independent # Lo [3] TAMIL LETTER O..TAMIL LETTER AU +0C05..0C0C ; Vowel_Independent # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L +0C0E..0C10 ; Vowel_Independent # Lo [3] TELUGU LETTER E..TELUGU LETTER AI +0C12..0C14 ; Vowel_Independent # Lo [3] TELUGU LETTER O..TELUGU LETTER AU +0C60..0C61 ; Vowel_Independent # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL +0C85..0C8C ; Vowel_Independent # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L +0C8E..0C90 ; Vowel_Independent # Lo [3] KANNADA LETTER E..KANNADA LETTER AI +0C92..0C94 ; Vowel_Independent # Lo [3] KANNADA LETTER O..KANNADA LETTER AU +0CE0..0CE1 ; Vowel_Independent # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL +0D05..0D0C ; Vowel_Independent # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L +0D0E..0D10 ; Vowel_Independent # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI +0D12..0D14 ; Vowel_Independent # Lo [3] MALAYALAM LETTER O..MALAYALAM LETTER AU +0D5F..0D61 ; Vowel_Independent # Lo [3] MALAYALAM LETTER ARCHAIC II..MALAYALAM LETTER VOCALIC LL +0D85..0D96 ; Vowel_Independent # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA +1021..102A ; Vowel_Independent # Lo [10] MYANMAR LETTER A..MYANMAR LETTER AU +1052..1055 ; Vowel_Independent # Lo [4] MYANMAR LETTER VOCALIC R..MYANMAR LETTER VOCALIC LL +1700..1702 ; Vowel_Independent # Lo [3] TAGALOG LETTER A..TAGALOG LETTER U +1720..1722 ; Vowel_Independent # Lo [3] HANUNOO LETTER A..HANUNOO 
LETTER U +1740..1742 ; Vowel_Independent # Lo [3] BUHID LETTER A..BUHID LETTER U +1760..1762 ; Vowel_Independent # Lo [3] TAGBANWA LETTER A..TAGBANWA LETTER U +17A3..17B3 ; Vowel_Independent # Lo [17] KHMER INDEPENDENT VOWEL QAQ..KHMER INDEPENDENT VOWEL QAU +1A4D..1A52 ; Vowel_Independent # Lo [6] TAI THAM LETTER I..TAI THAM LETTER OO +1B05..1B12 ; Vowel_Independent # Lo [14] BALINESE LETTER AKARA..BALINESE LETTER OKARA TEDUNG +1B83..1B89 ; Vowel_Independent # Lo [7] SUNDANESE LETTER A..SUNDANESE LETTER EU +1BE4..1BE5 ; Vowel_Independent # Lo [2] BATAK LETTER I..BATAK LETTER U +A800..A801 ; Vowel_Independent # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I +A803..A805 ; Vowel_Independent # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O +A882..A891 ; Vowel_Independent # Lo [16] SAURASHTRA LETTER A..SAURASHTRA LETTER AU +A984..A988 ; Vowel_Independent # Lo [5] JAVANESE LETTER A..JAVANESE LETTER U +A98C..A98E ; Vowel_Independent # Lo [3] JAVANESE LETTER E..JAVANESE LETTER O +AA00..AA05 ; Vowel_Independent # Lo [6] CHAM LETTER A..CHAM LETTER O +AAE0..AAE1 ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER E..MEETEI MAYEK LETTER O +ABCE..ABCF ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER UN..MEETEI MAYEK LETTER I +ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA +11005..11012 ; Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU +11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER A..KAITHI LETTER AU +11103..11106 ; Vowel_Independent # Lo [4] CHAKMA LETTER AA..CHAKMA LETTER E +11183..11190 ; Vowel_Independent # Lo [14] SHARADA LETTER A..SHARADA LETTER AU +11200..11207 ; Vowel_Independent # Lo [8] KHOJKI LETTER A..KHOJKI LETTER AU +11280..11283 ; Vowel_Independent # Lo [4] MULTANI LETTER A..MULTANI LETTER E +112B0..112B9 ; Vowel_Independent # Lo [10] KHUDAWADI LETTER A..KHUDAWADI LETTER AU +11305..1130C ; Vowel_Independent # Lo [8] GRANTHA LETTER A..GRANTHA LETTER VOCALIC L +1130F..11310 ; Vowel_Independent # Lo [2] GRANTHA LETTER 
EE..GRANTHA LETTER AI +11313..11314 ; Vowel_Independent # Lo [2] GRANTHA LETTER OO..GRANTHA LETTER AU +11360..11361 ; Vowel_Independent # Lo [2] GRANTHA LETTER VOCALIC RR..GRANTHA LETTER VOCALIC LL +11481..1148E ; Vowel_Independent # Lo [14] TIRHUTA LETTER A..TIRHUTA LETTER AU +11580..1158D ; Vowel_Independent # Lo [14] SIDDHAM LETTER A..SIDDHAM LETTER AU +115D8..115DB ; Vowel_Independent # Lo [4] SIDDHAM LETTER THREE-CIRCLE ALTERNATE I..SIDDHAM LETTER ALTERNATE U +11600..1160D ; Vowel_Independent # Lo [14] MODI LETTER A..MODI LETTER AU +11680..11689 ; Vowel_Independent # Lo [10] TAKRI LETTER A..TAKRI LETTER AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Dependent + +# Dependent Vowels (contrasted with independent vowels and/or with complex placement) +# Matras (in Indic scripts) + +# [Not derivable] + +093A ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN OE +093B ; Vowel_Dependent # Mc DEVANAGARI VOWEL SIGN OOE +093E..0940 ; Vowel_Dependent # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II +0941..0948 ; Vowel_Dependent # Mn [8] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN AI +0949..094C ; Vowel_Dependent # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094E..094F ; Vowel_Dependent # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA E..DEVANAGARI VOWEL SIGN AW +0955..0957 ; Vowel_Dependent # Mn [3] DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Vowel_Dependent # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BE..09C0 ; Vowel_Dependent # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II +09C1..09C4 ; Vowel_Dependent # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09C7..09C8 ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +09CB..09CC ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +09D7 ; Vowel_Dependent # Mc BENGALI AU LENGTH MARK +09E2..09E3 ; Vowel_Dependent # Mn [2] BENGALI VOWEL 
SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3E..0A40 ; Vowel_Dependent # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II +0A41..0A42 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A47..0A48 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0ABE..0AC0 ; Vowel_Dependent # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL SIGN II +0AC1..0AC5 ; Vowel_Dependent # Mn [5] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AC9 ; Vowel_Dependent # Mc GUJARATI VOWEL SIGN CANDRA O +0ACB..0ACC ; Vowel_Dependent # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0AE2..0AE3 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3E ; Vowel_Dependent # Mc ORIYA VOWEL SIGN AA +0B3F ; Vowel_Dependent # Mn ORIYA VOWEL SIGN I +0B40 ; Vowel_Dependent # Mc ORIYA VOWEL SIGN II +0B41..0B44 ; Vowel_Dependent # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B47..0B48 ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI +0B4B..0B4C ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU +0B56 ; Vowel_Dependent # Mn ORIYA AI LENGTH MARK +0B57 ; Vowel_Dependent # Mc ORIYA AU LENGTH MARK +0B62..0B63 ; Vowel_Dependent # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BBE..0BBF ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC0 ; Vowel_Dependent # Mn TAMIL VOWEL SIGN II +0BC1..0BC2 ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BC6..0BC8 ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0BCA..0BCC ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0BD7 ; Vowel_Dependent # Mc TAMIL AU LENGTH MARK +0C3E..0C40 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C41..0C44 ; 
Vowel_Dependent # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C46..0C48 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI +0C4A..0C4C ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C55..0C56 ; Vowel_Dependent # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK +0C62..0C63 ; Vowel_Dependent # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBE ; Vowel_Dependent # Mc KANNADA VOWEL SIGN AA +0CBF ; Vowel_Dependent # Mn KANNADA VOWEL SIGN I +0CC0..0CC4 ; Vowel_Dependent # Mc [5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN VOCALIC RR +0CC6 ; Vowel_Dependent # Mn KANNADA VOWEL SIGN E +0CC7..0CC8 ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +0CCC ; Vowel_Dependent # Mn KANNADA VOWEL SIGN AU +0CD5..0CD6 ; Vowel_Dependent # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CE2..0CE3 ; Vowel_Dependent # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D3E..0D40 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D44 ; Vowel_Dependent # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D46..0D48 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0D4A..0D4C ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0D57 ; Vowel_Dependent # Mc MALAYALAM AU LENGTH MARK +0D62..0D63 ; Vowel_Dependent # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DCF..0DD1 ; Vowel_Dependent # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD2..0DD4 ; Vowel_Dependent # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Vowel_Dependent # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0DD8..0DDF ; Vowel_Dependent # Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Vowel_Dependent # Mc [2] SINHALA 
VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Vowel_Dependent # Lo THAI CHARACTER SARA A +0E31 ; Vowel_Dependent # Mn THAI CHARACTER MAI HAN-AKAT +0E32..0E33 ; Vowel_Dependent # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E34..0E39 ; Vowel_Dependent # Mn [6] THAI CHARACTER SARA I..THAI CHARACTER SARA UU +0E40..0E45 ; Vowel_Dependent # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO +0E47 ; Vowel_Dependent # Mn THAI CHARACTER MAITAIKHU +0EB0 ; Vowel_Dependent # Lo LAO VOWEL SIGN A +0EB1 ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KAN +0EB2..0EB3 ; Vowel_Dependent # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0EB4..0EB9 ; Vowel_Dependent # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU +0EBB ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KON +0EC0..0EC4 ; Vowel_Dependent # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +0F71..0F7D ; Vowel_Dependent # Mn [13] TIBETAN VOWEL SIGN AA..TIBETAN VOWEL SIGN OO +0F80..0F81 ; Vowel_Dependent # Mn [2] TIBETAN VOWEL SIGN REVERSED I..TIBETAN VOWEL SIGN REVERSED II +102B..102C ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +102D..1030 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN UU +1031 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN E +1032..1035 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +1056..1057 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1058..1059 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1062 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1071..1074 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1083..1084 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E +1085..1086 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN SHAN E 
ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109C ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN AITON A +109D ; Vowel_Dependent # Mn MYANMAR VOWEL SIGN AITON AI +1712..1713 ; Vowel_Dependent # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U +1732..1733 ; Vowel_Dependent # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1752..1753 ; Vowel_Dependent # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U +1772..1773 ; Vowel_Dependent # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U +17B6 ; Vowel_Dependent # Mc KHMER VOWEL SIGN AA +17B7..17BD ; Vowel_Dependent # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL SIGN UA +17BE..17C5 ; Vowel_Dependent # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU +17C8 ; Vowel_Dependent # Mc KHMER SIGN YUUKALEAPINTU +1920..1922 ; Vowel_Dependent # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U +1923..1926 ; Vowel_Dependent # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU +1927..1928 ; Vowel_Dependent # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Vowel_Dependent # Mn LIMBU SIGN KEMPHRENG +19B0..19C0 ; Vowel_Dependent # Lo [17] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN IY +1A17..1A18 ; Vowel_Dependent # Mn [2] BUGINESE VOWEL SIGN I..BUGINESE VOWEL SIGN U +1A19..1A1A ; Vowel_Dependent # Mc [2] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN O +1A1B ; Vowel_Dependent # Mn BUGINESE VOWEL SIGN AE +1A61 ; Vowel_Dependent # Mc TAI THAM VOWEL SIGN A +1A62 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN MAI SAT +1A63..1A64 ; Vowel_Dependent # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A65..1A6C ; Vowel_Dependent # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW +1A6D..1A72 ; Vowel_Dependent # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI +1A73..1A74 ; Vowel_Dependent # Mn [2] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN MAI KANG +1B35 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN TEDUNG +1B36..1B3A ; Vowel_Dependent # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA +1B3B ; Vowel_Dependent # 
Mc BALINESE VOWEL SIGN RA REPA TEDUNG +1B3C ; Vowel_Dependent # Mn BALINESE VOWEL SIGN LA LENGA +1B3D..1B41 ; Vowel_Dependent # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1B42 ; Vowel_Dependent # Mn BALINESE VOWEL SIGN PEPET +1B43 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN PEPET TEDUNG +1BA4..1BA5 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PANGHULU..SUNDANESE VOWEL SIGN PANYUKU +1BA6..1BA7 ; Vowel_Dependent # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL SIGN PANOLONG +1BA8..1BA9 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE7 ; Vowel_Dependent # Mc BATAK VOWEL SIGN E +1BE8..1BE9 ; Vowel_Dependent # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BEA..1BEC ; Vowel_Dependent # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BED ; Vowel_Dependent # Mn BATAK VOWEL SIGN KARO O +1BEE ; Vowel_Dependent # Mc BATAK VOWEL SIGN U +1BEF ; Vowel_Dependent # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +1C26..1C2B ; Vowel_Dependent # Mc [6] LEPCHA VOWEL SIGN AA..LEPCHA VOWEL SIGN UU +1C2C ; Vowel_Dependent # Mn LEPCHA VOWEL SIGN E +A823..A824 ; Vowel_Dependent # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A825..A826 ; Vowel_Dependent # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E +A827 ; Vowel_Dependent # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Vowel_Dependent # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A947..A94E ; Vowel_Dependent # Mn [8] REJANG VOWEL SIGN I..REJANG VOWEL SIGN EA +A9B4..A9B5 ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9B6..A9B9 ; Vowel_Dependent # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BA..A9BB ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +A9BC ; Vowel_Dependent # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Vowel_Dependent # Mn MYANMAR SIGN SHAN SAW +AA29..AA2E ; Vowel_Dependent # Mn [6] CHAM VOWEL 
SIGN AA..CHAM VOWEL SIGN OE +AA2F..AA30 ; Vowel_Dependent # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA31..AA32 ; Vowel_Dependent # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE +AAB0 ; Vowel_Dependent # Mn TAI VIET MAI KANG +AAB1 ; Vowel_Dependent # Lo TAI VIET VOWEL AA +AAB2..AAB4 ; Vowel_Dependent # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U +AAB5..AAB6 ; Vowel_Dependent # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB7..AAB8 ; Vowel_Dependent # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AAB9..AABD ; Vowel_Dependent # Lo [5] TAI VIET VOWEL UEA..TAI VIET VOWEL AN +AABE ; Vowel_Dependent # Mn TAI VIET VOWEL AM +AAEB ; Vowel_Dependent # Mc MEETEI MAYEK VOWEL SIGN II +AAEC..AAED ; Vowel_Dependent # Mn [2] MEETEI MAYEK VOWEL SIGN UU..MEETEI MAYEK VOWEL SIGN AAI +AAEE..AAEF ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN AU..MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE5 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN ANAP +ABE6..ABE7 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE8 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +10A01..10A03 ; Vowel_Dependent # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R +10A05..10A06 ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O +10A0C..10A0D ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN DOUBLE RING BELOW +11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +110B0..110B2 ; Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II +110B3..110B6 ; Vowel_Dependent # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI +110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11127..1112B ; Vowel_Dependent # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU 
+1112C ; Vowel_Dependent # Mc CHAKMA VOWEL SIGN E +1112D..11132 ; Vowel_Dependent # Mn [6] CHAKMA VOWEL SIGN AI..CHAKMA AU MARK +111B3..111B5 ; Vowel_Dependent # Mc [3] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN II +111B6..111BE ; Vowel_Dependent # Mn [9] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN O +111BF ; Vowel_Dependent # Mc SHARADA VOWEL SIGN AU +111CB..111CC ; Vowel_Dependent # Mn [2] SHARADA VOWEL MODIFIER MARK..SHARADA EXTRA SHORT VOWEL MARK +1122C..1122E ; Vowel_Dependent # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +1122F..11231 ; Vowel_Dependent # Mn [3] KHOJKI VOWEL SIGN U..KHOJKI VOWEL SIGN AI +11232..11233 ; Vowel_Dependent # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU +112E0..112E2 ; Vowel_Dependent # Mc [3] KHUDAWADI VOWEL SIGN AA..KHUDAWADI VOWEL SIGN II +112E3..112E8 ; Vowel_Dependent # Mn [6] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN AU +1133E..1133F ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11340 ; Vowel_Dependent # Mn GRANTHA VOWEL SIGN II +11341..11344 ; Vowel_Dependent # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +11347..11348 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +1134B..1134C ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +11357 ; Vowel_Dependent # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +114B0..114B2 ; Vowel_Dependent # Mc [3] TIRHUTA VOWEL SIGN AA..TIRHUTA VOWEL SIGN II +114B3..114B8 ; Vowel_Dependent # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114B9 ; Vowel_Dependent # Mc TIRHUTA VOWEL SIGN E +114BA ; Vowel_Dependent # Mn TIRHUTA VOWEL SIGN SHORT E +114BB..114BE ; Vowel_Dependent # Mc [4] TIRHUTA VOWEL SIGN AI..TIRHUTA VOWEL SIGN AU +115AF..115B1 ; Vowel_Dependent # Mc [3] SIDDHAM VOWEL SIGN AA..SIDDHAM VOWEL SIGN II +115B2..115B5 ; Vowel_Dependent # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR 
+115B8..115BB ; Vowel_Dependent # Mc [4] SIDDHAM VOWEL SIGN E..SIDDHAM VOWEL SIGN AU +115DC..115DD ; Vowel_Dependent # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11630..11632 ; Vowel_Dependent # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +11633..1163A ; Vowel_Dependent # Mn [8] MODI VOWEL SIGN U..MODI VOWEL SIGN AI +1163B..1163C ; Vowel_Dependent # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +11640 ; Vowel_Dependent # Mn MODI SIGN ARDHACANDRA +116AD ; Vowel_Dependent # Mn TAKRI VOWEL SIGN AA +116AE..116AF ; Vowel_Dependent # Mc [2] TAKRI VOWEL SIGN I..TAKRI VOWEL SIGN II +116B0..116B5 ; Vowel_Dependent # Mn [6] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN AU +11720..11721 ; Vowel_Dependent # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +11722..11725 ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN I..AHOM VOWEL SIGN UU +11726 ; Vowel_Dependent # Mc AHOM VOWEL SIGN E +11727..1172A ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN AW..AHOM VOWEL SIGN AM + +# ================================================ + +# Indic_Syllabic_Category=Vowel + +# (Other) Vowels (reanalyzed as ordinary alphabetic letters or marks) + +# [Not derivable] + +1963..196D ; Vowel # Lo [11] TAI LE LETTER A..TAI LE LETTER AI +A85E..A861 ; Vowel # Lo [4] PHAGS-PA LETTER I..PHAGS-PA LETTER O +A866 ; Vowel # Lo PHAGS-PA LETTER EE +A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO +A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O +11150..11154 ; Vowel # Lo [5] MAHAJANI LETTER A..MAHAJANI LETTER O + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Placeholder + +# Consonant Placeholder +# This includes generic placeholders used for +# Indic script layout (NBSP and dotted circle), as well as a few script- +# specific vowel-holder characters which are not technically +# consonants, but serve instead as bases for placement of vowel marks. 
+ +# [Not derivable] + +002D ; Consonant_Placeholder # Pd HYPHEN-MINUS +00A0 ; Consonant_Placeholder # Zs NO-BREAK SPACE +00D7 ; Consonant_Placeholder # Sm MULTIPLICATION SIGN +0A72..0A73 ; Consonant_Placeholder # Lo [2] GURMUKHI IRI..GURMUKHI URA +104E ; Consonant_Placeholder # Po MYANMAR SYMBOL AFOREMENTIONED +1900 ; Consonant_Placeholder # Lo LIMBU VOWEL-CARRIER LETTER +2010..2014 ; Consonant_Placeholder # Pd [5] HYPHEN..EM DASH +25CC ; Consonant_Placeholder # So DOTTED CIRCLE + +# ================================================ + +# Indic_Syllabic_Category=Consonant + +# Consonant (ordinary abugida consonants, with inherent vowels) + +# [Not derivable] + +0915..0939 ; Consonant # Lo [37] DEVANAGARI LETTER KA..DEVANAGARI LETTER HA +0958..095F ; Consonant # Lo [8] DEVANAGARI LETTER QA..DEVANAGARI LETTER YYA +0978..097F ; Consonant # Lo [8] DEVANAGARI LETTER MARWARI DDA..DEVANAGARI LETTER BBA +0995..09A8 ; Consonant # Lo [20] BENGALI LETTER KA..BENGALI LETTER NA +09AA..09B0 ; Consonant # Lo [7] BENGALI LETTER PA..BENGALI LETTER RA +09B2 ; Consonant # Lo BENGALI LETTER LA +09B6..09B9 ; Consonant # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA +09DC..09DD ; Consonant # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA +09DF ; Consonant # Lo BENGALI LETTER YYA +09F0..09F1 ; Consonant # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH LOWER DIAGONAL +0A15..0A28 ; Consonant # Lo [20] GURMUKHI LETTER KA..GURMUKHI LETTER NA +0A2A..0A30 ; Consonant # Lo [7] GURMUKHI LETTER PA..GURMUKHI LETTER RA +0A32..0A33 ; Consonant # Lo [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA +0A35..0A36 ; Consonant # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA +0A38..0A39 ; Consonant # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA +0A59..0A5C ; Consonant # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA +0A5E ; Consonant # Lo GURMUKHI LETTER FA +0A95..0AA8 ; Consonant # Lo [20] GUJARATI LETTER KA..GUJARATI LETTER NA +0AAA..0AB0 ; Consonant # Lo [7] GUJARATI LETTER 
PA..GUJARATI LETTER RA +0AB2..0AB3 ; Consonant # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA +0AB5..0AB9 ; Consonant # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA +0AF9 ; Consonant # Lo GUJARATI LETTER ZHA +0B15..0B28 ; Consonant # Lo [20] ORIYA LETTER KA..ORIYA LETTER NA +0B2A..0B30 ; Consonant # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA +0B32..0B33 ; Consonant # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA +0B35..0B39 ; Consonant # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA +0B5C..0B5D ; Consonant # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA +0B5F ; Consonant # Lo ORIYA LETTER YYA +0B71 ; Consonant # Lo ORIYA LETTER WA +0B95 ; Consonant # Lo TAMIL LETTER KA +0B99..0B9A ; Consonant # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA +0B9C ; Consonant # Lo TAMIL LETTER JA +0B9E..0B9F ; Consonant # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA +0BA3..0BA4 ; Consonant # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA +0BA8..0BAA ; Consonant # Lo [3] TAMIL LETTER NA..TAMIL LETTER PA +0BAE..0BB9 ; Consonant # Lo [12] TAMIL LETTER MA..TAMIL LETTER HA +0C15..0C28 ; Consonant # Lo [20] TELUGU LETTER KA..TELUGU LETTER NA +0C2A..0C39 ; Consonant # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C58..0C5A ; Consonant # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C95..0CA8 ; Consonant # Lo [20] KANNADA LETTER KA..KANNADA LETTER NA +0CAA..0CB3 ; Consonant # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA +0CB5..0CB9 ; Consonant # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA +0CDE ; Consonant # Lo KANNADA LETTER FA +0D15..0D3A ; Consonant # Lo [38] MALAYALAM LETTER KA..MALAYALAM LETTER TTTA +0D9A..0DB1 ; Consonant # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA +0DB3..0DBB ; Consonant # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA +0DBD ; Consonant # Lo SINHALA LETTER DANTAJA LAYANNA +0DC0..0DC6 ; Consonant # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA +0E01..0E2E ; Consonant # Lo [46] THAI CHARACTER KO KAI..THAI CHARACTER HO NOKHUK +0E81..0E82 ; 
Consonant # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG +0E84 ; Consonant # Lo LAO LETTER KHO TAM +0E87..0E88 ; Consonant # Lo [2] LAO LETTER NGO..LAO LETTER CO +0E8A ; Consonant # Lo LAO LETTER SO TAM +0E8D ; Consonant # Lo LAO LETTER NYO +0E94..0E97 ; Consonant # Lo [4] LAO LETTER DO..LAO LETTER THO TAM +0E99..0E9F ; Consonant # Lo [7] LAO LETTER NO..LAO LETTER FO SUNG +0EA1..0EA3 ; Consonant # Lo [3] LAO LETTER MO..LAO LETTER LO LING +0EA5 ; Consonant # Lo LAO LETTER LO LOOT +0EA7 ; Consonant # Lo LAO LETTER WO +0EAA..0EAB ; Consonant # Lo [2] LAO LETTER SO SUNG..LAO LETTER HO SUNG +0EAD..0EAE ; Consonant # Lo [2] LAO LETTER O..LAO LETTER HO TAM +0EDC..0EDF ; Consonant # Lo [4] LAO HO NO..LAO LETTER KHMU NYO +0F40..0F47 ; Consonant # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA +0F49..0F6C ; Consonant # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA +1000..1020 ; Consonant # Lo [33] MYANMAR LETTER KA..MYANMAR LETTER LLA +103F ; Consonant # Lo MYANMAR LETTER GREAT SA +1050..1051 ; Consonant # Lo [2] MYANMAR LETTER SHA..MYANMAR LETTER SSA +105A..105D ; Consonant # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE +1061 ; Consonant # Lo MYANMAR LETTER SGAW KAREN SHA +1065..1066 ; Consonant # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER WESTERN PWO KAREN PWA +106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA +1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA +108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA +1703..170C ; Consonant # Lo [10] TAGALOG LETTER KA..TAGALOG LETTER YA +170E..1711 ; Consonant # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1723..1731 ; Consonant # Lo [15] HANUNOO LETTER KA..HANUNOO LETTER HA +1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA +1763..176C ; Consonant # Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA +176E..1770 ; Consonant # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA +1780..17A2 ; Consonant # Lo [35] 
KHMER LETTER KA..KHMER LETTER QA +1901..191E ; Consonant # Lo [30] LIMBU LETTER KA..LIMBU LETTER TRA +1950..1962 ; Consonant # Lo [19] TAI LE LETTER KA..TAI LE LETTER NA +1980..19AB ; Consonant # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI LUE LETTER LOW SUA +1A00..1A16 ; Consonant # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA +1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA +1A53..1A54 ; Consonant # Lo [2] TAI THAM LETTER LAE..TAI THAM LETTER GREAT SA +1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA +1B45..1B4B ; Consonant # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA +1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA +1BBB..1BBD ; Consonant # Lo [3] SUNDANESE LETTER REU..SUNDANESE LETTER BHA +1BC0..1BE3 ; Consonant # Lo [36] BATAK LETTER A..BATAK LETTER MBA +1C00..1C23 ; Consonant # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A +1C4D..1C4F ; Consonant # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA +A807..A80A ; Consonant # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO +A80C..A822 ; Consonant # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO +A840..A85D ; Consonant # Lo [30] PHAGS-PA LETTER KA..PHAGS-PA LETTER A +A862..A865 ; Consonant # Lo [4] PHAGS-PA LETTER QA..PHAGS-PA LETTER GGA +A869..A870 ; Consonant # Lo [8] PHAGS-PA LETTER TTA..PHAGS-PA LETTER ASPIRATED FA +A872 ; Consonant # Lo PHAGS-PA SUPERFIXED LETTER RA +A892..A8B3 ; Consonant # Lo [34] SAURASHTRA LETTER KA..SAURASHTRA LETTER LLA +A90A..A921 ; Consonant # Lo [24] KAYAH LI LETTER KA..KAYAH LI LETTER CA +A930..A946 ; Consonant # Lo [23] REJANG LETTER KA..REJANG LETTER A +A989..A98B ; Consonant # Lo [3] JAVANESE LETTER PA CEREK..JAVANESE LETTER NGA LELET RASWADI +A98F..A9B2 ; Consonant # Lo [36] JAVANESE LETTER KA..JAVANESE LETTER HA +A9E0..A9E4 ; Consonant # Lo [5] MYANMAR LETTER SHAN GHA..MYANMAR LETTER SHAN BHA 
+A9E7..A9EF ; Consonant # Lo [9] MYANMAR LETTER TAI LAING NYA..MYANMAR LETTER TAI LAING NNA +A9FA..A9FE ; Consonant # Lo [5] MYANMAR LETTER TAI LAING LLA..MYANMAR LETTER TAI LAING BHA +AA06..AA28 ; Consonant # Lo [35] CHAM LETTER KA..CHAM LETTER HA +AA60..AA6F ; Consonant # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA +AA71..AA73 ; Consonant # Lo [3] MYANMAR LETTER KHAMTI XA..MYANMAR LETTER KHAMTI RA +AA7A ; Consonant # Lo MYANMAR LETTER AITON RA +AA7E..AA7F ; Consonant # Lo [2] MYANMAR LETTER SHWE PALAUNG CHA..MYANMAR LETTER SHWE PALAUNG SHA +AA80..AAAF ; Consonant # Lo [48] TAI VIET LETTER LOW KO..TAI VIET LETTER HIGH O +AAE2..AAEA ; Consonant # Lo [9] MEETEI MAYEK LETTER CHA..MEETEI MAYEK LETTER SSA +ABC0..ABCD ; Consonant # Lo [14] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER HUK +ABD0 ; Consonant # Lo MEETEI MAYEK LETTER PHAM +ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTER BHAM +10A00 ; Consonant # Lo KHAROSHTHI LETTER A +10A10..10A13 ; Consonant # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA +10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA +10A19..10A33 ; Consonant # Lo [27] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER TTTHA +11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER OLD TAMIL NNNA +1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA +11107..11126 ; Consonant # Lo [32] CHAKMA LETTER KAA..CHAKMA LETTER HAA +11155..11172 ; Consonant # Lo [30] MAHAJANI LETTER KA..MAHAJANI LETTER RRA +11191..111B2 ; Consonant # Lo [34] SHARADA LETTER KA..SHARADA LETTER HA +11208..11211 ; Consonant # Lo [10] KHOJKI LETTER KA..KHOJKI LETTER JJA +11213..1122B ; Consonant # Lo [25] KHOJKI LETTER NYA..KHOJKI LETTER LLA +11284..11286 ; Consonant # Lo [3] MULTANI LETTER KA..MULTANI LETTER GA +11288 ; Consonant # Lo MULTANI LETTER GHA +1128A..1128D ; Consonant # Lo [4] MULTANI LETTER CA..MULTANI LETTER JJA +1128F..1129D ; Consonant # Lo [15] MULTANI LETTER NYA..MULTANI 
LETTER BA +1129F..112A8 ; Consonant # Lo [10] MULTANI LETTER BHA..MULTANI LETTER RHA +112BA..112DE ; Consonant # Lo [37] KHUDAWADI LETTER KA..KHUDAWADI LETTER HA +11315..11328 ; Consonant # Lo [20] GRANTHA LETTER KA..GRANTHA LETTER NA +1132A..11330 ; Consonant # Lo [7] GRANTHA LETTER PA..GRANTHA LETTER RA +11332..11333 ; Consonant # Lo [2] GRANTHA LETTER LA..GRANTHA LETTER LLA +11335..11339 ; Consonant # Lo [5] GRANTHA LETTER VA..GRANTHA LETTER HA +1148F..114AF ; Consonant # Lo [33] TIRHUTA LETTER KA..TIRHUTA LETTER HA +1158E..115AE ; Consonant # Lo [33] SIDDHAM LETTER KA..SIDDHAM LETTER HA +1160E..1162F ; Consonant # Lo [34] MODI LETTER KA..MODI LETTER LLA +1168A..116AA ; Consonant # Lo [33] TAKRI LETTER KA..TAKRI LETTER RRA +11700..11719 ; Consonant # Lo [26] AHOM LETTER KA..AHOM LETTER JHA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Dead + +# Dead Consonant (special consonant with killed vowel) + +# [Not derivable] + +09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K + +# ================================================ + +# Indic_Syllabic_Category=Consonant_With_Stacker + +# Consonants that may make stacked ligatures with the next consonant +# without the use of a virama + +# [Not derivable] + +0CF1..0CF2 ; Consonant_With_Stacker # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA +11003..11004 ; Consonant_With_Stacker # Lo [2] BRAHMI SIGN JIHVAMULIYA..BRAHMI SIGN UPADHMANIYA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Prefixed + +# Cluster-intial consonants + +# [Not derivable] + +111C2..111C3 ; Consonant_Prefixed # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Preceding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when preceding the main consonant 
+ +# [Not derivable] + +0D4E ; Consonant_Preceding_Repha # Lo MALAYALAM LETTER DOT REPH + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Succeeding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when succeeding the main consonant + +# [Not derivable] + +17CC ; Consonant_Succeeding_Repha # Mn KHMER SIGN ROBAT +1B03 ; Consonant_Succeeding_Repha # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Succeeding_Repha # Mn SUNDANESE SIGN PANGLAYAR +A982 ; Consonant_Succeeding_Repha # Mn JAVANESE SIGN LAYAR + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Subjoined + +# Subjoined Consonant (C2 form subtending a base consonant in Tibetan, etc.) + +# [Not derivable] + +0F8D..0F97 ; Consonant_Subjoined # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Consonant_Subjoined # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +1929..192B ; Consonant_Subjoined # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1BA1 ; Consonant_Subjoined # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA2..1BA3 ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BAC..1BAD ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C24..1C25 ; Consonant_Subjoined # Mc [2] LEPCHA SUBJOINED LETTER YA..LEPCHA SUBJOINED LETTER RA +A867..A868 ; Consonant_Subjoined # Lo [2] PHAGS-PA SUBJOINED LETTER WA..PHAGS-PA SUBJOINED LETTER YA +A871 ; Consonant_Subjoined # Lo PHAGS-PA SUBJOINED LETTER RA +A9BD ; Consonant_Subjoined # Mc JAVANESE CONSONANT SIGN KERET + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Medial + +# Medial Consonant (medial liquid, occurring in clusters) + +# [Not derivable] + +0A75 ; Consonant_Medial # Mn GURMUKHI SIGN YAKASH +0EBC ; Consonant_Medial # Mn LAO SEMIVOWEL SIGN LO +0EBD ; 
Consonant_Medial # Lo LAO SEMIVOWEL SIGN NYO +103B..103C ; Consonant_Medial # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA +103D..103E ; Consonant_Medial # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +105E..1060 ; Consonant_Medial # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Consonant_Medial # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +1A55 ; Consonant_Medial # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A56 ; Consonant_Medial # Mn TAI THAM CONSONANT SIGN MEDIAL LA +A9BE..A9BF ; Consonant_Medial # Mc [2] JAVANESE CONSONANT SIGN PENGKAL..JAVANESE CONSONANT SIGN CAKRA +AA33..AA34 ; Consonant_Medial # Mc [2] CHAM CONSONANT SIGN YA..CHAM CONSONANT SIGN RA +AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +1171D..1171F ; Consonant_Medial # Mn [3] AHOM CONSONANT SIGN MEDIAL LA..AHOM CONSONANT SIGN MEDIAL LIGATING RA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Final + +# Final Consonant (special final forms which do not take vowels) + +# [Not derivable] + +1930..1931 ; Consonant_Final # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Consonant_Final # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +1939 ; Consonant_Final # Mn LIMBU SIGN MUKPHRENG +19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B +1A57 ; Consonant_Final # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A58..1A5E ; Consonant_Final # Mn [7] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN SA +1BBE..1BBF ; Consonant_Final # Lo [2] SUNDANESE LETTER FINAL K..SUNDANESE LETTER FINAL M +1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H +1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +A8B4 ; Consonant_Final # Mc SAURASHTRA CONSONANT SIGN HAARU +A94F..A951 ; Consonant_Final # Mn [3] REJANG 
CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A952 ; Consonant_Final # Mc REJANG CONSONANT SIGN H +AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG +AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG +AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS +AA4C ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL M +AA4D ; Consonant_Final # Mc CHAM CONSONANT SIGN FINAL H +ABDB..ABE2 ; Consonant_Final # Lo [8] MEETEI MAYEK LETTER KOK LONSUM..MEETEI MAYEK LETTER I LONSUM + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Head_Letter + +# Head Letter (Tibetan) + +# [Not derivable] + +0F88..0F8C ; Consonant_Head_Letter # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN + +# ================================================ + +# Indic_Syllabic_Category=Modifying_Letter + +# Reanalyzed letters not participating in the abugida structure, but +# serving to modify the sound of an adjacent vowel or consonant. +# Note that this is not the same as General_Category=Modifier_Letter. 
+ +# [Not derivable] + +0B83 ; Modifying_Letter # Lo TAMIL SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Tone_Letter + +# Tone Letter (spacing lexical tone mark with status as a letter) + +# [Not derivable] + +1970..1974 ; Tone_Letter # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6 +AAC0 ; Tone_Letter # Lo TAI VIET TONE MAI NUENG +AAC2 ; Tone_Letter # Lo TAI VIET TONE MAI SONG + +# ================================================ + +# Indic_Syllabic_Category=Tone_Mark + +# Tone Mark (nonspacing or spacing lexical tone mark) + +# [Not derivable] + +0E48..0E4B ; Tone_Mark # Mn [4] THAI CHARACTER MAI EK..THAI CHARACTER MAI CHATTAWA +0EC8..0ECB ; Tone_Mark # Mn [4] LAO TONE MAI EK..LAO TONE MAI CATAWA +1037 ; Tone_Mark # Mn MYANMAR SIGN DOT BELOW +1063..1064 ; Tone_Mark # Mc [2] MYANMAR TONE MARK SGAW KAREN HATHI..MYANMAR TONE MARK SGAW KAREN KE PHO +1069..106D ; Tone_Mark # Mc [5] MYANMAR SIGN WESTERN PWO KAREN TONE-1..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1087..108C ; Tone_Mark # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108D ; Tone_Mark # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +108F ; Tone_Mark # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109B ; Tone_Mark # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 +19C8..19C9 ; Tone_Mark # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A75..1A79 ; Tone_Mark # Mn [5] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN TONE-5 +A92B..A92D ; Tone_Mark # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +AA7B ; Tone_Mark # Mc MYANMAR SIGN PAO KAREN TONE +AA7C ; Tone_Mark # Mn MYANMAR SIGN TAI LAING TONE-2 +AA7D ; Tone_Mark # Mc MYANMAR SIGN TAI LAING TONE-5 +AABF ; Tone_Mark # Mn TAI VIET TONE MAI EK +AAC1 ; Tone_Mark # Mn TAI VIET TONE MAI THO +ABEC ; Tone_Mark # Mc MEETEI MAYEK LUM IYEK + +# ================================================ + +# Indic_Syllabic_Category=Gemination_Mark + +# Gemination Mark (doubling of the 
preceding or following consonant) + +# [Not derivable] + +0A71 ; Gemination_Mark # Mn GURMUKHI ADDAK +11237 ; Gemination_Mark # Mn KHOJKI SIGN SHADDA + +# ================================================ + +# Indic_Syllabic_Category=Cantillation_Mark + +# Cantillation Mark (recitation marks, such as svara markers for the Samaveda) + +# [Not derivable] + +0951..0952 ; Cantillation_Mark # Mn [2] DEVANAGARI STRESS SIGN UDATTA..DEVANAGARI STRESS SIGN ANUDATTA +1CD0..1CD2 ; Cantillation_Mark # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CD4..1CE0 ; Cantillation_Mark # Mn [13] VEDIC SIGN YAJURVEDIC MIDLINE SVARITA..VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CE1 ; Cantillation_Mark # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF4 ; Cantillation_Mark # Mn VEDIC TONE CANDRA ABOVE +1CF8..1CF9 ; Cantillation_Mark # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE +A8E0..A8F1 ; Cantillation_Mark # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +11366..1136C ; Cantillation_Mark # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Cantillation_Mark # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA + +# ================================================ + +# Indic_Syllabic_Category=Register_Shifter + +# Register Shifter (shifts register for consonants, akin to a tone mark) + +# [Not derivable] + +17C9..17CA ; Register_Shifter # Mn [2] KHMER SIGN MUUSIKATOAN..KHMER SIGN TRIISAP + +# ================================================ + +# Indic_Syllabic_Category=Syllable_Modifier + +# Syllable Modifier (miscellaneous combining characters that modify +# something in the orthographic syllable they succeed) + +# [Not derivable] + +00B2..00B3 ; Syllable_Modifier # No [2] SUPERSCRIPT TWO..SUPERSCRIPT THREE +0F35 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0FC6 ; Syllable_Modifier # Mn TIBETAN SYMBOL PADMA GDAN 
+17CB ; Syllable_Modifier # Mn KHMER SIGN BANTOC +17CE..17D0 ; Syllable_Modifier # Mn [3] KHMER SIGN KAKABAT..KHMER SIGN SAMYOK SANNYA +17D3 ; Syllable_Modifier # Mn KHMER SIGN BATHAMASAT +193B ; Syllable_Modifier # Mn LIMBU SIGN SA-I +1A7A..1A7C ; Syllable_Modifier # Mn [3] TAI THAM SIGN RA HAAM..TAI THAM SIGN KHUEN-LUE KARAN +1A7F ; Syllable_Modifier # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1C36 ; Syllable_Modifier # Mn LEPCHA SIGN RAN +2074 ; Syllable_Modifier # No SUPERSCRIPT FOUR +2082..2084 ; Syllable_Modifier # No [3] SUBSCRIPT TWO..SUBSCRIPT FOUR + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Killer + +# Consonant Killer (signifies that the previous consonant or consonants are +# not pronounced) + +# [Not derivable] + +0E4C ; Consonant_Killer # Mn THAI CHARACTER THANTHAKHAT +17CD ; Consonant_Killer # Mn KHMER SIGN TOANDAKHIAT + +# ================================================ + +# Indic_Syllabic_Category=Non_Joiner + +# Non_Joiner (Zero Width Non-Joiner) + +# [Not derivable] + +200C ; Non_Joiner # Cf ZERO WIDTH NON-JOINER + +# ================================================ + +# Indic_Syllabic_Category=Joiner + +# Joiner (Zero Width Joiner) + +# [Not derivable] + +200D ; Joiner # Cf ZERO WIDTH JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number_Joiner + +# Number_Joiner (forms ligatures between numbers for multiplication) + +# [Not derivable] + +1107F ; Number_Joiner # Mn BRAHMI NUMBER JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number + +# Number (can be used as vowel-holders like consonant placeholders) + +# [Not derivable] + +0030..0039 ; Number # Nd [10] DIGIT ZERO..DIGIT NINE +0966..096F ; Number # Nd [10] DEVANAGARI DIGIT ZERO..DEVANAGARI DIGIT NINE +09E6..09EF ; Number # Nd [10] BENGALI DIGIT ZERO..BENGALI DIGIT NINE +0A66..0A6F ; Number # Nd [10] GURMUKHI DIGIT ZERO..GURMUKHI DIGIT NINE +0AE6..0AEF ; Number # 
Nd [10] GUJARATI DIGIT ZERO..GUJARATI DIGIT NINE +0B66..0B6F ; Number # Nd [10] ORIYA DIGIT ZERO..ORIYA DIGIT NINE +0BE6..0BEF ; Number # Nd [10] TAMIL DIGIT ZERO..TAMIL DIGIT NINE +0C66..0C6F ; Number # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE +0CE6..0CEF ; Number # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE +0D66..0D6F ; Number # Nd [10] MALAYALAM DIGIT ZERO..MALAYALAM DIGIT NINE +0DE6..0DEF ; Number # Nd [10] SINHALA LITH DIGIT ZERO..SINHALA LITH DIGIT NINE +0E50..0E59 ; Number # Nd [10] THAI DIGIT ZERO..THAI DIGIT NINE +0ED0..0ED9 ; Number # Nd [10] LAO DIGIT ZERO..LAO DIGIT NINE +0F20..0F29 ; Number # Nd [10] TIBETAN DIGIT ZERO..TIBETAN DIGIT NINE +0F2A..0F33 ; Number # No [10] TIBETAN DIGIT HALF ONE..TIBETAN DIGIT HALF ZERO +1040..1049 ; Number # Nd [10] MYANMAR DIGIT ZERO..MYANMAR DIGIT NINE +1090..1099 ; Number # Nd [10] MYANMAR SHAN DIGIT ZERO..MYANMAR SHAN DIGIT NINE +17E0..17E9 ; Number # Nd [10] KHMER DIGIT ZERO..KHMER DIGIT NINE +1946..194F ; Number # Nd [10] LIMBU DIGIT ZERO..LIMBU DIGIT NINE +19D0..19D9 ; Number # Nd [10] NEW TAI LUE DIGIT ZERO..NEW TAI LUE DIGIT NINE +1A80..1A89 ; Number # Nd [10] TAI THAM HORA DIGIT ZERO..TAI THAM HORA DIGIT NINE +1A90..1A99 ; Number # Nd [10] TAI THAM THAM DIGIT ZERO..TAI THAM THAM DIGIT NINE +1B50..1B59 ; Number # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE +1BB0..1BB9 ; Number # Nd [10] SUNDANESE DIGIT ZERO..SUNDANESE DIGIT NINE +1C40..1C49 ; Number # Nd [10] LEPCHA DIGIT ZERO..LEPCHA DIGIT NINE +A8D0..A8D9 ; Number # Nd [10] SAURASHTRA DIGIT ZERO..SAURASHTRA DIGIT NINE +A900..A909 ; Number # Nd [10] KAYAH LI DIGIT ZERO..KAYAH LI DIGIT NINE +A9D0..A9D9 ; Number # Nd [10] JAVANESE DIGIT ZERO..JAVANESE DIGIT NINE +A9F0..A9F9 ; Number # Nd [10] MYANMAR TAI LAING DIGIT ZERO..MYANMAR TAI LAING DIGIT NINE +AA50..AA59 ; Number # Nd [10] CHAM DIGIT ZERO..CHAM DIGIT NINE +ABF0..ABF9 ; Number # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE +10A40..10A47 ; Number # No [8] KHAROSHTHI DIGIT 
ONE..KHAROSHTHI NUMBER ONE THOUSAND +11066..1106F ; Number # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11136..1113F ; Number # Nd [10] CHAKMA DIGIT ZERO..CHAKMA DIGIT NINE +111D0..111D9 ; Number # Nd [10] SHARADA DIGIT ZERO..SHARADA DIGIT NINE +111E1..111F4 ; Number # No [20] SINHALA ARCHAIC DIGIT ONE..SINHALA ARCHAIC NUMBER ONE THOUSAND +112F0..112F9 ; Number # Nd [10] KHUDAWADI DIGIT ZERO..KHUDAWADI DIGIT NINE +114D0..114D9 ; Number # Nd [10] TIRHUTA DIGIT ZERO..TIRHUTA DIGIT NINE +11650..11659 ; Number # Nd [10] MODI DIGIT ZERO..MODI DIGIT NINE +116C0..116C9 ; Number # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE +11730..11739 ; Number # Nd [10] AHOM DIGIT ZERO..AHOM DIGIT NINE +1173A..1173B ; Number # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY + +# ================================================ + +# Indic_Syllabic_Category=Brahmi_Joining_Number + +# Brahmi Joining Number (similar to Number in that in can be used as +# vowel-holders like Consonant_Placeholder, but may also be joined by +# a Number_Joiner of the same script, e.g. in Brahmi) + +# [Not derivable] + +11052..11065 ; Brahmi_Joining_Number # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND + +# EOF diff --git a/data/9.0.0-indic-positional-category.txt b/data/9.0.0-indic-positional-category.txt new file mode 100644 index 0000000..16a8268 --- /dev/null +++ b/data/9.0.0-indic-positional-category.txt @@ -0,0 +1,663 @@ +# IndicPositionalCategory-9.0.0.txt +# Date: 2016-06-09, 19:33:00 GMT [RP] +# © 2016 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. 
+# For terms of use, see http://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Positional_Category enumerated property +# +# Scope: This property is aimed at the problem of +# the specification of syllabic structure for Indic scripts. +# Because dependent vowels (matras), visible viramas, and other +# characters are placed in notional slots around the consonant (or +# consonant cluster) core of an Indic syllable, there may be +# cooccurrence constraints or other interactions. Also, it may be +# desirable, in cases where more than one such character may occur in +# sequence, as for example, in a top slot and a bottom slot, to +# specify preferred orders for spelling. As such, this property +# is designed primarily to supplement the Indic_Syllabic_Category +# property. +# +# Note that this property is *not* intended as +# a prescriptive property regarding display or font design, +# for a number of reasons. Good font design requires information +# that is outside the context of a character encoding standard, +# and is best handled in other venues. For Indic dependent +# vowels and similar characters, in particular: +# +# 1. Matra placement may vary somewhat based on typeface design. +# 2. Matra placement, even within a single script, may vary +# somewhat according to historic period or local conventions. +# 3. Matra placement may be changed by explicit orthographic reform +# decisions. +# 4. Matras may ligate in various ways with a consonant (or even +# other elements of a syllable) instead of occurring in a +# discrete location. +# 5. Matra display may be contextually determined. This is +# notable, for example, in the Tamil script, where the shape +# and placement of -u and -uu vowels depends strongly on +# which consonant they adjoin. 
+# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Positional_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. +# +# The scripts assessed as containing dependent vowels or similar characters +# in the structural sense used for the Indic_Positional_Category are the +# following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Grantha, Gujarati, Gurmukhi, Hanunoo, +# Javanese, Kaithi, Kannada, Kharoshthi, Khmer, Khojki, Khudawadi, +# Lao, Lepcha, Limbu, Malayalam, Marchen, Meetei Mayek, Modi, +# Myanmar, Newa, New Tai Lue, Oriya, Rejang, Saurashtra, Sharada, +# Siddham, Sinhala, Sundanese, Syloti Nagri, Tagalog, Tagbanwa, Tai +# Tham, Tai Viet, Takri, Tamil, Telugu, Thai, Tibetan, and Tirhuta. +# +# All characters for all other scripts not in that list +# take the default value for this property. +# +# See IndicSyllabicCategory.txt for a slightly more extended +# list of Indic scripts, including those which do not have +# positional characters. Currently, those additional +# Indic scripts without positional characters are +# Kayah Li, Mahajani, Multani, Phags-pa, and Tai Le. +# +# Note: The following characters are all assigned the positional category +# Right, but may have different positions in some cases: +# * U+0BC1 TAMIL VOWEL SIGN U and U+0BC2 TAMIL VOWEL SIGN UU have +# contextually variable placement in Tamil. +# * U+0D41 MALAYALAM VOWEL SIGN U and U+0D42 MALAYALAM VOWEL SIGN UU form +# complex ligatures with consonants in older Malayalam orthography. +# * U+11341 GRANTHA VOWEL SIGN U and U+11342 GRANTHA VOWEL SIGN UU have +# contextually variable placement in Grantha. 
+ +# ================================================ + +# Property: Indic_Positional_Category +# +# All code points not explicitly listed for Indic_Positional_Category +# have the value NA (not applicable). +# +# @missing: 0000..10FFFF; NA + +# ------------------------------------------------ + +# Indic_Positional_Category=Right + +0903 ; Right # Mc DEVANAGARI SIGN VISARGA +093B ; Right # Mc DEVANAGARI VOWEL SIGN OOE +093E ; Right # Mc DEVANAGARI VOWEL SIGN AA +0940 ; Right # Mc DEVANAGARI VOWEL SIGN II +0949..094C ; Right # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094F ; Right # Mc DEVANAGARI VOWEL SIGN AW +0982..0983 ; Right # Mc [2] BENGALI SIGN ANUSVARA..BENGALI SIGN VISARGA +09BE ; Right # Mc BENGALI VOWEL SIGN AA +09C0 ; Right # Mc BENGALI VOWEL SIGN II +09D7 ; Right # Mc BENGALI AU LENGTH MARK +0A03 ; Right # Mc GURMUKHI SIGN VISARGA +0A3E ; Right # Mc GURMUKHI VOWEL SIGN AA +0A40 ; Right # Mc GURMUKHI VOWEL SIGN II +0A83 ; Right # Mc GUJARATI SIGN VISARGA +0ABE ; Right # Mc GUJARATI VOWEL SIGN AA +0AC0 ; Right # Mc GUJARATI VOWEL SIGN II +0ACB..0ACC ; Right # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0B02..0B03 ; Right # Mc [2] ORIYA SIGN ANUSVARA..ORIYA SIGN VISARGA +0B3E ; Right # Mc ORIYA VOWEL SIGN AA +0B40 ; Right # Mc ORIYA VOWEL SIGN II +0BBE..0BBF ; Right # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC1..0BC2 ; Right # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BD7 ; Right # Mc TAMIL AU LENGTH MARK +0C01..0C03 ; Right # Mc [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN VISARGA +0C41..0C44 ; Right # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C82..0C83 ; Right # Mc [2] KANNADA SIGN ANUSVARA..KANNADA SIGN VISARGA +0CBE ; Right # Mc KANNADA VOWEL SIGN AA +0CC1..0CC4 ; Right # Mc [4] KANNADA VOWEL SIGN U..KANNADA VOWEL SIGN VOCALIC RR +0CD5..0CD6 ; Right # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0D02..0D03 ; Right # Mc [2] MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA +0D3E..0D40 ; 
Right # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D42 ; Right # Mn [2] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN UU +0D57 ; Right # Mc MALAYALAM AU LENGTH MARK +0D82..0D83 ; Right # Mc [2] SINHALA SIGN ANUSVARAYA..SINHALA SIGN VISARGAYA +0DCF..0DD1 ; Right # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD8 ; Right # Mc SINHALA VOWEL SIGN GAETTA-PILLA +0DDF ; Right # Mc SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Right # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Right # Lo THAI CHARACTER SARA A +0E32..0E33 ; Right # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E45 ; Right # Lo THAI CHARACTER LAKKHANGYAO +0EB0 ; Right # Lo LAO VOWEL SIGN A +0EB2..0EB3 ; Right # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0F3E ; Right # Mc TIBETAN SIGN YAR TSHES +0F7F ; Right # Mc TIBETAN SIGN RNAM BCAD +102B..102C ; Right # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +1038 ; Right # Mc MYANMAR SIGN VISARGA +103B ; Right # Mc MYANMAR CONSONANT SIGN MEDIAL YA +1056..1057 ; Right # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1062..1064 ; Right # Mc [3] MYANMAR VOWEL SIGN SGAW KAREN EU..MYANMAR TONE MARK SGAW KAREN KE PHO +1067..106D ; Right # Mc [7] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1083 ; Right # Mc MYANMAR VOWEL SIGN SHAN AA +1087..108C ; Right # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108F ; Right # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109C ; Right # Mc [3] MYANMAR SIGN KHAMTI TONE-1..MYANMAR VOWEL SIGN AITON A +17B6 ; Right # Mc KHMER VOWEL SIGN AA +17C7..17C8 ; Right # Mc [2] KHMER SIGN REAHMUK..KHMER SIGN YUUKALEAPINTU +1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI +1929..192B ; Right # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1930..1931 ; Right # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 
; Right # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +19B0..19B4 ; Right # Lo [5] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN UU +19B8..19B9 ; Right # Lo [2] NEW TAI LUE VOWEL SIGN OA..NEW TAI LUE VOWEL SIGN UE +19BB..19C0 ; Right # Lo [6] NEW TAI LUE VOWEL SIGN AAY..NEW TAI LUE VOWEL SIGN IY +19C8..19C9 ; Right # Lo [2] NEW TAI LUE TONE MARK-1..NEW TAI LUE TONE MARK-2 +1A1A ; Right # Mc BUGINESE VOWEL SIGN O +1A57 ; Right # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A61 ; Right # Mc TAI THAM VOWEL SIGN A +1A63..1A64 ; Right # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A6D ; Right # Mc TAI THAM VOWEL SIGN OY +1B04 ; Right # Mc BALINESE SIGN BISAH +1B35 ; Right # Mc BALINESE VOWEL SIGN TEDUNG +1B44 ; Right # Mc BALINESE ADEG ADEG +1B82 ; Right # Mc SUNDANESE SIGN PANGWISAD +1BA1 ; Right # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA7 ; Right # Mc SUNDANESE VOWEL SIGN PANOLONG +1BAA ; Right # Mc SUNDANESE SIGN PAMAAEH +1BE7 ; Right # Mc BATAK VOWEL SIGN E +1BEA..1BEC ; Right # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BEE ; Right # Mc BATAK VOWEL SIGN U +1BF2..1BF3 ; Right # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +1C24..1C26 ; Right # Mc [3] LEPCHA SUBJOINED LETTER YA..LEPCHA VOWEL SIGN AA +1C2A..1C2B ; Right # Mc [2] LEPCHA VOWEL SIGN U..LEPCHA VOWEL SIGN UU +1CE1 ; Right # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +A823..A824 ; Right # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A827 ; Right # Mc SYLOTI NAGRI VOWEL SIGN OO +A880..A881 ; Right # Mc [2] SAURASHTRA SIGN ANUSVARA..SAURASHTRA SIGN VISARGA +A8B4..A8C3 ; Right # Mc [16] SAURASHTRA CONSONANT SIGN HAARU..SAURASHTRA VOWEL SIGN AU +A952..A953 ; Right # Mc [2] REJANG CONSONANT SIGN H..REJANG VIRAMA +A983 ; Right # Mc JAVANESE SIGN WIGNYAN +A9B4..A9B5 ; Right # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9BD..A9BF ; Right # Mc [3] JAVANESE CONSONANT SIGN KERET..JAVANESE CONSONANT SIGN CAKRA +AA33 ; Right # Mc CHAM 
CONSONANT SIGN YA +AA4D ; Right # Mc CHAM CONSONANT SIGN FINAL H +AA7B ; Right # Mc MYANMAR SIGN PAO KAREN TONE +AA7D ; Right # Mc MYANMAR SIGN TAI LAING TONE-5 +AAB1 ; Right # Lo TAI VIET VOWEL AA +AABA ; Right # Lo TAI VIET VOWEL UA +AABD ; Right # Lo TAI VIET VOWEL AN +AAEF ; Right # Mc MEETEI MAYEK VOWEL SIGN AAU +AAF5 ; Right # Mc MEETEI MAYEK VOWEL SIGN VISARGA +ABE3..ABE4 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE6..ABE7 ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE9..ABEA ; Right # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +ABEC ; Right # Mc MEETEI MAYEK LUM IYEK +11000 ; Right # Mc BRAHMI SIGN CANDRABINDU +11002 ; Right # Mc BRAHMI SIGN VISARGA +11082 ; Right # Mc KAITHI SIGN VISARGA +110B0 ; Right # Mc KAITHI VOWEL SIGN AA +110B2 ; Right # Mc KAITHI VOWEL SIGN II +110B7..110B8 ; Right # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11182 ; Right # Mc SHARADA SIGN VISARGA +111B3 ; Right # Mc SHARADA VOWEL SIGN AA +111B5 ; Right # Mc SHARADA VOWEL SIGN II +111C0 ; Right # Mc SHARADA SIGN VIRAMA +1122C..1122E ; Right # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +11235 ; Right # Mc KHOJKI SIGN VIRAMA +112E0 ; Right # Mc KHUDAWADI VOWEL SIGN AA +112E2 ; Right # Mc KHUDAWADI VOWEL SIGN II +11302..11303 ; Right # Mc [2] GRANTHA SIGN ANUSVARA..GRANTHA SIGN VISARGA +1133E..1133F ; Right # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11341..11344 ; Right # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +1134D ; Right # Mc GRANTHA SIGN VIRAMA +11357 ; Right # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Right # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435 ; Right # Mc NEWA VOWEL SIGN AA +11437 ; Right # Mc NEWA VOWEL SIGN II +11440..11441 ; Right # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +11445 ; Right # Mc NEWA SIGN VISARGA +114B0 ; Right # Mc TIRHUTA VOWEL SIGN AA +114B2 ; Right # Mc TIRHUTA VOWEL SIGN 
II +114BD ; Right # Mc TIRHUTA VOWEL SIGN SHORT O +114C1 ; Right # Mc TIRHUTA SIGN VISARGA +115AF ; Right # Mc SIDDHAM VOWEL SIGN AA +115B1 ; Right # Mc SIDDHAM VOWEL SIGN II +115BE ; Right # Mc SIDDHAM SIGN VISARGA +11630..11632 ; Right # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +1163B..1163C ; Right # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +1163E ; Right # Mc MODI SIGN VISARGA +116AC ; Right # Mc TAKRI SIGN VISARGA +116AF ; Right # Mc TAKRI VOWEL SIGN II +116B6 ; Right # Mc TAKRI SIGN VIRAMA +11720..11721 ; Right # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +11C2F ; Right # Mc BHAIKSUKI VOWEL SIGN AA +11C3E ; Right # Mc BHAIKSUKI SIGN VISARGA +11CA9 ; Right # Mc MARCHEN SUBJOINED LETTER YA +11CB4 ; Right # Mc MARCHEN VOWEL SIGN O + +# Indic_Positional_Category=Left + +093F ; Left # Mc DEVANAGARI VOWEL SIGN I +094E ; Left # Mc DEVANAGARI VOWEL SIGN PRISHTHAMATRA E +09BF ; Left # Mc BENGALI VOWEL SIGN I +09C7..09C8 ; Left # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +0A3F ; Left # Mc GURMUKHI VOWEL SIGN I +0ABF ; Left # Mc GUJARATI VOWEL SIGN I +0B47 ; Left # Mc ORIYA VOWEL SIGN E +0BC6..0BC8 ; Left # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0D46..0D48 ; Left # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0DD9 ; Left # Mc SINHALA VOWEL SIGN KOMBUVA +0DDB ; Left # Mc SINHALA VOWEL SIGN KOMBU DEKA +0F3F ; Left # Mc TIBETAN SIGN MAR TSHES +1031 ; Left # Mc MYANMAR VOWEL SIGN E +1084 ; Left # Mc MYANMAR VOWEL SIGN SHAN E +17C1..17C3 ; Left # Mc [3] KHMER VOWEL SIGN E..KHMER VOWEL SIGN AI +1A19 ; Left # Mc BUGINESE VOWEL SIGN E +1A55 ; Left # Mc TAI THAM CONSONANT SIGN MEDIAL RA +1A6E..1A72 ; Left # Mc [5] TAI THAM VOWEL SIGN E..TAI THAM VOWEL SIGN THAM AI +1B3E..1B3F ; Left # Mc [2] BALINESE VOWEL SIGN TALING..BALINESE VOWEL SIGN TALING REPA +1BA6 ; Left # Mc SUNDANESE VOWEL SIGN PANAELAENG +1C27..1C28 ; Left # Mc [2] LEPCHA VOWEL SIGN I..LEPCHA VOWEL SIGN O +1C34..1C35 ; Left # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA 
CONSONANT SIGN KANG +A9BA..A9BB ; Left # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +AA2F..AA30 ; Left # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA34 ; Left # Mc CHAM CONSONANT SIGN RA +AAEB ; Left # Mc MEETEI MAYEK VOWEL SIGN II +AAEE ; Left # Mc MEETEI MAYEK VOWEL SIGN AU +110B1 ; Left # Mc KAITHI VOWEL SIGN I +1112C ; Left # Mc CHAKMA VOWEL SIGN E +111B4 ; Left # Mc SHARADA VOWEL SIGN I +112E1 ; Left # Mc KHUDAWADI VOWEL SIGN I +11347..11348 ; Left # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI +11436 ; Left # Mc NEWA VOWEL SIGN I +114B1 ; Left # Mc TIRHUTA VOWEL SIGN I +114B9 ; Left # Mc TIRHUTA VOWEL SIGN E +115B0 ; Left # Mc SIDDHAM VOWEL SIGN I +115B8 ; Left # Mc SIDDHAM VOWEL SIGN E +116AE ; Left # Mc TAKRI VOWEL SIGN I +11726 ; Left # Mc AHOM VOWEL SIGN E +11CB1 ; Left # Mc MARCHEN VOWEL SIGN I + +# Indic_Positional_Category=Visual_Order_Left + +# These are dependent vowels that occur to the left of the consonant +# letter in a syllable, but which occur in scripts using the visual order +# model, instead of the logical order model. Because of the different +# model, these left-side vowels occur first in the backing store (before +# the consonant letter) and are not reordered during text rendering. 
+# +# [Derivation: Logical_Order_Exception=Yes] + +0E40..0E44 ; Visual_Order_Left # Lo [5] THAI CHARACTER SARA E..THAI CHARACTER SARA AI MAIMALAI +0EC0..0EC4 ; Visual_Order_Left # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +19B5..19B7 ; Visual_Order_Left # Lo [3] NEW TAI LUE VOWEL SIGN E..NEW TAI LUE VOWEL SIGN O +19BA ; Visual_Order_Left # Lo NEW TAI LUE VOWEL SIGN AY +AAB5..AAB6 ; Visual_Order_Left # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB9 ; Visual_Order_Left # Lo TAI VIET VOWEL UEA +AABB..AABC ; Visual_Order_Left # Lo [2] TAI VIET VOWEL AUE..TAI VIET VOWEL AY + +# Indic_Positional_Category=Left_And_Right + +09CB..09CC ; Left_And_Right # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +0B4B ; Left_And_Right # Mc ORIYA VOWEL SIGN O +0BCA..0BCC ; Left_And_Right # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0D4A..0D4C ; Left_And_Right # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0DDC ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA AELA-PILLA +0DDE ; Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA GAYANUKITTA +17C0 ; Left_And_Right # Mc KHMER VOWEL SIGN IE +17C4..17C5 ; Left_And_Right # Mc [2] KHMER VOWEL SIGN OO..KHMER VOWEL SIGN AU +1B40..1B41 ; Left_And_Right # Mc [2] BALINESE VOWEL SIGN TALING TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1134B..1134C ; Left_And_Right # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +114BC ; Left_And_Right # Mc TIRHUTA VOWEL SIGN O +114BE ; Left_And_Right # Mc TIRHUTA VOWEL SIGN AU +115BA ; Left_And_Right # Mc SIDDHAM VOWEL SIGN O + +# Indic_Positional_Category=Top + +0900..0902 ; Top # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +093A ; Top # Mn DEVANAGARI VOWEL SIGN OE +0945..0948 ; Top # Mn [4] DEVANAGARI VOWEL SIGN CANDRA E..DEVANAGARI VOWEL SIGN AI +0951 ; Top # Mn DEVANAGARI STRESS SIGN UDATTA +0953..0955 ; Top # Mn [3] DEVANAGARI GRAVE ACCENT..DEVANAGARI VOWEL SIGN CANDRA LONG E +0981 ; Top # Mn BENGALI SIGN CANDRABINDU +0A01..0A02 ; Top # Mn [2] GURMUKHI 
SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A47..0A48 ; Top # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Top # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0A70..0A71 ; Top # Mn [2] GURMUKHI TIPPI..GURMUKHI ADDAK +0A81..0A82 ; Top # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0AC5 ; Top # Mn GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Top # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0B01 ; Top # Mn ORIYA SIGN CANDRABINDU +0B3F ; Top # Mn ORIYA VOWEL SIGN I +0B56 ; Top # Mn ORIYA AI LENGTH MARK +0B82 ; Top # Mn TAMIL SIGN ANUSVARA +0BC0 ; Top # Mn TAMIL VOWEL SIGN II +0BCD ; Top # Mn TAMIL SIGN VIRAMA +0C00 ; Top # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C3E..0C40 ; Top # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C46..0C47 ; Top # Mn [2] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN EE +0C4A..0C4D ; Top # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA +0C55 ; Top # Mn TELUGU LENGTH MARK +0C81 ; Top # Mn KANNADA SIGN CANDRABINDU +0CBF ; Top # Mn KANNADA VOWEL SIGN I +0CC6 ; Top # Mn KANNADA VOWEL SIGN E +0CCC..0CCD ; Top # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA +0D01 ; Top # Mn MALAYALAM SIGN CANDRABINDU +0D4D ; Top # Mn MALAYALAM SIGN VIRAMA +0DCA ; Top # Mn SINHALA SIGN AL-LAKUNA +0DD2..0DD3 ; Top # Mn [2] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN DIGA IS-PILLA +0E31 ; Top # Mn THAI CHARACTER MAI HAN-AKAT +0E34..0E37 ; Top # Mn [4] THAI CHARACTER SARA I..THAI CHARACTER SARA UEE +0E47..0E4E ; Top # Mn [8] THAI CHARACTER MAITAIKHU..THAI CHARACTER YAMAKKAN +0EB1 ; Top # Mn LAO VOWEL SIGN MAI KAN +0EB4..0EB7 ; Top # Mn [4] LAO VOWEL SIGN I..LAO VOWEL SIGN YY +0EBB ; Top # Mn LAO VOWEL SIGN MAI KON +0EC8..0ECD ; Top # Mn [6] LAO TONE MAI EK..LAO NIGGAHITA +0F39 ; Top # Mn TIBETAN MARK TSA -PHRU +0F72 ; Top # Mn TIBETAN VOWEL SIGN I +0F7A..0F7E ; Top # Mn [5] TIBETAN VOWEL SIGN E..TIBETAN SIGN RJES SU NGA RO +0F80 ; Top # Mn TIBETAN VOWEL SIGN REVERSED I +0F82..0F83 ; Top # Mn [2] 
TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +0F86..0F87 ; Top # Mn [2] TIBETAN SIGN LCI RTAGS..TIBETAN SIGN YANG RTAGS +102D..102E ; Top # Mn [2] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN II +1032..1036 ; Top # Mn [5] MYANMAR VOWEL SIGN AI..MYANMAR SIGN ANUSVARA +103A ; Top # Mn MYANMAR SIGN ASAT +1071..1074 ; Top # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1085..1086 ; Top # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109D ; Top # Mn MYANMAR VOWEL SIGN AITON AI +1712 ; Top # Mn TAGALOG VOWEL SIGN I +1732 ; Top # Mn HANUNOO VOWEL SIGN I +1752 ; Top # Mn BUHID VOWEL SIGN I +1772 ; Top # Mn TAGBANWA VOWEL SIGN I +17B7..17BA ; Top # Mn [4] KHMER VOWEL SIGN I..KHMER VOWEL SIGN YY +17C6 ; Top # Mn KHMER SIGN NIKAHIT +17C9..17D1 ; Top # Mn [9] KHMER SIGN MUUSIKATOAN..KHMER SIGN VIRIAM +17D3 ; Top # Mn KHMER SIGN BATHAMASAT +17DD ; Top # Mn KHMER SIGN ATTHACAN +1920..1921 ; Top # Mn [2] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN I +1927..1928 ; Top # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Top # Mn LIMBU SIGN KEMPHRENG +1A17 ; Top # Mn BUGINESE VOWEL SIGN I +1A1B ; Top # Mn BUGINESE VOWEL SIGN AE +1A58..1A5A ; Top # Mn [3] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN LOW PA +1A62 ; Top # Mn TAI THAM VOWEL SIGN MAI SAT +1A65..1A68 ; Top # Mn [4] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN UUE +1A6B ; Top # Mn TAI THAM VOWEL SIGN O +1A73..1A7C ; Top # Mn [10] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN KHUEN-LUE KARAN +1B00..1B03 ; Top # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG +1B34 ; Top # Mn BALINESE SIGN REREKAN +1B36..1B37 ; Top # Mn [2] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN ULU SARI +1B42 ; Top # Mn BALINESE VOWEL SIGN PEPET +1B6B ; Top # Mn BALINESE MUSICAL SYMBOL COMBINING TEGEH +1B6D..1B73 ; Top # Mn [7] BALINESE MUSICAL SYMBOL COMBINING KEMPUL..BALINESE MUSICAL SYMBOL COMBINING GONG +1B80..1B81 ; Top # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR +1BA4 ; Top 
# Mn SUNDANESE VOWEL SIGN PANGHULU +1BA8..1BA9 ; Top # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE6 ; Top # Mn BATAK SIGN TOMPI +1BE8..1BE9 ; Top # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BED ; Top # Mn BATAK VOWEL SIGN KARO O +1BEF..1BF1 ; Top # Mn [3] BATAK VOWEL SIGN U FOR SIMALUNGUN SA..BATAK CONSONANT SIGN H +1C2D..1C33 ; Top # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +1C36 ; Top # Mn LEPCHA SIGN RAN +1CD0..1CD2 ; Top # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CDA..1CDB ; Top # Mn [2] VEDIC TONE DOUBLE SVARITA..VEDIC TONE TRIPLE SVARITA +1CE0 ; Top # Mn VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CF4 ; Top # Mn VEDIC TONE CANDRA ABOVE +1DFB ; Top # Mn COMBINING DELETION MARK +A806 ; Top # Mn SYLOTI NAGRI SIGN HASANTA +A80B ; Top # Mn SYLOTI NAGRI SIGN ANUSVARA +A826 ; Top # Mn SYLOTI NAGRI VOWEL SIGN E +A8C5 ; Top # Mn SAURASHTRA SIGN CANDRABINDU +A8E0..A8F1 ; Top # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +A94A ; Top # Mn REJANG VOWEL SIGN AI +A94F..A951 ; Top # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A980..A982 ; Top # Mn [3] JAVANESE SIGN PANYANGGA..JAVANESE SIGN LAYAR +A9B3 ; Top # Mn JAVANESE SIGN CECAK TELU +A9B6..A9B7 ; Top # Mn [2] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN WULU MELIK +A9BC ; Top # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Top # Mn MYANMAR SIGN SHAN SAW +AA29..AA2C ; Top # Mn [4] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN EI +AA2E ; Top # Mn CHAM VOWEL SIGN OE +AA31 ; Top # Mn CHAM VOWEL SIGN AU +AA43 ; Top # Mn CHAM CONSONANT SIGN FINAL NG +AA4C ; Top # Mn CHAM CONSONANT SIGN FINAL M +AA7C ; Top # Mn MYANMAR SIGN TAI LAING TONE-2 +AAB0 ; Top # Mn TAI VIET MAI KANG +AAB2..AAB3 ; Top # Mn [2] TAI VIET VOWEL I..TAI VIET VOWEL UE +AAB7..AAB8 ; Top # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AABE..AABF ; Top # Mn [2] TAI VIET VOWEL AM..TAI VIET TONE MAI EK +AAC1 ; Top # Mn TAI VIET TONE MAI THO +AAED ; Top # Mn MEETEI 
MAYEK VOWEL SIGN AAI +ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP +10A05 ; Top # Mn KHAROSHTHI VOWEL SIGN E +10A0F ; Top # Mn KHAROSHTHI SIGN VISARGA +10A38 ; Top # Mn KHAROSHTHI SIGN BAR ABOVE +11001 ; Top # Mn BRAHMI SIGN ANUSVARA +11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II +11042..11046 ; Top # Mn [5] BRAHMI VOWEL SIGN E..BRAHMI VIRAMA +11080..11081 ; Top # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI VOWEL SIGN AI +11100..11102 ; Top # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA +11127..11129 ; Top # Mn [3] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN II +1112D ; Top # Mn CHAKMA VOWEL SIGN AI +11130 ; Top # Mn CHAKMA VOWEL SIGN OI +11134 ; Top # Mn CHAKMA MAAYYAA +11180..11181 ; Top # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA +111BC..111BE ; Top # Mn [3] SHARADA VOWEL SIGN E..SHARADA VOWEL SIGN O +111CB ; Top # Mn SHARADA VOWEL MODIFIER MARK +11230..11231 ; Top # Mn [2] KHOJKI VOWEL SIGN E..KHOJKI VOWEL SIGN AI +11234 ; Top # Mn KHOJKI SIGN ANUSVARA +11236..11237 ; Top # Mn [2] KHOJKI SIGN NUKTA..KHOJKI SIGN SHADDA +1123E ; Top # Mn KHOJKI SIGN SUKUN +112DF ; Top # Mn KHUDAWADI SIGN ANUSVARA +112E5..112E8 ; Top # Mn [4] KHUDAWADI VOWEL SIGN E..KHUDAWADI VOWEL SIGN AU +11301 ; Top # Mn GRANTHA SIGN CANDRABINDU +11340 ; Top # Mn GRANTHA VOWEL SIGN II +11366..1136C ; Top # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Top # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA +1143E..1143F ; Top # Mn [2] NEWA VOWEL SIGN E..NEWA VOWEL SIGN AI +11443..11444 ; Top # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +114BA ; Top # Mn TIRHUTA VOWEL SIGN SHORT E +114BF..114C0 ; Top # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Top # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +11639..1163A ; Top # Mn [2] MODI VOWEL SIGN E..MODI VOWEL SIGN AI +1163D ; Top # Mn MODI SIGN ANUSVARA 
+11640 ; Top # Mn MODI SIGN ARDHACANDRA +116AB ; Top # Mn TAKRI SIGN ANUSVARA +116AD ; Top # Mn TAKRI VOWEL SIGN AA +116B2..116B5 ; Top # Mn [4] TAKRI VOWEL SIGN E..TAKRI VOWEL SIGN AU +1171F ; Top # Mn AHOM CONSONANT SIGN MEDIAL LIGATING RA +11722..11723 ; Top # Mn [2] AHOM VOWEL SIGN I..AHOM VOWEL SIGN II +11727 ; Top # Mn AHOM VOWEL SIGN AW +11729..1172B ; Top # Mn [3] AHOM VOWEL SIGN AI..AHOM SIGN KILLER +11C30..11C31 ; Top # Mn [2] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN II +11C38..11C3D ; Top # Mn [6] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI SIGN ANUSVARA +11CB3 ; Top # Mn MARCHEN VOWEL SIGN E +11CB5..11CB6 ; Top # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU + +# Indic_Positional_Category=Bottom + +093C ; Bottom # Mn DEVANAGARI SIGN NUKTA +0941..0944 ; Bottom # Mn [4] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN VOCALIC RR +094D ; Bottom # Mn DEVANAGARI SIGN VIRAMA +0952 ; Bottom # Mn DEVANAGARI STRESS SIGN ANUDATTA +0956..0957 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN UE..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Bottom # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BC ; Bottom # Mn BENGALI SIGN NUKTA +09C1..09C4 ; Bottom # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09CD ; Bottom # Mn BENGALI SIGN VIRAMA +09E2..09E3 ; Bottom # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3C ; Bottom # Mn GURMUKHI SIGN NUKTA +0A41..0A42 ; Bottom # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A4D ; Bottom # Mn GURMUKHI SIGN VIRAMA +0A75 ; Bottom # Mn GURMUKHI SIGN YAKASH +0ABC ; Bottom # Mn GUJARATI SIGN NUKTA +0AC1..0AC4 ; Bottom # Mn [4] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN VOCALIC RR +0ACD ; Bottom # Mn GUJARATI SIGN VIRAMA +0AE2..0AE3 ; Bottom # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3C ; Bottom # Mn ORIYA SIGN NUKTA +0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B4D ; Bottom # Mn ORIYA SIGN VIRAMA +0B62..0B63 ; 
Bottom # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0C56 ; Bottom # Mn TELUGU AI LENGTH MARK +0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBC ; Bottom # Mn KANNADA SIGN NUKTA +0CE2..0CE3 ; Bottom # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D43..0D44 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC R..MALAYALAM VOWEL SIGN VOCALIC RR +0D62..0D63 ; Bottom # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DD4 ; Bottom # Mn SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Bottom # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0E38..0E3A ; Bottom # Mn [3] THAI CHARACTER SARA U..THAI CHARACTER PHINTHU +0EB8..0EB9 ; Bottom # Mn [2] LAO VOWEL SIGN U..LAO VOWEL SIGN UU +0EBC ; Bottom # Mn LAO SEMIVOWEL SIGN LO +0F18..0F19 ; Bottom # Mn [2] TIBETAN ASTROLOGICAL SIGN -KHYUD PA..TIBETAN ASTROLOGICAL SIGN SDONG TSHUGS +0F35 ; Bottom # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Bottom # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0F71 ; Bottom # Mn TIBETAN VOWEL SIGN AA +0F74..0F75 ; Bottom # Mn [2] TIBETAN VOWEL SIGN U..TIBETAN VOWEL SIGN UU +0F84 ; Bottom # Mn TIBETAN MARK HALANTA +0F8D..0F97 ; Bottom # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Bottom # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +0FC6 ; Bottom # Mn TIBETAN SYMBOL PADMA GDAN +102F..1030 ; Bottom # Mn [2] MYANMAR VOWEL SIGN U..MYANMAR VOWEL SIGN UU +1037 ; Bottom # Mn MYANMAR SIGN DOT BELOW +103D..103E ; Bottom # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +1058..1059 ; Bottom # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +105E..1060 ; Bottom # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Bottom # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +108D ; Bottom # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +1713..1714 ; Bottom # Mn [2] TAGALOG VOWEL SIGN 
U..TAGALOG SIGN VIRAMA +1733..1734 ; Bottom # Mn [2] HANUNOO VOWEL SIGN U..HANUNOO SIGN PAMUDPOD +1753 ; Bottom # Mn BUHID VOWEL SIGN U +1773 ; Bottom # Mn TAGBANWA VOWEL SIGN U +17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA +1922 ; Bottom # Mn LIMBU VOWEL SIGN U +1932 ; Bottom # Mn LIMBU SMALL LETTER ANUSVARA +1939 ; Bottom # Mn LIMBU SIGN MUKPHRENG +193B ; Bottom # Mn LIMBU SIGN SA-I +1A18 ; Bottom # Mn BUGINESE VOWEL SIGN U +1A56 ; Bottom # Mn TAI THAM CONSONANT SIGN MEDIAL LA +1A5B..1A5E ; Bottom # Mn [4] TAI THAM CONSONANT SIGN HIGH RATHA OR LOW PA..TAI THAM CONSONANT SIGN SA +1A69..1A6A ; Bottom # Mn [2] TAI THAM VOWEL SIGN U..TAI THAM VOWEL SIGN UU +1A6C ; Bottom # Mn TAI THAM VOWEL SIGN OA BELOW +1A7F ; Bottom # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1B38..1B3A ; Bottom # Mn [3] BALINESE VOWEL SIGN SUKU..BALINESE VOWEL SIGN RA REPA +1B6C ; Bottom # Mn BALINESE MUSICAL SYMBOL COMBINING ENDEP +1BA2..1BA3 ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BA5 ; Bottom # Mn SUNDANESE VOWEL SIGN PANYUKU +1BAC..1BAD ; Bottom # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C2C ; Bottom # Mn LEPCHA VOWEL SIGN E +1C37 ; Bottom # Mn LEPCHA SIGN NUKTA +1CD5..1CD9 ; Bottom # Mn [5] VEDIC TONE YAJURVEDIC AGGRAVATED INDEPENDENT SVARITA..VEDIC TONE YAJURVEDIC KATHAKA INDEPENDENT SVARITA SCHROEDER +1CDC..1CDF ; Bottom # Mn [4] VEDIC TONE KATHAKA ANUDATTA..VEDIC TONE THREE DOTS BELOW +1CED ; Bottom # Mn VEDIC SIGN TIRYAK +A825 ; Bottom # Mn SYLOTI NAGRI VOWEL SIGN U +A8C4 ; Bottom # Mn SAURASHTRA SIGN VIRAMA +A92B..A92D ; Bottom # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +A947..A949 ; Bottom # Mn [3] REJANG VOWEL SIGN I..REJANG VOWEL SIGN E +A94B..A94E ; Bottom # Mn [4] REJANG VOWEL SIGN O..REJANG VOWEL SIGN EA +A9B8..A9B9 ; Bottom # Mn [2] JAVANESE VOWEL SIGN SUKU..JAVANESE VOWEL SIGN SUKU MENDUT +AA2D ; Bottom # Mn CHAM VOWEL SIGN U +AA32 ; Bottom # Mn CHAM 
VOWEL SIGN UE +AA35..AA36 ; Bottom # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +AAB4 ; Bottom # Mn TAI VIET VOWEL U +AAEC ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UU +ABE8 ; Bottom # Mn MEETEI MAYEK VOWEL SIGN UNAP +ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK +10A02..10A03 ; Bottom # Mn [2] KHAROSHTHI VOWEL SIGN U..KHAROSHTHI VOWEL SIGN VOCALIC R +10A0C..10A0E ; Bottom # Mn [3] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN ANUSVARA +10A39..10A3A ; Bottom # Mn [2] KHAROSHTHI SIGN CAUDA..KHAROSHTHI SIGN DOT BELOW +1103C..11041 ; Bottom # Mn [6] BRAHMI VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL +110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU +110B9..110BA ; Bottom # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +1112A..1112B ; Bottom # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU +11131..11132 ; Bottom # Mn [2] CHAKMA O MARK..CHAKMA AU MARK +11173 ; Bottom # Mn MAHAJANI SIGN NUKTA +111B6..111BB ; Bottom # Mn [6] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN VOCALIC LL +111CC ; Bottom # Mn SHARADA EXTRA SHORT VOWEL MARK +1122F ; Bottom # Mn KHOJKI VOWEL SIGN U +112E3..112E4 ; Bottom # Mn [2] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN UU +112E9..112EA ; Bottom # Mn [2] KHUDAWADI SIGN NUKTA..KHUDAWADI SIGN VIRAMA +11438..1143D ; Bottom # Mn [6] NEWA VOWEL SIGN U..NEWA VOWEL SIGN VOCALIC LL +11442 ; Bottom # Mn NEWA SIGN VIRAMA +11446 ; Bottom # Mn NEWA SIGN NUKTA +114B3..114B8 ; Bottom # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114C2..114C3 ; Bottom # Mn [2] TIRHUTA SIGN VIRAMA..TIRHUTA SIGN NUKTA +115B2..115B5 ; Bottom # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115BF..115C0 ; Bottom # Mn [2] SIDDHAM SIGN VIRAMA..SIDDHAM SIGN NUKTA +115DC..115DD ; Bottom # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11633..11638 ; Bottom # Mn [6] MODI VOWEL SIGN U..MODI VOWEL SIGN VOCALIC LL +1163F ; Bottom # Mn MODI SIGN VIRAMA +116B0..116B1 ; Bottom # Mn [2] TAKRI VOWEL SIGN U..TAKRI 
VOWEL SIGN UU +116B7 ; Bottom # Mn TAKRI SIGN NUKTA +1171D ; Bottom # Mn AHOM CONSONANT SIGN MEDIAL LA +11724..11725 ; Bottom # Mn [2] AHOM VOWEL SIGN U..AHOM VOWEL SIGN UU +11728 ; Bottom # Mn AHOM VOWEL SIGN O +11C32..11C36 ; Bottom # Mn [5] BHAIKSUKI VOWEL SIGN U..BHAIKSUKI VOWEL SIGN VOCALIC L +11C3F ; Bottom # Mn BHAIKSUKI SIGN VIRAMA +11C92..11CA7 ; Bottom # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CAA..11CB0 ; Bottom # Mn [7] MARCHEN SUBJOINED LETTER RA..MARCHEN VOWEL SIGN AA +11CB2 ; Bottom # Mn MARCHEN VOWEL SIGN U + +# Indic_Positional_Category=Top_And_Bottom + +0C48 ; Top_And_Bottom # Mn TELUGU VOWEL SIGN AI +0F73 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN II +0F76..0F79 ; Top_And_Bottom # Mn [4] TIBETAN VOWEL SIGN VOCALIC R..TIBETAN VOWEL SIGN VOCALIC LL +0F81 ; Top_And_Bottom # Mn TIBETAN VOWEL SIGN REVERSED II +1B3C ; Top_And_Bottom # Mn BALINESE VOWEL SIGN LA LENGA +1112E..1112F ; Top_And_Bottom # Mn [2] CHAKMA VOWEL SIGN O..CHAKMA VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Right + +0AC9 ; Top_And_Right # Mc GUJARATI VOWEL SIGN CANDRA O +0B57 ; Top_And_Right # Mc ORIYA AU LENGTH MARK +0CC0 ; Top_And_Right # Mc KANNADA VOWEL SIGN II +0CC7..0CC8 ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Top_And_Right # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +1925..1926 ; Top_And_Right # Mc [2] LIMBU VOWEL SIGN OO..LIMBU VOWEL SIGN AU +1B43 ; Top_And_Right # Mc BALINESE VOWEL SIGN PEPET TEDUNG +111BF ; Top_And_Right # Mc SHARADA VOWEL SIGN AU +11232..11233 ; Top_And_Right # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU + +# Indic_Positional_Category=Top_And_Left + +0B48 ; Top_And_Left # Mc ORIYA VOWEL SIGN AI +0DDA ; Top_And_Left # Mc SINHALA VOWEL SIGN DIGA KOMBUVA +17BE ; Top_And_Left # Mc KHMER VOWEL SIGN OE +1C29 ; Top_And_Left # Mc LEPCHA VOWEL SIGN OO +114BB ; Top_And_Left # Mc TIRHUTA VOWEL SIGN AI +115B9 ; Top_And_Left # Mc SIDDHAM VOWEL SIGN AI + +# 
Indic_Positional_Category=Top_And_Left_And_Right + +0B4C ; Top_And_Left_And_Right # Mc ORIYA VOWEL SIGN AU +0DDD ; Top_And_Left_And_Right # Mc SINHALA VOWEL SIGN KOMBUVA HAA DIGA AELA-PILLA +17BF ; Top_And_Left_And_Right # Mc KHMER VOWEL SIGN YA +115BB ; Top_And_Left_And_Right # Mc SIDDHAM VOWEL SIGN AU + +# Indic_Positional_Category=Bottom_And_Right + +1B3B ; Bottom_And_Right # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +A9C0 ; Bottom_And_Right # Mc JAVANESE PANGKON + +# Indic_Positional_Category=Top_And_Bottom_And_Right + +1B3D ; Top_And_Bottom_And_Right # Mc BALINESE VOWEL SIGN LA LENGA TEDUNG + +# Indic_Positional_Category=Overstruck + +1CD4 ; Overstruck # Mn VEDIC SIGN YAJURVEDIC MIDLINE SVARITA +1CE2..1CE8 ; Overstruck # Mn [7] VEDIC SIGN VISARGA SVARITA..VEDIC SIGN VISARGA ANUDATTA WITH TAIL +10A01 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN I +10A06 ; Overstruck # Mn KHAROSHTHI VOWEL SIGN O + +# EOF diff --git a/data/9.0.0-indic-syllabic-category.txt b/data/9.0.0-indic-syllabic-category.txt new file mode 100644 index 0000000..d6c6162 --- /dev/null +++ b/data/9.0.0-indic-syllabic-category.txt @@ -0,0 +1,1159 @@ +# IndicSyllabicCategory-9.0.0.txt +# Date: 2016-05-21, 02:46:00 GMT [RP] +# © 2016 Unicode®, Inc. +# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. +# For terms of use, see http://www.unicode.org/terms_of_use.html +# +# For documentation, see UAX #44: Unicode Character Database, +# at http://www.unicode.org/reports/tr44/ +# +# This file defines the following property: +# +# Indic_Syllabic_Category enumerated property +# +# Scope: This property is aimed at two general problem +# areas involving the analysis and processing of Indic scripts: +# +# 1. Specification of syllabic structure. +# 2. Specification of segmentation rules. +# +# Both of these problem areas may benefit from having defined subtypes +# of Indic script characters which are relevant to how Indic +# syllables (or aksaras) are constructed. 
Note that rules for +# syllabic structure in Indic scripts may differ significantly +# from how phonological syllables are defined. +# +# Format: +# Field 0 Unicode code point value or range of code point values +# Field 1 Indic_Syllabic_Category property value +# +# Field 1 is followed by a comment field, starting with the number sign '#', +# which shows the General_Category property value, the Unicode character name +# or names, and, in lines with ranges of code points, the code point count in +# square brackets. +# +# The scripts assessed as Indic in the structural sense used for the +# Indic_Syllabic_Category are the following: +# +# Ahom, Balinese, Batak, Bengali, Bhaiksuki, Brahmi, Buginese, Buhid, +# Chakma, Cham, Devanagari, Grantha, Gujarati, Gurmukhi, Hanunoo, +# Javanese, Kaithi, Kannada, Kayah Li, Kharoshthi, Khmer, Khojki, +# Khudawadi, Lao, Lepcha, Limbu, Mahajani, Malayalam, Marchen, Meetei +# Mayek, Modi, Multani, Myanmar, Newa, New Tai Lue, Oriya, Phags-pa, +# Rejang, Saurashtra, Sharada, Siddham, Sinhala, Sundanese, Syloti +# Nagri, Tagalog, Tagbanwa, Tai Le, Tai Tham, Tai Viet, Takri, Tamil, +# Telugu, Thai, Tibetan, and Tirhuta. +# +# All characters for all other scripts not in that list +# take the default value for this property, unless they +# are individually listed in this data file. +# + +# ================================================ + +# Property: Indic_Syllabic_Category +# +# All code points not explicitly listed for Indic_Syllabic_Category +# have the value Other. +# +# @missing: 0000..10FFFF; Other + +# ================================================ + +# Indic_Syllabic_Category=Bindu + +# Bindu/Anusvara (nasalization or -n) +# Excludes various Vedic nasalization signs. 
+ +# [Not derivable] + +0900..0902 ; Bindu # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA +0981 ; Bindu # Mn BENGALI SIGN CANDRABINDU +0982 ; Bindu # Mc BENGALI SIGN ANUSVARA +0A01..0A02 ; Bindu # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI +0A70 ; Bindu # Mn GURMUKHI TIPPI +0A81..0A82 ; Bindu # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA +0B01 ; Bindu # Mn ORIYA SIGN CANDRABINDU +0B02 ; Bindu # Mc ORIYA SIGN ANUSVARA +0B82 ; Bindu # Mn TAMIL SIGN ANUSVARA +0C00 ; Bindu # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE +0C01..0C02 ; Bindu # Mc [2] TELUGU SIGN CANDRABINDU..TELUGU SIGN ANUSVARA +0C81 ; Bindu # Mn KANNADA SIGN CANDRABINDU +0C82 ; Bindu # Mc KANNADA SIGN ANUSVARA +0D01 ; Bindu # Mn MALAYALAM SIGN CANDRABINDU +0D02 ; Bindu # Mc MALAYALAM SIGN ANUSVARA +0D82 ; Bindu # Mc SINHALA SIGN ANUSVARAYA +0E4D ; Bindu # Mn THAI CHARACTER NIKHAHIT +0ECD ; Bindu # Mn LAO NIGGAHITA +0F7E ; Bindu # Mn TIBETAN SIGN RJES SU NGA RO +0F82..0F83 ; Bindu # Mn [2] TIBETAN SIGN NYI ZLA NAA DA..TIBETAN SIGN SNA LDAN +1036 ; Bindu # Mn MYANMAR SIGN ANUSVARA +17C6 ; Bindu # Mn KHMER SIGN NIKAHIT +1932 ; Bindu # Mn LIMBU SMALL LETTER ANUSVARA +1B00..1B02 ; Bindu # Mn [3] BALINESE SIGN ULU RICEM..BALINESE SIGN CECEK +1B80 ; Bindu # Mn SUNDANESE SIGN PANYECEK +1C34..1C35 ; Bindu # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG +A80B ; Bindu # Mn SYLOTI NAGRI SIGN ANUSVARA +A873 ; Bindu # Lo PHAGS-PA LETTER CANDRABINDU +A880 ; Bindu # Mc SAURASHTRA SIGN ANUSVARA +A8C5 ; Bindu # Mn SAURASHTRA SIGN CANDRABINDU +A980..A981 ; Bindu # Mn [2] JAVANESE SIGN PANYANGGA..JAVANESE SIGN CECAK +10A0E ; Bindu # Mn KHAROSHTHI SIGN ANUSVARA +11000 ; Bindu # Mc BRAHMI SIGN CANDRABINDU +11001 ; Bindu # Mn BRAHMI SIGN ANUSVARA +11080..11081 ; Bindu # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA +11100..11101 ; Bindu # Mn [2] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN ANUSVARA +11180..11181 ; Bindu # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA 
SIGN ANUSVARA +11234 ; Bindu # Mn KHOJKI SIGN ANUSVARA +112DF ; Bindu # Mn KHUDAWADI SIGN ANUSVARA +11300..11301 ; Bindu # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU +11302 ; Bindu # Mc GRANTHA SIGN ANUSVARA +11443..11444 ; Bindu # Mn [2] NEWA SIGN CANDRABINDU..NEWA SIGN ANUSVARA +114BF..114C0 ; Bindu # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA +115BC..115BD ; Bindu # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA +1163D ; Bindu # Mn MODI SIGN ANUSVARA +116AB ; Bindu # Mn TAKRI SIGN ANUSVARA +11C3C..11C3D ; Bindu # Mn [2] BHAIKSUKI SIGN CANDRABINDU..BHAIKSUKI SIGN ANUSVARA +11CB5..11CB6 ; Bindu # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU + +# ================================================ + +# Indic_Syllabic_Category=Visarga + +# Visarga (-h) +# Includes specialized case for Sanskrit: ardhavisarga +# Excludes letters for jihvamuliya and upadhmaniya, which are +# related, but structured somewhat differently. + +# [Not derivable] + +0903 ; Visarga # Mc DEVANAGARI SIGN VISARGA +0983 ; Visarga # Mc BENGALI SIGN VISARGA +0A03 ; Visarga # Mc GURMUKHI SIGN VISARGA +0A83 ; Visarga # Mc GUJARATI SIGN VISARGA +0B03 ; Visarga # Mc ORIYA SIGN VISARGA +0C03 ; Visarga # Mc TELUGU SIGN VISARGA +0C83 ; Visarga # Mc KANNADA SIGN VISARGA +0D03 ; Visarga # Mc MALAYALAM SIGN VISARGA +0D83 ; Visarga # Mc SINHALA SIGN VISARGAYA +0F7F ; Visarga # Mc TIBETAN SIGN RNAM BCAD +1038 ; Visarga # Mc MYANMAR SIGN VISARGA +17C7 ; Visarga # Mc KHMER SIGN REAHMUK +1B04 ; Visarga # Mc BALINESE SIGN BISAH +1B82 ; Visarga # Mc SUNDANESE SIGN PANGWISAD +1CF2..1CF3 ; Visarga # Mc [2] VEDIC SIGN ARDHAVISARGA..VEDIC SIGN ROTATED ARDHAVISARGA +A881 ; Visarga # Mc SAURASHTRA SIGN VISARGA +A983 ; Visarga # Mc JAVANESE SIGN WIGNYAN +AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA +10A0F ; Visarga # Mn KHAROSHTHI SIGN VISARGA +11002 ; Visarga # Mc BRAHMI SIGN VISARGA +11082 ; Visarga # Mc KAITHI SIGN VISARGA +11102 ; Visarga # Mn CHAKMA SIGN 
VISARGA +11182 ; Visarga # Mc SHARADA SIGN VISARGA +11303 ; Visarga # Mc GRANTHA SIGN VISARGA +11445 ; Visarga # Mc NEWA SIGN VISARGA +114C1 ; Visarga # Mc TIRHUTA SIGN VISARGA +115BE ; Visarga # Mc SIDDHAM SIGN VISARGA +1163E ; Visarga # Mc MODI SIGN VISARGA +116AC ; Visarga # Mc TAKRI SIGN VISARGA +11C3E ; Visarga # Mc BHAIKSUKI SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Avagraha + +# Avagraha (elision of initial a- in sandhi) + +# [Not derivable] + +093D ; Avagraha # Lo DEVANAGARI SIGN AVAGRAHA +09BD ; Avagraha # Lo BENGALI SIGN AVAGRAHA +0ABD ; Avagraha # Lo GUJARATI SIGN AVAGRAHA +0B3D ; Avagraha # Lo ORIYA SIGN AVAGRAHA +0C3D ; Avagraha # Lo TELUGU SIGN AVAGRAHA +0CBD ; Avagraha # Lo KANNADA SIGN AVAGRAHA +0D3D ; Avagraha # Lo MALAYALAM SIGN AVAGRAHA +0F85 ; Avagraha # Po TIBETAN MARK PALUTA +17DC ; Avagraha # Lo KHMER SIGN AVAKRAHASANYA +1BBA ; Avagraha # Lo SUNDANESE AVAGRAHA +111C1 ; Avagraha # Lo SHARADA SIGN AVAGRAHA +1133D ; Avagraha # Lo GRANTHA SIGN AVAGRAHA +11447 ; Avagraha # Lo NEWA SIGN AVAGRAHA +114C4 ; Avagraha # Lo TIRHUTA SIGN AVAGRAHA +11C40 ; Avagraha # Lo BHAIKSUKI SIGN AVAGRAHA + +# ================================================ + +# Indic_Syllabic_Category=Nukta + +# Nukta (diacritic for borrowed consonants or other consonant +# modifications) + +# [Derivation: (ccc=7) + 0F39 + 10A38..10A3A - 1037 - 1E94A] + +093C ; Nukta # Mn DEVANAGARI SIGN NUKTA +09BC ; Nukta # Mn BENGALI SIGN NUKTA +0A3C ; Nukta # Mn GURMUKHI SIGN NUKTA +0ABC ; Nukta # Mn GUJARATI SIGN NUKTA +0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0CBC ; Nukta # Mn KANNADA SIGN NUKTA +0F39 ; Nukta # Mn TIBETAN MARK TSA -PHRU +1B34 ; Nukta # Mn BALINESE SIGN REREKAN +1BE6 ; Nukta # Mn BATAK SIGN TOMPI +1C37 ; Nukta # Mn LEPCHA SIGN NUKTA +A9B3 ; Nukta # Mn JAVANESE SIGN CECAK TELU +10A38..10A3A ; Nukta # Mn [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW +110BA ; Nukta # Mn KAITHI SIGN NUKTA +11173 ; Nukta # Mn MAHAJANI SIGN 
NUKTA +111CA ; Nukta # Mn SHARADA SIGN NUKTA +11236 ; Nukta # Mn KHOJKI SIGN NUKTA +112E9 ; Nukta # Mn KHUDAWADI SIGN NUKTA +1133C ; Nukta # Mn GRANTHA SIGN NUKTA +11446 ; Nukta # Mn NEWA SIGN NUKTA +114C3 ; Nukta # Mn TIRHUTA SIGN NUKTA +115C0 ; Nukta # Mn SIDDHAM SIGN NUKTA +116B7 ; Nukta # Mn TAKRI SIGN NUKTA + +# ================================================ + +# Indic_Syllabic_Category=Virama + +# Virama (killing of inherent vowel in consonant sequence +# or consonant stacker) +# Only includes characters that can act both as visible killer viramas +# and consonant stackers. Separate property values exist for characters +# that can only act as pure killers or only as consonant stackers. + +# [Derivation: (ccc=9) - (InSC=Pure_Killer) - (InSC=Invisible_Stacker) +# - (InSC=Number_Joiner) - 2D7F] + +094D ; Virama # Mn DEVANAGARI SIGN VIRAMA +09CD ; Virama # Mn BENGALI SIGN VIRAMA +0A4D ; Virama # Mn GURMUKHI SIGN VIRAMA +0ACD ; Virama # Mn GUJARATI SIGN VIRAMA +0B4D ; Virama # Mn ORIYA SIGN VIRAMA +0BCD ; Virama # Mn TAMIL SIGN VIRAMA +0C4D ; Virama # Mn TELUGU SIGN VIRAMA +0CCD ; Virama # Mn KANNADA SIGN VIRAMA +0D4D ; Virama # Mn MALAYALAM SIGN VIRAMA +0DCA ; Virama # Mn SINHALA SIGN AL-LAKUNA +1B44 ; Virama # Mc BALINESE ADEG ADEG +A8C4 ; Virama # Mn SAURASHTRA SIGN VIRAMA +A9C0 ; Virama # Mc JAVANESE PANGKON +11046 ; Virama # Mn BRAHMI VIRAMA +110B9 ; Virama # Mn KAITHI SIGN VIRAMA +111C0 ; Virama # Mc SHARADA SIGN VIRAMA +11235 ; Virama # Mc KHOJKI SIGN VIRAMA +1134D ; Virama # Mc GRANTHA SIGN VIRAMA +11442 ; Virama # Mn NEWA SIGN VIRAMA +114C2 ; Virama # Mn TIRHUTA SIGN VIRAMA +115BF ; Virama # Mn SIDDHAM SIGN VIRAMA +1163F ; Virama # Mn MODI SIGN VIRAMA +116B6 ; Virama # Mc TAKRI SIGN VIRAMA +11C3F ; Virama # Mn BHAIKSUKI SIGN VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Pure_Killer + +# Pure killer (killing of inherent vowel in consonant sequence, +# with no consonant stacking behavior) + +# [Not derivable] + 
+0E3A ; Pure_Killer # Mn THAI CHARACTER PHINTHU +0E4E ; Pure_Killer # Mn THAI CHARACTER YAMAKKAN +0F84 ; Pure_Killer # Mn TIBETAN MARK HALANTA +103A ; Pure_Killer # Mn MYANMAR SIGN ASAT +1714 ; Pure_Killer # Mn TAGALOG SIGN VIRAMA +1734 ; Pure_Killer # Mn HANUNOO SIGN PAMUDPOD +17D1 ; Pure_Killer # Mn KHMER SIGN VIRIAM +1BAA ; Pure_Killer # Mc SUNDANESE SIGN PAMAAEH +1BF2..1BF3 ; Pure_Killer # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN +A806 ; Pure_Killer # Mn SYLOTI NAGRI SIGN HASANTA +A953 ; Pure_Killer # Mc REJANG VIRAMA +ABED ; Pure_Killer # Mn MEETEI MAYEK APUN IYEK +11134 ; Pure_Killer # Mn CHAKMA MAAYYAA +112EA ; Pure_Killer # Mn KHUDAWADI SIGN VIRAMA +1172B ; Pure_Killer # Mn AHOM SIGN KILLER + +# ================================================ + +# Indic_Syllabic_Category=Invisible_Stacker + +# Invisible stacker (invisible consonant stacker virama) + +# [Not derivable] + +1039 ; Invisible_Stacker # Mn MYANMAR SIGN VIRAMA +17D2 ; Invisible_Stacker # Mn KHMER SIGN COENG +1A60 ; Invisible_Stacker # Mn TAI THAM SIGN SAKOT +1BAB ; Invisible_Stacker # Mn SUNDANESE SIGN VIRAMA +AAF6 ; Invisible_Stacker # Mn MEETEI MAYEK VIRAMA +10A3F ; Invisible_Stacker # Mn KHAROSHTHI VIRAMA +11133 ; Invisible_Stacker # Mn CHAKMA VIRAMA + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Independent + +# Independent Vowels (contrasted with matras) + +# [Not derivable] + +0904..0914 ; Vowel_Independent # Lo [17] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER AU +0960..0961 ; Vowel_Independent # Lo [2] DEVANAGARI LETTER VOCALIC RR..DEVANAGARI LETTER VOCALIC LL +0972..0977 ; Vowel_Independent # Lo [6] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER UUE +0985..098C ; Vowel_Independent # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L +098F..0990 ; Vowel_Independent # Lo [2] BENGALI LETTER E..BENGALI LETTER AI +0993..0994 ; Vowel_Independent # Lo [2] BENGALI LETTER O..BENGALI LETTER AU +09E0..09E1 ; Vowel_Independent # Lo [2] BENGALI LETTER VOCALIC 
RR..BENGALI LETTER VOCALIC LL +0A05..0A0A ; Vowel_Independent # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU +0A0F..0A10 ; Vowel_Independent # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI +0A13..0A14 ; Vowel_Independent # Lo [2] GURMUKHI LETTER OO..GURMUKHI LETTER AU +0A85..0A8D ; Vowel_Independent # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E +0A8F..0A91 ; Vowel_Independent # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O +0A93..0A94 ; Vowel_Independent # Lo [2] GUJARATI LETTER O..GUJARATI LETTER AU +0AE0..0AE1 ; Vowel_Independent # Lo [2] GUJARATI LETTER VOCALIC RR..GUJARATI LETTER VOCALIC LL +0B05..0B0C ; Vowel_Independent # Lo [8] ORIYA LETTER A..ORIYA LETTER VOCALIC L +0B0F..0B10 ; Vowel_Independent # Lo [2] ORIYA LETTER E..ORIYA LETTER AI +0B13..0B14 ; Vowel_Independent # Lo [2] ORIYA LETTER O..ORIYA LETTER AU +0B60..0B61 ; Vowel_Independent # Lo [2] ORIYA LETTER VOCALIC RR..ORIYA LETTER VOCALIC LL +0B85..0B8A ; Vowel_Independent # Lo [6] TAMIL LETTER A..TAMIL LETTER UU +0B8E..0B90 ; Vowel_Independent # Lo [3] TAMIL LETTER E..TAMIL LETTER AI +0B92..0B94 ; Vowel_Independent # Lo [3] TAMIL LETTER O..TAMIL LETTER AU +0C05..0C0C ; Vowel_Independent # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L +0C0E..0C10 ; Vowel_Independent # Lo [3] TELUGU LETTER E..TELUGU LETTER AI +0C12..0C14 ; Vowel_Independent # Lo [3] TELUGU LETTER O..TELUGU LETTER AU +0C60..0C61 ; Vowel_Independent # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL +0C85..0C8C ; Vowel_Independent # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L +0C8E..0C90 ; Vowel_Independent # Lo [3] KANNADA LETTER E..KANNADA LETTER AI +0C92..0C94 ; Vowel_Independent # Lo [3] KANNADA LETTER O..KANNADA LETTER AU +0CE0..0CE1 ; Vowel_Independent # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL +0D05..0D0C ; Vowel_Independent # Lo [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L +0D0E..0D10 ; Vowel_Independent # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI +0D12..0D14 ; 
Vowel_Independent # Lo [3] MALAYALAM LETTER O..MALAYALAM LETTER AU +0D5F..0D61 ; Vowel_Independent # Lo [3] MALAYALAM LETTER ARCHAIC II..MALAYALAM LETTER VOCALIC LL +0D85..0D96 ; Vowel_Independent # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA +1021..102A ; Vowel_Independent # Lo [10] MYANMAR LETTER A..MYANMAR LETTER AU +1052..1055 ; Vowel_Independent # Lo [4] MYANMAR LETTER VOCALIC R..MYANMAR LETTER VOCALIC LL +1700..1702 ; Vowel_Independent # Lo [3] TAGALOG LETTER A..TAGALOG LETTER U +1720..1722 ; Vowel_Independent # Lo [3] HANUNOO LETTER A..HANUNOO LETTER U +1740..1742 ; Vowel_Independent # Lo [3] BUHID LETTER A..BUHID LETTER U +1760..1762 ; Vowel_Independent # Lo [3] TAGBANWA LETTER A..TAGBANWA LETTER U +17A3..17B3 ; Vowel_Independent # Lo [17] KHMER INDEPENDENT VOWEL QAQ..KHMER INDEPENDENT VOWEL QAU +1A4D..1A52 ; Vowel_Independent # Lo [6] TAI THAM LETTER I..TAI THAM LETTER OO +1B05..1B12 ; Vowel_Independent # Lo [14] BALINESE LETTER AKARA..BALINESE LETTER OKARA TEDUNG +1B83..1B89 ; Vowel_Independent # Lo [7] SUNDANESE LETTER A..SUNDANESE LETTER EU +1BE4..1BE5 ; Vowel_Independent # Lo [2] BATAK LETTER I..BATAK LETTER U +A800..A801 ; Vowel_Independent # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I +A803..A805 ; Vowel_Independent # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O +A882..A891 ; Vowel_Independent # Lo [16] SAURASHTRA LETTER A..SAURASHTRA LETTER AU +A984..A988 ; Vowel_Independent # Lo [5] JAVANESE LETTER A..JAVANESE LETTER U +A98C..A98E ; Vowel_Independent # Lo [3] JAVANESE LETTER E..JAVANESE LETTER O +AA00..AA05 ; Vowel_Independent # Lo [6] CHAM LETTER A..CHAM LETTER O +AAE0..AAE1 ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER E..MEETEI MAYEK LETTER O +ABCE..ABCF ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER UN..MEETEI MAYEK LETTER I +ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA +11005..11012 ; Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU +11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER 
A..KAITHI LETTER AU +11103..11106 ; Vowel_Independent # Lo [4] CHAKMA LETTER AA..CHAKMA LETTER E +11183..11190 ; Vowel_Independent # Lo [14] SHARADA LETTER A..SHARADA LETTER AU +11200..11207 ; Vowel_Independent # Lo [8] KHOJKI LETTER A..KHOJKI LETTER AU +11280..11283 ; Vowel_Independent # Lo [4] MULTANI LETTER A..MULTANI LETTER E +112B0..112B9 ; Vowel_Independent # Lo [10] KHUDAWADI LETTER A..KHUDAWADI LETTER AU +11305..1130C ; Vowel_Independent # Lo [8] GRANTHA LETTER A..GRANTHA LETTER VOCALIC L +1130F..11310 ; Vowel_Independent # Lo [2] GRANTHA LETTER EE..GRANTHA LETTER AI +11313..11314 ; Vowel_Independent # Lo [2] GRANTHA LETTER OO..GRANTHA LETTER AU +11360..11361 ; Vowel_Independent # Lo [2] GRANTHA LETTER VOCALIC RR..GRANTHA LETTER VOCALIC LL +11400..1140D ; Vowel_Independent # Lo [14] NEWA LETTER A..NEWA LETTER AU +11481..1148E ; Vowel_Independent # Lo [14] TIRHUTA LETTER A..TIRHUTA LETTER AU +11580..1158D ; Vowel_Independent # Lo [14] SIDDHAM LETTER A..SIDDHAM LETTER AU +115D8..115DB ; Vowel_Independent # Lo [4] SIDDHAM LETTER THREE-CIRCLE ALTERNATE I..SIDDHAM LETTER ALTERNATE U +11600..1160D ; Vowel_Independent # Lo [14] MODI LETTER A..MODI LETTER AU +11680..11689 ; Vowel_Independent # Lo [10] TAKRI LETTER A..TAKRI LETTER AU +11C00..11C08 ; Vowel_Independent # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L +11C0A..11C0D ; Vowel_Independent # Lo [4] BHAIKSUKI LETTER E..BHAIKSUKI LETTER AU + +# ================================================ + +# Indic_Syllabic_Category=Vowel_Dependent + +# Dependent Vowels (contrasted with independent vowels and/or with complex placement) +# Matras (in Indic scripts) + +# [Not derivable] + +093A ; Vowel_Dependent # Mn DEVANAGARI VOWEL SIGN OE +093B ; Vowel_Dependent # Mc DEVANAGARI VOWEL SIGN OOE +093E..0940 ; Vowel_Dependent # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II +0941..0948 ; Vowel_Dependent # Mn [8] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN AI +0949..094C ; Vowel_Dependent # Mc [4] 
DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU +094E..094F ; Vowel_Dependent # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA E..DEVANAGARI VOWEL SIGN AW +0955..0957 ; Vowel_Dependent # Mn [3] DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE +0962..0963 ; Vowel_Dependent # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL +09BE..09C0 ; Vowel_Dependent # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II +09C1..09C4 ; Vowel_Dependent # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR +09C7..09C8 ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI +09CB..09CC ; Vowel_Dependent # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU +09D7 ; Vowel_Dependent # Mc BENGALI AU LENGTH MARK +09E2..09E3 ; Vowel_Dependent # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL +0A3E..0A40 ; Vowel_Dependent # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II +0A41..0A42 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU +0A47..0A48 ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI +0A4B..0A4C ; Vowel_Dependent # Mn [2] GURMUKHI VOWEL SIGN OO..GURMUKHI VOWEL SIGN AU +0ABE..0AC0 ; Vowel_Dependent # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL SIGN II +0AC1..0AC5 ; Vowel_Dependent # Mn [5] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN CANDRA E +0AC7..0AC8 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI +0AC9 ; Vowel_Dependent # Mc GUJARATI VOWEL SIGN CANDRA O +0ACB..0ACC ; Vowel_Dependent # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU +0AE2..0AE3 ; Vowel_Dependent # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL +0B3E ; Vowel_Dependent # Mc ORIYA VOWEL SIGN AA +0B3F ; Vowel_Dependent # Mn ORIYA VOWEL SIGN I +0B40 ; Vowel_Dependent # Mc ORIYA VOWEL SIGN II +0B41..0B44 ; Vowel_Dependent # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR +0B47..0B48 ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN 
E..ORIYA VOWEL SIGN AI +0B4B..0B4C ; Vowel_Dependent # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU +0B56 ; Vowel_Dependent # Mn ORIYA AI LENGTH MARK +0B57 ; Vowel_Dependent # Mc ORIYA AU LENGTH MARK +0B62..0B63 ; Vowel_Dependent # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0BBE..0BBF ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I +0BC0 ; Vowel_Dependent # Mn TAMIL VOWEL SIGN II +0BC1..0BC2 ; Vowel_Dependent # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU +0BC6..0BC8 ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI +0BCA..0BCC ; Vowel_Dependent # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU +0BD7 ; Vowel_Dependent # Mc TAMIL AU LENGTH MARK +0C3E..0C40 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II +0C41..0C44 ; Vowel_Dependent # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR +0C46..0C48 ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI +0C4A..0C4C ; Vowel_Dependent # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU +0C55..0C56 ; Vowel_Dependent # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK +0C62..0C63 ; Vowel_Dependent # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL +0CBE ; Vowel_Dependent # Mc KANNADA VOWEL SIGN AA +0CBF ; Vowel_Dependent # Mn KANNADA VOWEL SIGN I +0CC0..0CC4 ; Vowel_Dependent # Mc [5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN VOCALIC RR +0CC6 ; Vowel_Dependent # Mn KANNADA VOWEL SIGN E +0CC7..0CC8 ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI +0CCA..0CCB ; Vowel_Dependent # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO +0CCC ; Vowel_Dependent # Mn KANNADA VOWEL SIGN AU +0CD5..0CD6 ; Vowel_Dependent # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CE2..0CE3 ; Vowel_Dependent # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL +0D3E..0D40 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II +0D41..0D44 ; Vowel_Dependent # Mn [4] 
MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR +0D46..0D48 ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI +0D4A..0D4C ; Vowel_Dependent # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU +0D57 ; Vowel_Dependent # Mc MALAYALAM AU LENGTH MARK +0D62..0D63 ; Vowel_Dependent # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL +0DCF..0DD1 ; Vowel_Dependent # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA +0DD2..0DD4 ; Vowel_Dependent # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA +0DD6 ; Vowel_Dependent # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA +0DD8..0DDF ; Vowel_Dependent # Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA +0DF2..0DF3 ; Vowel_Dependent # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA +0E30 ; Vowel_Dependent # Lo THAI CHARACTER SARA A +0E31 ; Vowel_Dependent # Mn THAI CHARACTER MAI HAN-AKAT +0E32..0E33 ; Vowel_Dependent # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM +0E34..0E39 ; Vowel_Dependent # Mn [6] THAI CHARACTER SARA I..THAI CHARACTER SARA UU +0E40..0E45 ; Vowel_Dependent # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO +0E47 ; Vowel_Dependent # Mn THAI CHARACTER MAITAIKHU +0EB0 ; Vowel_Dependent # Lo LAO VOWEL SIGN A +0EB1 ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KAN +0EB2..0EB3 ; Vowel_Dependent # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM +0EB4..0EB9 ; Vowel_Dependent # Mn [6] LAO VOWEL SIGN I..LAO VOWEL SIGN UU +0EBB ; Vowel_Dependent # Mn LAO VOWEL SIGN MAI KON +0EC0..0EC4 ; Vowel_Dependent # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI +0F71..0F7D ; Vowel_Dependent # Mn [13] TIBETAN VOWEL SIGN AA..TIBETAN VOWEL SIGN OO +0F80..0F81 ; Vowel_Dependent # Mn [2] TIBETAN VOWEL SIGN REVERSED I..TIBETAN VOWEL SIGN REVERSED II +102B..102C ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA +102D..1030 ; Vowel_Dependent # Mn [4] MYANMAR 
VOWEL SIGN I..MYANMAR VOWEL SIGN UU +1031 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN E +1032..1035 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN AI..MYANMAR VOWEL SIGN E ABOVE +1056..1057 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR +1058..1059 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL +1062 ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN SGAW KAREN EU +1067..1068 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR VOWEL SIGN WESTERN PWO KAREN UE +1071..1074 ; Vowel_Dependent # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE +1083..1084 ; Vowel_Dependent # Mc [2] MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E +1085..1086 ; Vowel_Dependent # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y +109C ; Vowel_Dependent # Mc MYANMAR VOWEL SIGN AITON A +109D ; Vowel_Dependent # Mn MYANMAR VOWEL SIGN AITON AI +1712..1713 ; Vowel_Dependent # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U +1732..1733 ; Vowel_Dependent # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1752..1753 ; Vowel_Dependent # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U +1772..1773 ; Vowel_Dependent # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U +17B6 ; Vowel_Dependent # Mc KHMER VOWEL SIGN AA +17B7..17BD ; Vowel_Dependent # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL SIGN UA +17BE..17C5 ; Vowel_Dependent # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU +17C8 ; Vowel_Dependent # Mc KHMER SIGN YUUKALEAPINTU +1920..1922 ; Vowel_Dependent # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U +1923..1926 ; Vowel_Dependent # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU +1927..1928 ; Vowel_Dependent # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O +193A ; Vowel_Dependent # Mn LIMBU SIGN KEMPHRENG +19B0..19C0 ; Vowel_Dependent # Lo [17] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE VOWEL SIGN IY +1A17..1A18 ; Vowel_Dependent # Mn [2] BUGINESE VOWEL 
SIGN I..BUGINESE VOWEL SIGN U +1A19..1A1A ; Vowel_Dependent # Mc [2] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN O +1A1B ; Vowel_Dependent # Mn BUGINESE VOWEL SIGN AE +1A61 ; Vowel_Dependent # Mc TAI THAM VOWEL SIGN A +1A62 ; Vowel_Dependent # Mn TAI THAM VOWEL SIGN MAI SAT +1A63..1A64 ; Vowel_Dependent # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA +1A65..1A6C ; Vowel_Dependent # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW +1A6D..1A72 ; Vowel_Dependent # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI +1A73..1A74 ; Vowel_Dependent # Mn [2] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN MAI KANG +1B35 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN TEDUNG +1B36..1B3A ; Vowel_Dependent # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA +1B3B ; Vowel_Dependent # Mc BALINESE VOWEL SIGN RA REPA TEDUNG +1B3C ; Vowel_Dependent # Mn BALINESE VOWEL SIGN LA LENGA +1B3D..1B41 ; Vowel_Dependent # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG +1B42 ; Vowel_Dependent # Mn BALINESE VOWEL SIGN PEPET +1B43 ; Vowel_Dependent # Mc BALINESE VOWEL SIGN PEPET TEDUNG +1BA4..1BA5 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PANGHULU..SUNDANESE VOWEL SIGN PANYUKU +1BA6..1BA7 ; Vowel_Dependent # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL SIGN PANOLONG +1BA8..1BA9 ; Vowel_Dependent # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG +1BE7 ; Vowel_Dependent # Mc BATAK VOWEL SIGN E +1BE8..1BE9 ; Vowel_Dependent # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE +1BEA..1BEC ; Vowel_Dependent # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O +1BED ; Vowel_Dependent # Mn BATAK VOWEL SIGN KARO O +1BEE ; Vowel_Dependent # Mc BATAK VOWEL SIGN U +1BEF ; Vowel_Dependent # Mn BATAK VOWEL SIGN U FOR SIMALUNGUN SA +1C26..1C2B ; Vowel_Dependent # Mc [6] LEPCHA VOWEL SIGN AA..LEPCHA VOWEL SIGN UU +1C2C ; Vowel_Dependent # Mn LEPCHA VOWEL SIGN E +A823..A824 ; Vowel_Dependent # Mc [2] SYLOTI 
NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I +A825..A826 ; Vowel_Dependent # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E +A827 ; Vowel_Dependent # Mc SYLOTI NAGRI VOWEL SIGN OO +A8B5..A8C3 ; Vowel_Dependent # Mc [15] SAURASHTRA VOWEL SIGN AA..SAURASHTRA VOWEL SIGN AU +A947..A94E ; Vowel_Dependent # Mn [8] REJANG VOWEL SIGN I..REJANG VOWEL SIGN EA +A9B4..A9B5 ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG +A9B6..A9B9 ; Vowel_Dependent # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT +A9BA..A9BB ; Vowel_Dependent # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE +A9BC ; Vowel_Dependent # Mn JAVANESE VOWEL SIGN PEPET +A9E5 ; Vowel_Dependent # Mn MYANMAR SIGN SHAN SAW +AA29..AA2E ; Vowel_Dependent # Mn [6] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN OE +AA2F..AA30 ; Vowel_Dependent # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI +AA31..AA32 ; Vowel_Dependent # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE +AAB0 ; Vowel_Dependent # Mn TAI VIET MAI KANG +AAB1 ; Vowel_Dependent # Lo TAI VIET VOWEL AA +AAB2..AAB4 ; Vowel_Dependent # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U +AAB5..AAB6 ; Vowel_Dependent # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O +AAB7..AAB8 ; Vowel_Dependent # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA +AAB9..AABD ; Vowel_Dependent # Lo [5] TAI VIET VOWEL UEA..TAI VIET VOWEL AN +AABE ; Vowel_Dependent # Mn TAI VIET VOWEL AM +AAEB ; Vowel_Dependent # Mc MEETEI MAYEK VOWEL SIGN II +AAEC..AAED ; Vowel_Dependent # Mn [2] MEETEI MAYEK VOWEL SIGN UU..MEETEI MAYEK VOWEL SIGN AAI +AAEE..AAEF ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN AU..MEETEI MAYEK VOWEL SIGN AAU +ABE3..ABE4 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP +ABE5 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN ANAP +ABE6..ABE7 ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP +ABE8 ; Vowel_Dependent # Mn MEETEI MAYEK VOWEL SIGN UNAP 
+ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG +10A01..10A03 ; Vowel_Dependent # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R +10A05..10A06 ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O +10A0C..10A0D ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN DOUBLE RING BELOW +11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +110B0..110B2 ; Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II +110B3..110B6 ; Vowel_Dependent # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI +110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +11127..1112B ; Vowel_Dependent # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU +1112C ; Vowel_Dependent # Mc CHAKMA VOWEL SIGN E +1112D..11132 ; Vowel_Dependent # Mn [6] CHAKMA VOWEL SIGN AI..CHAKMA AU MARK +111B3..111B5 ; Vowel_Dependent # Mc [3] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN II +111B6..111BE ; Vowel_Dependent # Mn [9] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN O +111BF ; Vowel_Dependent # Mc SHARADA VOWEL SIGN AU +111CB..111CC ; Vowel_Dependent # Mn [2] SHARADA VOWEL MODIFIER MARK..SHARADA EXTRA SHORT VOWEL MARK +1122C..1122E ; Vowel_Dependent # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II +1122F..11231 ; Vowel_Dependent # Mn [3] KHOJKI VOWEL SIGN U..KHOJKI VOWEL SIGN AI +11232..11233 ; Vowel_Dependent # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU +112E0..112E2 ; Vowel_Dependent # Mc [3] KHUDAWADI VOWEL SIGN AA..KHUDAWADI VOWEL SIGN II +112E3..112E8 ; Vowel_Dependent # Mn [6] KHUDAWADI VOWEL SIGN U..KHUDAWADI VOWEL SIGN AU +1133E..1133F ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I +11340 ; Vowel_Dependent # Mn GRANTHA VOWEL SIGN II +11341..11344 ; Vowel_Dependent # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR +11347..11348 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL 
SIGN AI +1134B..1134C ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN OO..GRANTHA VOWEL SIGN AU +11357 ; Vowel_Dependent # Mc GRANTHA AU LENGTH MARK +11362..11363 ; Vowel_Dependent # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL +11435..11437 ; Vowel_Dependent # Mc [3] NEWA VOWEL SIGN AA..NEWA VOWEL SIGN II +11438..1143F ; Vowel_Dependent # Mn [8] NEWA VOWEL SIGN U..NEWA VOWEL SIGN AI +11440..11441 ; Vowel_Dependent # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU +114B0..114B2 ; Vowel_Dependent # Mc [3] TIRHUTA VOWEL SIGN AA..TIRHUTA VOWEL SIGN II +114B3..114B8 ; Vowel_Dependent # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL +114B9 ; Vowel_Dependent # Mc TIRHUTA VOWEL SIGN E +114BA ; Vowel_Dependent # Mn TIRHUTA VOWEL SIGN SHORT E +114BB..114BE ; Vowel_Dependent # Mc [4] TIRHUTA VOWEL SIGN AI..TIRHUTA VOWEL SIGN AU +115AF..115B1 ; Vowel_Dependent # Mc [3] SIDDHAM VOWEL SIGN AA..SIDDHAM VOWEL SIGN II +115B2..115B5 ; Vowel_Dependent # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR +115B8..115BB ; Vowel_Dependent # Mc [4] SIDDHAM VOWEL SIGN E..SIDDHAM VOWEL SIGN AU +115DC..115DD ; Vowel_Dependent # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU +11630..11632 ; Vowel_Dependent # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II +11633..1163A ; Vowel_Dependent # Mn [8] MODI VOWEL SIGN U..MODI VOWEL SIGN AI +1163B..1163C ; Vowel_Dependent # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU +11640 ; Vowel_Dependent # Mn MODI SIGN ARDHACANDRA +116AD ; Vowel_Dependent # Mn TAKRI VOWEL SIGN AA +116AE..116AF ; Vowel_Dependent # Mc [2] TAKRI VOWEL SIGN I..TAKRI VOWEL SIGN II +116B0..116B5 ; Vowel_Dependent # Mn [6] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN AU +11720..11721 ; Vowel_Dependent # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA +11722..11725 ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN I..AHOM VOWEL SIGN UU +11726 ; Vowel_Dependent # Mc AHOM VOWEL SIGN E +11727..1172A ; Vowel_Dependent # Mn [4] AHOM VOWEL SIGN 
AW..AHOM VOWEL SIGN AM +11C2F ; Vowel_Dependent # Mc BHAIKSUKI VOWEL SIGN AA +11C30..11C36 ; Vowel_Dependent # Mn [7] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN VOCALIC L +11C38..11C3B ; Vowel_Dependent # Mn [4] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI VOWEL SIGN AU +11CB0 ; Vowel_Dependent # Mn MARCHEN VOWEL SIGN AA +11CB1 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN I +11CB2..11CB3 ; Vowel_Dependent # Mn [2] MARCHEN VOWEL SIGN U..MARCHEN VOWEL SIGN E +11CB4 ; Vowel_Dependent # Mc MARCHEN VOWEL SIGN O + +# ================================================ + +# Indic_Syllabic_Category=Vowel + +# (Other) Vowels (reanalyzed as ordinary alphabetic letters or marks) + +# [Not derivable] + +1963..196D ; Vowel # Lo [11] TAI LE LETTER A..TAI LE LETTER AI +A85E..A861 ; Vowel # Lo [4] PHAGS-PA LETTER I..PHAGS-PA LETTER O +A866 ; Vowel # Lo PHAGS-PA LETTER EE +A922..A925 ; Vowel # Lo [4] KAYAH LI LETTER A..KAYAH LI LETTER OO +A926..A92A ; Vowel # Mn [5] KAYAH LI VOWEL UE..KAYAH LI VOWEL O +11150..11154 ; Vowel # Lo [5] MAHAJANI LETTER A..MAHAJANI LETTER O + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Placeholder + +# Consonant Placeholder +# This includes generic placeholders used for +# Indic script layout (NBSP and dotted circle), as well as a few script- +# specific vowel-holder characters which are not technically +# consonants, but serve instead as bases for placement of vowel marks. 
+ +# [Not derivable] + +002D ; Consonant_Placeholder # Pd HYPHEN-MINUS +00A0 ; Consonant_Placeholder # Zs NO-BREAK SPACE +00D7 ; Consonant_Placeholder # Sm MULTIPLICATION SIGN +0A72..0A73 ; Consonant_Placeholder # Lo [2] GURMUKHI IRI..GURMUKHI URA +104E ; Consonant_Placeholder # Po MYANMAR SYMBOL AFOREMENTIONED +1900 ; Consonant_Placeholder # Lo LIMBU VOWEL-CARRIER LETTER +2010..2014 ; Consonant_Placeholder # Pd [5] HYPHEN..EM DASH +25CC ; Consonant_Placeholder # So DOTTED CIRCLE +AA74..AA76 ; Consonant_Placeholder # Lo [3] MYANMAR LOGOGRAM KHAMTI OAY..MYANMAR LOGOGRAM KHAMTI HM + +# ================================================ + +# Indic_Syllabic_Category=Consonant + +# Consonant (ordinary abugida consonants, with inherent vowels) + +# [Not derivable] + +0915..0939 ; Consonant # Lo [37] DEVANAGARI LETTER KA..DEVANAGARI LETTER HA +0958..095F ; Consonant # Lo [8] DEVANAGARI LETTER QA..DEVANAGARI LETTER YYA +0978..097F ; Consonant # Lo [8] DEVANAGARI LETTER MARWARI DDA..DEVANAGARI LETTER BBA +0995..09A8 ; Consonant # Lo [20] BENGALI LETTER KA..BENGALI LETTER NA +09AA..09B0 ; Consonant # Lo [7] BENGALI LETTER PA..BENGALI LETTER RA +09B2 ; Consonant # Lo BENGALI LETTER LA +09B6..09B9 ; Consonant # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA +09DC..09DD ; Consonant # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA +09DF ; Consonant # Lo BENGALI LETTER YYA +09F0..09F1 ; Consonant # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH LOWER DIAGONAL +0A15..0A28 ; Consonant # Lo [20] GURMUKHI LETTER KA..GURMUKHI LETTER NA +0A2A..0A30 ; Consonant # Lo [7] GURMUKHI LETTER PA..GURMUKHI LETTER RA +0A32..0A33 ; Consonant # Lo [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA +0A35..0A36 ; Consonant # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA +0A38..0A39 ; Consonant # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA +0A59..0A5C ; Consonant # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA +0A5E ; Consonant # Lo GURMUKHI LETTER FA +0A95..0AA8 ; Consonant # Lo 
[20] GUJARATI LETTER KA..GUJARATI LETTER NA +0AAA..0AB0 ; Consonant # Lo [7] GUJARATI LETTER PA..GUJARATI LETTER RA +0AB2..0AB3 ; Consonant # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA +0AB5..0AB9 ; Consonant # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA +0AF9 ; Consonant # Lo GUJARATI LETTER ZHA +0B15..0B28 ; Consonant # Lo [20] ORIYA LETTER KA..ORIYA LETTER NA +0B2A..0B30 ; Consonant # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA +0B32..0B33 ; Consonant # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA +0B35..0B39 ; Consonant # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA +0B5C..0B5D ; Consonant # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA +0B5F ; Consonant # Lo ORIYA LETTER YYA +0B71 ; Consonant # Lo ORIYA LETTER WA +0B95 ; Consonant # Lo TAMIL LETTER KA +0B99..0B9A ; Consonant # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA +0B9C ; Consonant # Lo TAMIL LETTER JA +0B9E..0B9F ; Consonant # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA +0BA3..0BA4 ; Consonant # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA +0BA8..0BAA ; Consonant # Lo [3] TAMIL LETTER NA..TAMIL LETTER PA +0BAE..0BB9 ; Consonant # Lo [12] TAMIL LETTER MA..TAMIL LETTER HA +0C15..0C28 ; Consonant # Lo [20] TELUGU LETTER KA..TELUGU LETTER NA +0C2A..0C39 ; Consonant # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C58..0C5A ; Consonant # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C95..0CA8 ; Consonant # Lo [20] KANNADA LETTER KA..KANNADA LETTER NA +0CAA..0CB3 ; Consonant # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA +0CB5..0CB9 ; Consonant # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA +0CDE ; Consonant # Lo KANNADA LETTER FA +0D15..0D3A ; Consonant # Lo [38] MALAYALAM LETTER KA..MALAYALAM LETTER TTTA +0D9A..0DB1 ; Consonant # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA +0DB3..0DBB ; Consonant # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA +0DBD ; Consonant # Lo SINHALA LETTER DANTAJA LAYANNA +0DC0..0DC6 ; Consonant # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA 
+0E01..0E2E ; Consonant # Lo [46] THAI CHARACTER KO KAI..THAI CHARACTER HO NOKHUK +0E81..0E82 ; Consonant # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG +0E84 ; Consonant # Lo LAO LETTER KHO TAM +0E87..0E88 ; Consonant # Lo [2] LAO LETTER NGO..LAO LETTER CO +0E8A ; Consonant # Lo LAO LETTER SO TAM +0E8D ; Consonant # Lo LAO LETTER NYO +0E94..0E97 ; Consonant # Lo [4] LAO LETTER DO..LAO LETTER THO TAM +0E99..0E9F ; Consonant # Lo [7] LAO LETTER NO..LAO LETTER FO SUNG +0EA1..0EA3 ; Consonant # Lo [3] LAO LETTER MO..LAO LETTER LO LING +0EA5 ; Consonant # Lo LAO LETTER LO LOOT +0EA7 ; Consonant # Lo LAO LETTER WO +0EAA..0EAB ; Consonant # Lo [2] LAO LETTER SO SUNG..LAO LETTER HO SUNG +0EAD..0EAE ; Consonant # Lo [2] LAO LETTER O..LAO LETTER HO TAM +0EDC..0EDF ; Consonant # Lo [4] LAO HO NO..LAO LETTER KHMU NYO +0F40..0F47 ; Consonant # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA +0F49..0F6C ; Consonant # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA +1000..1020 ; Consonant # Lo [33] MYANMAR LETTER KA..MYANMAR LETTER LLA +103F ; Consonant # Lo MYANMAR LETTER GREAT SA +1050..1051 ; Consonant # Lo [2] MYANMAR LETTER SHA..MYANMAR LETTER SSA +105A..105D ; Consonant # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE +1061 ; Consonant # Lo MYANMAR LETTER SGAW KAREN SHA +1065..1066 ; Consonant # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER WESTERN PWO KAREN PWA +106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA +1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA +108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA +1703..170C ; Consonant # Lo [10] TAGALOG LETTER KA..TAGALOG LETTER YA +170E..1711 ; Consonant # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1723..1731 ; Consonant # Lo [15] HANUNOO LETTER KA..HANUNOO LETTER HA +1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA +1763..176C ; Consonant # Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA +176E..1770 
; Consonant # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA +1780..17A2 ; Consonant # Lo [35] KHMER LETTER KA..KHMER LETTER QA +1901..191E ; Consonant # Lo [30] LIMBU LETTER KA..LIMBU LETTER TRA +1950..1962 ; Consonant # Lo [19] TAI LE LETTER KA..TAI LE LETTER NA +1980..19AB ; Consonant # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI LUE LETTER LOW SUA +1A00..1A16 ; Consonant # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA +1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA +1A53..1A54 ; Consonant # Lo [2] TAI THAM LETTER LAE..TAI THAM LETTER GREAT SA +1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA +1B45..1B4B ; Consonant # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA +1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA +1BBB..1BBD ; Consonant # Lo [3] SUNDANESE LETTER REU..SUNDANESE LETTER BHA +1BC0..1BE3 ; Consonant # Lo [36] BATAK LETTER A..BATAK LETTER MBA +1C00..1C23 ; Consonant # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A +1C4D..1C4F ; Consonant # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA +A807..A80A ; Consonant # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO +A80C..A822 ; Consonant # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO +A840..A85D ; Consonant # Lo [30] PHAGS-PA LETTER KA..PHAGS-PA LETTER A +A862..A865 ; Consonant # Lo [4] PHAGS-PA LETTER QA..PHAGS-PA LETTER GGA +A869..A870 ; Consonant # Lo [8] PHAGS-PA LETTER TTA..PHAGS-PA LETTER ASPIRATED FA +A872 ; Consonant # Lo PHAGS-PA SUPERFIXED LETTER RA +A892..A8B3 ; Consonant # Lo [34] SAURASHTRA LETTER KA..SAURASHTRA LETTER LLA +A90A..A921 ; Consonant # Lo [24] KAYAH LI LETTER KA..KAYAH LI LETTER CA +A930..A946 ; Consonant # Lo [23] REJANG LETTER KA..REJANG LETTER A +A989..A98B ; Consonant # Lo [3] JAVANESE LETTER PA CEREK..JAVANESE LETTER NGA LELET RASWADI +A98F..A9B2 ; Consonant # Lo [36] JAVANESE LETTER KA..JAVANESE 
LETTER HA +A9E0..A9E4 ; Consonant # Lo [5] MYANMAR LETTER SHAN GHA..MYANMAR LETTER SHAN BHA +A9E7..A9EF ; Consonant # Lo [9] MYANMAR LETTER TAI LAING NYA..MYANMAR LETTER TAI LAING NNA +A9FA..A9FE ; Consonant # Lo [5] MYANMAR LETTER TAI LAING LLA..MYANMAR LETTER TAI LAING BHA +AA06..AA28 ; Consonant # Lo [35] CHAM LETTER KA..CHAM LETTER HA +AA60..AA6F ; Consonant # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA +AA71..AA73 ; Consonant # Lo [3] MYANMAR LETTER KHAMTI XA..MYANMAR LETTER KHAMTI RA +AA7A ; Consonant # Lo MYANMAR LETTER AITON RA +AA7E..AA7F ; Consonant # Lo [2] MYANMAR LETTER SHWE PALAUNG CHA..MYANMAR LETTER SHWE PALAUNG SHA +AA80..AAAF ; Consonant # Lo [48] TAI VIET LETTER LOW KO..TAI VIET LETTER HIGH O +AAE2..AAEA ; Consonant # Lo [9] MEETEI MAYEK LETTER CHA..MEETEI MAYEK LETTER SSA +ABC0..ABCD ; Consonant # Lo [14] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER HUK +ABD0 ; Consonant # Lo MEETEI MAYEK LETTER PHAM +ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTER BHAM +10A00 ; Consonant # Lo KHAROSHTHI LETTER A +10A10..10A13 ; Consonant # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA +10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA +10A19..10A33 ; Consonant # Lo [27] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER TTTHA +11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER OLD TAMIL NNNA +1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA +11107..11126 ; Consonant # Lo [32] CHAKMA LETTER KAA..CHAKMA LETTER HAA +11155..11172 ; Consonant # Lo [30] MAHAJANI LETTER KA..MAHAJANI LETTER RRA +11191..111B2 ; Consonant # Lo [34] SHARADA LETTER KA..SHARADA LETTER HA +11208..11211 ; Consonant # Lo [10] KHOJKI LETTER KA..KHOJKI LETTER JJA +11213..1122B ; Consonant # Lo [25] KHOJKI LETTER NYA..KHOJKI LETTER LLA +11284..11286 ; Consonant # Lo [3] MULTANI LETTER KA..MULTANI LETTER GA +11288 ; Consonant # Lo MULTANI LETTER GHA +1128A..1128D ; Consonant # Lo [4] MULTANI 
LETTER CA..MULTANI LETTER JJA +1128F..1129D ; Consonant # Lo [15] MULTANI LETTER NYA..MULTANI LETTER BA +1129F..112A8 ; Consonant # Lo [10] MULTANI LETTER BHA..MULTANI LETTER RHA +112BA..112DE ; Consonant # Lo [37] KHUDAWADI LETTER KA..KHUDAWADI LETTER HA +11315..11328 ; Consonant # Lo [20] GRANTHA LETTER KA..GRANTHA LETTER NA +1132A..11330 ; Consonant # Lo [7] GRANTHA LETTER PA..GRANTHA LETTER RA +11332..11333 ; Consonant # Lo [2] GRANTHA LETTER LA..GRANTHA LETTER LLA +11335..11339 ; Consonant # Lo [5] GRANTHA LETTER VA..GRANTHA LETTER HA +1140E..11434 ; Consonant # Lo [39] NEWA LETTER KA..NEWA LETTER HA +1148F..114AF ; Consonant # Lo [33] TIRHUTA LETTER KA..TIRHUTA LETTER HA +1158E..115AE ; Consonant # Lo [33] SIDDHAM LETTER KA..SIDDHAM LETTER HA +1160E..1162F ; Consonant # Lo [34] MODI LETTER KA..MODI LETTER LLA +1168A..116AA ; Consonant # Lo [33] TAKRI LETTER KA..TAKRI LETTER RRA +11700..11719 ; Consonant # Lo [26] AHOM LETTER KA..AHOM LETTER JHA +11C0E..11C2E ; Consonant # Lo [33] BHAIKSUKI LETTER KA..BHAIKSUKI LETTER HA +11C72..11C8F ; Consonant # Lo [30] MARCHEN LETTER KA..MARCHEN LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Dead + +# Dead Consonant (special consonant with killed vowel) + +# [Not derivable] + +09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0D54..0D56 ; Consonant_Dead # Lo [3] MALAYALAM LETTER CHILLU M..MALAYALAM LETTER CHILLU LLL +0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K + +# ================================================ + +# Indic_Syllabic_Category=Consonant_With_Stacker + +# Consonants that may make stacked ligatures with the next consonant +# without the use of a virama + +# [Not derivable] + +0CF1..0CF2 ; Consonant_With_Stacker # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA +11003..11004 ; Consonant_With_Stacker # Lo [2] BRAHMI SIGN JIHVAMULIYA..BRAHMI SIGN UPADHMANIYA + +# 
================================================ + +# Indic_Syllabic_Category=Consonant_Prefixed + +# Cluster-intial consonants + +# [Not derivable] + +111C2..111C3 ; Consonant_Prefixed # Lo [2] SHARADA SIGN JIHVAMULIYA..SHARADA SIGN UPADHMANIYA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Preceding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when preceding the main consonant + +# [Not derivable] + +0D4E ; Consonant_Preceding_Repha # Lo MALAYALAM LETTER DOT REPH + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Succeeding_Repha + +# Repha Form of RA (reanalyzed in some scripts), when succeeding the main consonant + +# [Not derivable] + +17CC ; Consonant_Succeeding_Repha # Mn KHMER SIGN ROBAT +1B03 ; Consonant_Succeeding_Repha # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Succeeding_Repha # Mn SUNDANESE SIGN PANGLAYAR +A982 ; Consonant_Succeeding_Repha # Mn JAVANESE SIGN LAYAR + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Subjoined + +# Subjoined Consonant (C2 form subtending a base consonant in Tibetan, etc.) 
+ +# [Not derivable] + +0F8D..0F97 ; Consonant_Subjoined # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA +0F99..0FBC ; Consonant_Subjoined # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA +1929..192B ; Consonant_Subjoined # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA +1BA1 ; Consonant_Subjoined # Mc SUNDANESE CONSONANT SIGN PAMINGKAL +1BA2..1BA3 ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE CONSONANT SIGN PANYIKU +1BAC..1BAD ; Consonant_Subjoined # Mn [2] SUNDANESE CONSONANT SIGN PASANGAN MA..SUNDANESE CONSONANT SIGN PASANGAN WA +1C24..1C25 ; Consonant_Subjoined # Mc [2] LEPCHA SUBJOINED LETTER YA..LEPCHA SUBJOINED LETTER RA +A867..A868 ; Consonant_Subjoined # Lo [2] PHAGS-PA SUBJOINED LETTER WA..PHAGS-PA SUBJOINED LETTER YA +A871 ; Consonant_Subjoined # Lo PHAGS-PA SUBJOINED LETTER RA +A9BD ; Consonant_Subjoined # Mc JAVANESE CONSONANT SIGN KERET +11C92..11CA7 ; Consonant_Subjoined # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA +11CA9 ; Consonant_Subjoined # Mc MARCHEN SUBJOINED LETTER YA +11CAA..11CAF ; Consonant_Subjoined # Mn [6] MARCHEN SUBJOINED LETTER RA..MARCHEN SUBJOINED LETTER A + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Medial + +# Medial Consonant (medial liquid, occurring in clusters) + +# [Not derivable] + +0A75 ; Consonant_Medial # Mn GURMUKHI SIGN YAKASH +0EBC ; Consonant_Medial # Mn LAO SEMIVOWEL SIGN LO +0EBD ; Consonant_Medial # Lo LAO SEMIVOWEL SIGN NYO +103B..103C ; Consonant_Medial # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA +103D..103E ; Consonant_Medial # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA +105E..1060 ; Consonant_Medial # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA +1082 ; Consonant_Medial # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA +1A55 ; Consonant_Medial # Mc TAI 
THAM CONSONANT SIGN MEDIAL RA +1A56 ; Consonant_Medial # Mn TAI THAM CONSONANT SIGN MEDIAL LA +A9BE..A9BF ; Consonant_Medial # Mc [2] JAVANESE CONSONANT SIGN PENGKAL..JAVANESE CONSONANT SIGN CAKRA +AA33..AA34 ; Consonant_Medial # Mc [2] CHAM CONSONANT SIGN YA..CHAM CONSONANT SIGN RA +AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA +1171D..1171F ; Consonant_Medial # Mn [3] AHOM CONSONANT SIGN MEDIAL LA..AHOM CONSONANT SIGN MEDIAL LIGATING RA + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Final + +# Final Consonant (special final forms which do not take vowels) + +# [Not derivable] + +1930..1931 ; Consonant_Final # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA +1933..1938 ; Consonant_Final # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA +1939 ; Consonant_Final # Mn LIMBU SIGN MUKPHRENG +19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B +1A57 ; Consonant_Final # Mc TAI THAM CONSONANT SIGN LA TANG LAI +1A58..1A5E ; Consonant_Final # Mn [7] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN SA +1BBE..1BBF ; Consonant_Final # Lo [2] SUNDANESE LETTER FINAL K..SUNDANESE LETTER FINAL M +1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H +1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T +A8B4 ; Consonant_Final # Mc SAURASHTRA CONSONANT SIGN HAARU +A94F..A951 ; Consonant_Final # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R +A952 ; Consonant_Final # Mc REJANG CONSONANT SIGN H +AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG +AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG +AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS +AA4C ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL M +AA4D ; Consonant_Final # Mc CHAM CONSONANT SIGN FINAL H +ABDB..ABE2 ; Consonant_Final # Lo [8] MEETEI MAYEK 
LETTER KOK LONSUM..MEETEI MAYEK LETTER I LONSUM + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Head_Letter + +# Head Letter (Tibetan) + +# [Not derivable] + +0F88..0F8C ; Consonant_Head_Letter # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN + +# ================================================ + +# Indic_Syllabic_Category=Modifying_Letter + +# Reanalyzed letters not participating in the abugida structure, but +# serving to modify the sound of an adjacent vowel or consonant. +# Note that this is not the same as General_Category=Modifier_Letter. + +# [Not derivable] + +0B83 ; Modifying_Letter # Lo TAMIL SIGN VISARGA + +# ================================================ + +# Indic_Syllabic_Category=Tone_Letter + +# Tone Letter (spacing lexical tone mark with status as a letter) + +# [Not derivable] + +1970..1974 ; Tone_Letter # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6 +AAC0 ; Tone_Letter # Lo TAI VIET TONE MAI NUENG +AAC2 ; Tone_Letter # Lo TAI VIET TONE MAI SONG + +# ================================================ + +# Indic_Syllabic_Category=Tone_Mark + +# Tone Mark (nonspacing or spacing lexical tone mark) + +# [Not derivable] + +0E48..0E4B ; Tone_Mark # Mn [4] THAI CHARACTER MAI EK..THAI CHARACTER MAI CHATTAWA +0EC8..0ECB ; Tone_Mark # Mn [4] LAO TONE MAI EK..LAO TONE MAI CATAWA +1037 ; Tone_Mark # Mn MYANMAR SIGN DOT BELOW +1063..1064 ; Tone_Mark # Mc [2] MYANMAR TONE MARK SGAW KAREN HATHI..MYANMAR TONE MARK SGAW KAREN KE PHO +1069..106D ; Tone_Mark # Mc [5] MYANMAR SIGN WESTERN PWO KAREN TONE-1..MYANMAR SIGN WESTERN PWO KAREN TONE-5 +1087..108C ; Tone_Mark # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 +108D ; Tone_Mark # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE +108F ; Tone_Mark # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 +109A..109B ; Tone_Mark # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 +19C8..19C9 ; Tone_Mark # Lo [2] NEW TAI LUE TONE MARK-1..NEW 
TAI LUE TONE MARK-2 +1A75..1A79 ; Tone_Mark # Mn [5] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN TONE-5 +A92B..A92D ; Tone_Mark # Mn [3] KAYAH LI TONE PLOPHU..KAYAH LI TONE CALYA PLOPHU +AA7B ; Tone_Mark # Mc MYANMAR SIGN PAO KAREN TONE +AA7C ; Tone_Mark # Mn MYANMAR SIGN TAI LAING TONE-2 +AA7D ; Tone_Mark # Mc MYANMAR SIGN TAI LAING TONE-5 +AABF ; Tone_Mark # Mn TAI VIET TONE MAI EK +AAC1 ; Tone_Mark # Mn TAI VIET TONE MAI THO +ABEC ; Tone_Mark # Mc MEETEI MAYEK LUM IYEK + +# ================================================ + +# Indic_Syllabic_Category=Gemination_Mark + +# Gemination Mark (doubling of the preceding or following consonant) + +# [Not derivable] + +0A71 ; Gemination_Mark # Mn GURMUKHI ADDAK +11237 ; Gemination_Mark # Mn KHOJKI SIGN SHADDA + +# ================================================ + +# Indic_Syllabic_Category=Cantillation_Mark + +# Cantillation Mark (recitation marks, such as svara markers for the Samaveda) + +# [Not derivable] + +0951..0952 ; Cantillation_Mark # Mn [2] DEVANAGARI STRESS SIGN UDATTA..DEVANAGARI STRESS SIGN ANUDATTA +1CD0..1CD2 ; Cantillation_Mark # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA +1CD4..1CE0 ; Cantillation_Mark # Mn [13] VEDIC SIGN YAJURVEDIC MIDLINE SVARITA..VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA +1CE1 ; Cantillation_Mark # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA +1CF4 ; Cantillation_Mark # Mn VEDIC TONE CANDRA ABOVE +1CF8..1CF9 ; Cantillation_Mark # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE +A8E0..A8F1 ; Cantillation_Mark # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA +1123E ; Cantillation_Mark # Mn KHOJKI SIGN SUKUN +11366..1136C ; Cantillation_Mark # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX +11370..11374 ; Cantillation_Mark # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA + +# ================================================ + +# Indic_Syllabic_Category=Register_Shifter + +# Register Shifter (shifts 
register for consonants, akin to a tone mark) + +# [Not derivable] + +17C9..17CA ; Register_Shifter # Mn [2] KHMER SIGN MUUSIKATOAN..KHMER SIGN TRIISAP + +# ================================================ + +# Indic_Syllabic_Category=Syllable_Modifier + +# Syllable Modifier (miscellaneous combining characters that modify +# something in the orthographic syllable they succeed) + +# [Not derivable] + +00B2..00B3 ; Syllable_Modifier # No [2] SUPERSCRIPT TWO..SUPERSCRIPT THREE +0F35 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG NYI ZLA +0F37 ; Syllable_Modifier # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS +0FC6 ; Syllable_Modifier # Mn TIBETAN SYMBOL PADMA GDAN +17CB ; Syllable_Modifier # Mn KHMER SIGN BANTOC +17CE..17D0 ; Syllable_Modifier # Mn [3] KHMER SIGN KAKABAT..KHMER SIGN SAMYOK SANNYA +17D3 ; Syllable_Modifier # Mn KHMER SIGN BATHAMASAT +17DD ; Syllable_Modifier # Mn KHMER SIGN ATTHACAN +193B ; Syllable_Modifier # Mn LIMBU SIGN SA-I +1A7A..1A7C ; Syllable_Modifier # Mn [3] TAI THAM SIGN RA HAAM..TAI THAM SIGN KHUEN-LUE KARAN +1A7F ; Syllable_Modifier # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT +1C36 ; Syllable_Modifier # Mn LEPCHA SIGN RAN +1DFB ; Syllable_Modifier # Mn COMBINING DELETION MARK +2074 ; Syllable_Modifier # No SUPERSCRIPT FOUR +2082..2084 ; Syllable_Modifier # No [3] SUBSCRIPT TWO..SUBSCRIPT FOUR + +# ================================================ + +# Indic_Syllabic_Category=Consonant_Killer + +# Consonant Killer (signifies that the previous consonant or consonants are +# not pronounced) + +# [Not derivable] + +0E4C ; Consonant_Killer # Mn THAI CHARACTER THANTHAKHAT +17CD ; Consonant_Killer # Mn KHMER SIGN TOANDAKHIAT + +# ================================================ + +# Indic_Syllabic_Category=Non_Joiner + +# Non_Joiner (Zero Width Non-Joiner) + +# [Not derivable] + +200C ; Non_Joiner # Cf ZERO WIDTH NON-JOINER + +# ================================================ + +# Indic_Syllabic_Category=Joiner + +# Joiner (Zero Width Joiner) + +# [Not 
derivable] + +200D ; Joiner # Cf ZERO WIDTH JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number_Joiner + +# Number_Joiner (forms ligatures between numbers for multiplication) + +# [Not derivable] + +1107F ; Number_Joiner # Mn BRAHMI NUMBER JOINER + +# ================================================ + +# Indic_Syllabic_Category=Number + +# Number (can be used as vowel-holders like consonant placeholders) + +# [Not derivable] + +0030..0039 ; Number # Nd [10] DIGIT ZERO..DIGIT NINE +0966..096F ; Number # Nd [10] DEVANAGARI DIGIT ZERO..DEVANAGARI DIGIT NINE +09E6..09EF ; Number # Nd [10] BENGALI DIGIT ZERO..BENGALI DIGIT NINE +0A66..0A6F ; Number # Nd [10] GURMUKHI DIGIT ZERO..GURMUKHI DIGIT NINE +0AE6..0AEF ; Number # Nd [10] GUJARATI DIGIT ZERO..GUJARATI DIGIT NINE +0B66..0B6F ; Number # Nd [10] ORIYA DIGIT ZERO..ORIYA DIGIT NINE +0BE6..0BEF ; Number # Nd [10] TAMIL DIGIT ZERO..TAMIL DIGIT NINE +0C66..0C6F ; Number # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE +0CE6..0CEF ; Number # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE +0D66..0D6F ; Number # Nd [10] MALAYALAM DIGIT ZERO..MALAYALAM DIGIT NINE +0DE6..0DEF ; Number # Nd [10] SINHALA LITH DIGIT ZERO..SINHALA LITH DIGIT NINE +0E50..0E59 ; Number # Nd [10] THAI DIGIT ZERO..THAI DIGIT NINE +0ED0..0ED9 ; Number # Nd [10] LAO DIGIT ZERO..LAO DIGIT NINE +0F20..0F29 ; Number # Nd [10] TIBETAN DIGIT ZERO..TIBETAN DIGIT NINE +0F2A..0F33 ; Number # No [10] TIBETAN DIGIT HALF ONE..TIBETAN DIGIT HALF ZERO +1040..1049 ; Number # Nd [10] MYANMAR DIGIT ZERO..MYANMAR DIGIT NINE +1090..1099 ; Number # Nd [10] MYANMAR SHAN DIGIT ZERO..MYANMAR SHAN DIGIT NINE +17E0..17E9 ; Number # Nd [10] KHMER DIGIT ZERO..KHMER DIGIT NINE +1946..194F ; Number # Nd [10] LIMBU DIGIT ZERO..LIMBU DIGIT NINE +19D0..19D9 ; Number # Nd [10] NEW TAI LUE DIGIT ZERO..NEW TAI LUE DIGIT NINE +1A80..1A89 ; Number # Nd [10] TAI THAM HORA DIGIT ZERO..TAI THAM HORA DIGIT NINE +1A90..1A99 ; Number # Nd [10] TAI 
THAM THAM DIGIT ZERO..TAI THAM THAM DIGIT NINE +1B50..1B59 ; Number # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE +1BB0..1BB9 ; Number # Nd [10] SUNDANESE DIGIT ZERO..SUNDANESE DIGIT NINE +1C40..1C49 ; Number # Nd [10] LEPCHA DIGIT ZERO..LEPCHA DIGIT NINE +A8D0..A8D9 ; Number # Nd [10] SAURASHTRA DIGIT ZERO..SAURASHTRA DIGIT NINE +A900..A909 ; Number # Nd [10] KAYAH LI DIGIT ZERO..KAYAH LI DIGIT NINE +A9D0..A9D9 ; Number # Nd [10] JAVANESE DIGIT ZERO..JAVANESE DIGIT NINE +A9F0..A9F9 ; Number # Nd [10] MYANMAR TAI LAING DIGIT ZERO..MYANMAR TAI LAING DIGIT NINE +AA50..AA59 ; Number # Nd [10] CHAM DIGIT ZERO..CHAM DIGIT NINE +ABF0..ABF9 ; Number # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE +10A40..10A47 ; Number # No [8] KHAROSHTHI DIGIT ONE..KHAROSHTHI NUMBER ONE THOUSAND +11066..1106F ; Number # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11136..1113F ; Number # Nd [10] CHAKMA DIGIT ZERO..CHAKMA DIGIT NINE +111D0..111D9 ; Number # Nd [10] SHARADA DIGIT ZERO..SHARADA DIGIT NINE +111E1..111F4 ; Number # No [20] SINHALA ARCHAIC DIGIT ONE..SINHALA ARCHAIC NUMBER ONE THOUSAND +112F0..112F9 ; Number # Nd [10] KHUDAWADI DIGIT ZERO..KHUDAWADI DIGIT NINE +11450..11459 ; Number # Nd [10] NEWA DIGIT ZERO..NEWA DIGIT NINE +114D0..114D9 ; Number # Nd [10] TIRHUTA DIGIT ZERO..TIRHUTA DIGIT NINE +11650..11659 ; Number # Nd [10] MODI DIGIT ZERO..MODI DIGIT NINE +116C0..116C9 ; Number # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE +11730..11739 ; Number # Nd [10] AHOM DIGIT ZERO..AHOM DIGIT NINE +1173A..1173B ; Number # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY +11C50..11C59 ; Number # Nd [10] BHAIKSUKI DIGIT ZERO..BHAIKSUKI DIGIT NINE +11C5A..11C6C ; Number # No [19] BHAIKSUKI NUMBER ONE..BHAIKSUKI HUNDREDS UNIT MARK + +# ================================================ + +# Indic_Syllabic_Category=Brahmi_Joining_Number + +# Brahmi Joining Number (similar to Number in that in can be used as +# vowel-holders like Consonant_Placeholder, but may also be joined by 
+# a Number_Joiner of the same script, e.g. in Brahmi) + +# [Not derivable] + +11052..11065 ; Brahmi_Joining_Number # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND + +# EOF diff --git a/data/resources.js b/data/resources.js index 1b9ac8b..966c3f7 100644 --- a/data/resources.js +++ b/data/resources.js @@ -285,6 +285,8 @@ const resources = [ 'case-folding': 'https://unicode.org/Public/6.0.0/ucd/CaseFolding.txt', 'special-casing': 'https://unicode.org/Public/6.0.0/ucd/SpecialCasing.txt', 'bidi-mirroring': 'https://unicode.org/Public/6.0.0/ucd/BidiMirroring.txt', + 'indic-positional-category': 'https://unicode.org/Public/6.0.0/ucd/IndicMatraCategory.txt', + 'indic-syllabic-category': 'https://unicode.org/Public/6.0.0/ucd/IndicSyllabicCategory.txt', 'line-break': 'https://unicode.org/Public/6.0.0/ucd/LineBreak.txt', 'grapheme-cluster-break': 'https://unicode.org/Public/6.0.0/ucd/auxiliary/GraphemeBreakProperty.txt', @@ -315,6 +317,8 @@ const resources = [ 'case-folding': 'https://unicode.org/Public/6.1.0/ucd/CaseFolding.txt', 'special-casing': 'https://unicode.org/Public/6.1.0/ucd/SpecialCasing.txt', 'bidi-mirroring': 'https://unicode.org/Public/6.1.0/ucd/BidiMirroring.txt', + 'indic-positional-category': 'https://unicode.org/Public/6.1.0/ucd/IndicMatraCategory.txt', + 'indic-syllabic-category': 'https://unicode.org/Public/6.1.0/ucd/IndicSyllabicCategory.txt', 'line-break': 'https://unicode.org/Public/6.1.0/ucd/LineBreak.txt', 'grapheme-cluster-break': 'https://unicode.org/Public/6.1.0/ucd/auxiliary/GraphemeBreakProperty.txt', @@ -345,6 +349,8 @@ const resources = [ 'case-folding': 'https://unicode.org/Public/6.2.0/ucd/CaseFolding.txt', 'special-casing': 'https://unicode.org/Public/6.2.0/ucd/SpecialCasing.txt', 'bidi-mirroring': 'https://unicode.org/Public/6.2.0/ucd/BidiMirroring.txt', + 'indic-positional-category': 'https://unicode.org/Public/6.2.0/ucd/IndicMatraCategory.txt', + 'indic-syllabic-category': 
'https://unicode.org/Public/6.2.0/ucd/IndicSyllabicCategory.txt', 'line-break': 'https://unicode.org/Public/6.2.0/ucd/LineBreak.txt', 'grapheme-cluster-break': 'https://unicode.org/Public/6.2.0/ucd/auxiliary/GraphemeBreakProperty.txt', @@ -376,6 +382,8 @@ const resources = [ 'special-casing': 'https://unicode.org/Public/6.3.0/ucd/SpecialCasing.txt', 'bidi-mirroring': 'https://unicode.org/Public/6.3.0/ucd/BidiMirroring.txt', 'bidi-brackets': 'https://unicode.org/Public/6.3.0/ucd/BidiBrackets.txt', + 'indic-positional-category': 'https://unicode.org/Public/6.3.0/ucd/IndicMatraCategory.txt', + 'indic-syllabic-category': 'https://unicode.org/Public/6.3.0/ucd/IndicSyllabicCategory.txt', 'line-break': 'https://unicode.org/Public/6.3.0/ucd/LineBreak.txt', 'grapheme-cluster-break': 'https://unicode.org/Public/6.3.0/ucd/auxiliary/GraphemeBreakProperty.txt', @@ -405,6 +413,8 @@ const resources = [ 'https://unicode.org/Public/7.0.0/ucd/CompositionExclusions.txt', 'case-folding': 'https://unicode.org/Public/7.0.0/ucd/CaseFolding.txt', 'special-casing': 'https://unicode.org/Public/7.0.0/ucd/SpecialCasing.txt', + 'indic-positional-category': 'https://unicode.org/Public/7.0.0/ucd/IndicMatraCategory.txt', + 'indic-syllabic-category': 'https://unicode.org/Public/7.0.0/ucd/IndicSyllabicCategory.txt', 'bidi-mirroring': 'https://unicode.org/Public/7.0.0/ucd/BidiMirroring.txt', 'bidi-brackets': 'https://unicode.org/Public/7.0.0/ucd/BidiBrackets.txt', 'line-break': 'https://unicode.org/Public/7.0.0/ucd/LineBreak.txt', @@ -438,6 +448,8 @@ const resources = [ 'special-casing': 'https://unicode.org/Public/8.0.0/ucd/SpecialCasing.txt', 'bidi-mirroring': 'https://unicode.org/Public/8.0.0/ucd/BidiMirroring.txt', 'bidi-brackets': 'https://unicode.org/Public/8.0.0/ucd/BidiBrackets.txt', + 'indic-positional-category': 'https://unicode.org/Public/8.0.0/ucd/IndicPositionalCategory.txt', + 'indic-syllabic-category': 'https://unicode.org/Public/8.0.0/ucd/IndicSyllabicCategory.txt', 'line-break': 
'https://unicode.org/Public/8.0.0/ucd/LineBreak.txt', 'grapheme-cluster-break': 'https://unicode.org/Public/8.0.0/ucd/auxiliary/GraphemeBreakProperty.txt', @@ -469,6 +481,8 @@ const resources = [ 'special-casing': 'https://unicode.org/Public/9.0.0/ucd/SpecialCasing.txt', 'bidi-mirroring': 'https://unicode.org/Public/9.0.0/ucd/BidiMirroring.txt', 'bidi-brackets': 'https://unicode.org/Public/9.0.0/ucd/BidiBrackets.txt', + 'indic-positional-category': 'https://unicode.org/Public/9.0.0/ucd/IndicPositionalCategory.txt', + 'indic-syllabic-category': 'https://unicode.org/Public/9.0.0/ucd/IndicSyllabicCategory.txt', 'line-break': 'https://unicode.org/Public/9.0.0/ucd/LineBreak.txt', 'grapheme-cluster-break': 'https://unicode.org/Public/9.0.0/ucd/auxiliary/GraphemeBreakProperty.txt', @@ -500,6 +514,8 @@ const resources = [ 'special-casing': 'https://unicode.org/Public/10.0.0/ucd/SpecialCasing.txt', 'bidi-mirroring': 'https://unicode.org/Public/10.0.0/ucd/BidiMirroring.txt', 'bidi-brackets': 'https://unicode.org/Public/10.0.0/ucd/BidiBrackets.txt', + 'indic-positional-category': 'https://unicode.org/Public/10.0.0/ucd/IndicPositionalCategory.txt', + 'indic-syllabic-category': 'https://unicode.org/Public/10.0.0/ucd/IndicSyllabicCategory.txt', 'line-break': 'https://unicode.org/Public/10.0.0/ucd/LineBreak.txt', 'grapheme-cluster-break': 'https://unicode.org/Public/10.0.0/ucd/auxiliary/GraphemeBreakProperty.txt', @@ -531,6 +547,8 @@ const resources = [ 'special-casing': 'https://unicode.org/Public/11.0.0/ucd/SpecialCasing.txt', 'bidi-mirroring': 'https://unicode.org/Public/11.0.0/ucd/BidiMirroring.txt', 'bidi-brackets': 'https://unicode.org/Public/11.0.0/ucd/BidiBrackets.txt', + 'indic-positional-category': 'https://unicode.org/Public/11.0.0/ucd/IndicPositionalCategory.txt', + 'indic-syllabic-category': 'https://unicode.org/Public/11.0.0/ucd/IndicSyllabicCategory.txt', 'line-break': 'https://unicode.org/Public/11.0.0/ucd/LineBreak.txt', 'grapheme-cluster-break': 
'https://unicode.org/Public/11.0.0/ucd/auxiliary/GraphemeBreakProperty.txt', @@ -572,6 +590,8 @@ const resources = [ 'special-casing': 'https://unicode.org/Public/12.0.0/ucd/SpecialCasing.txt', 'bidi-mirroring': 'https://unicode.org/Public/12.0.0/ucd/BidiMirroring.txt', 'bidi-brackets': 'https://unicode.org/Public/12.0.0/ucd/BidiBrackets.txt', + 'indic-positional-category': 'https://unicode.org/Public/12.0.0/ucd/IndicPositionalCategory.txt', + 'indic-syllabic-category': 'https://unicode.org/Public/12.0.0/ucd/IndicSyllabicCategory.txt', 'line-break': 'https://unicode.org/Public/12.0.0/ucd/LineBreak.txt', 'grapheme-cluster-break': 'https://unicode.org/Public/12.0.0/ucd/auxiliary/GraphemeBreakProperty.txt', @@ -613,6 +633,8 @@ const resources = [ 'special-casing': 'https://unicode.org/Public/12.1.0/ucd/SpecialCasing.txt', 'bidi-mirroring': 'https://unicode.org/Public/12.1.0/ucd/BidiMirroring.txt', 'bidi-brackets': 'https://unicode.org/Public/12.1.0/ucd/BidiBrackets.txt', + 'indic-positional-category': 'https://unicode.org/Public/12.1.0/ucd/IndicPositionalCategory.txt', + 'indic-syllabic-category': 'https://unicode.org/Public/12.1.0/ucd/IndicSyllabicCategory.txt', 'line-break': 'https://unicode.org/Public/12.1.0/ucd/LineBreak.txt', 'grapheme-cluster-break': 'https://unicode.org/Public/12.1.0/ucd/auxiliary/GraphemeBreakProperty.txt', @@ -654,6 +676,8 @@ const resources = [ 'special-casing': 'https://unicode.org/Public/13.0.0/ucd/SpecialCasing.txt', 'bidi-mirroring': 'https://unicode.org/Public/13.0.0/ucd/BidiMirroring.txt', 'bidi-brackets': 'https://unicode.org/Public/13.0.0/ucd/BidiBrackets.txt', + 'indic-positional-category': 'https://unicode.org/Public/13.0.0/ucd/IndicPositionalCategory.txt', + 'indic-syllabic-category': 'https://unicode.org/Public/13.0.0/ucd/IndicSyllabicCategory.txt', 'line-break': 'https://unicode.org/Public/13.0.0/ucd/LineBreak.txt', 'grapheme-cluster-break': 'https://unicode.org/Public/13.0.0/ucd/auxiliary/GraphemeBreakProperty.txt', @@ -695,6 
+719,8 @@ const resources = [ 'special-casing': 'https://unicode.org/Public/14.0.0/ucd/SpecialCasing.txt', 'bidi-mirroring': 'https://unicode.org/Public/14.0.0/ucd/BidiMirroring.txt', 'bidi-brackets': 'https://unicode.org/Public/14.0.0/ucd/BidiBrackets.txt', + 'indic-positional-category': 'https://unicode.org/Public/14.0.0/ucd/IndicPositionalCategory.txt', + 'indic-syllabic-category': 'https://unicode.org/Public/14.0.0/ucd/IndicSyllabicCategory.txt', 'line-break': 'https://unicode.org/Public/14.0.0/ucd/LineBreak.txt', 'grapheme-cluster-break': 'https://unicode.org/Public/14.0.0/ucd/auxiliary/GraphemeBreakProperty.txt', @@ -736,6 +762,8 @@ const resources = [ 'special-casing': 'https://unicode.org/Public/15.0.0/ucd/SpecialCasing.txt', 'bidi-mirroring': 'https://unicode.org/Public/15.0.0/ucd/BidiMirroring.txt', 'bidi-brackets': 'https://unicode.org/Public/15.0.0/ucd/BidiBrackets.txt', + 'indic-positional-category': 'https://unicode.org/Public/15.0.0/ucd/IndicPositionalCategory.txt', + 'indic-syllabic-category': 'https://unicode.org/Public/15.0.0/ucd/IndicSyllabicCategory.txt', 'line-break': 'https://unicode.org/Public/15.0.0/ucd/LineBreak.txt', 'grapheme-cluster-break': 'https://unicode.org/Public/15.0.0/ucd/auxiliary/GraphemeBreakProperty.txt', @@ -777,6 +805,8 @@ const resources = [ 'special-casing': 'https://unicode.org/Public/15.1.0/ucd/SpecialCasing.txt', 'bidi-mirroring': 'https://unicode.org/Public/15.1.0/ucd/BidiMirroring.txt', 'bidi-brackets': 'https://unicode.org/Public/15.1.0/ucd/BidiBrackets.txt', + 'indic-positional-category': 'https://unicode.org/Public/15.1.0/ucd/IndicPositionalCategory.txt', + 'indic-syllabic-category': 'https://unicode.org/Public/15.1.0/ucd/IndicSyllabicCategory.txt', 'line-break': 'https://unicode.org/Public/15.1.0/ucd/LineBreak.txt', 'grapheme-cluster-break': 'https://unicode.org/Public/15.1.0/ucd/auxiliary/GraphemeBreakProperty.txt', @@ -818,6 +848,8 @@ const resources = [ 'special-casing': 
'https://unicode.org/Public/16.0.0/ucd/SpecialCasing.txt', 'bidi-mirroring': 'https://unicode.org/Public/16.0.0/ucd/BidiMirroring.txt', 'bidi-brackets': 'https://unicode.org/Public/16.0.0/ucd/BidiBrackets.txt', + 'indic-positional-category': 'https://unicode.org/Public/16.0.0/ucd/IndicPositionalCategory.txt', + 'indic-syllabic-category': 'https://unicode.org/Public/16.0.0/ucd/IndicSyllabicCategory.txt', 'line-break': 'https://unicode.org/Public/16.0.0/ucd/LineBreak.txt', 'grapheme-cluster-break': 'https://unicode.org/Public/16.0.0/ucd/auxiliary/GraphemeBreakProperty.txt', @@ -859,6 +891,8 @@ const resources = [ 'special-casing': 'https://unicode.org/Public/17.0.0/ucd/SpecialCasing.txt', 'bidi-mirroring': 'https://unicode.org/Public/17.0.0/ucd/BidiMirroring.txt', 'bidi-brackets': 'https://unicode.org/Public/17.0.0/ucd/BidiBrackets.txt', + 'indic-positional-category': 'https://unicode.org/Public/17.0.0/ucd/IndicPositionalCategory.txt', + 'indic-syllabic-category': 'https://unicode.org/Public/17.0.0/ucd/IndicSyllabicCategory.txt', 'line-break': 'https://unicode.org/Public/17.0.0/ucd/LineBreak.txt', 'grapheme-cluster-break': 'https://unicode.org/Public/17.0.0/ucd/auxiliary/GraphemeBreakProperty.txt', diff --git a/index.js b/index.js index b16df33..4326ac4 100644 --- a/index.js +++ b/index.js @@ -8,6 +8,8 @@ parsers.parseBidiBrackets = require('./scripts/parse-bidi-brackets.js'); parsers.parseCaseFolding = require('./scripts/parse-case-folding.js'); parsers.parseBidiClass = require('./scripts/parse-bidi-class.js'); parsers.parseCompositionExclusions = require('./scripts/parse-composition-exclusions.js'); +parsers.parseIndicPositionalCategory = require('./scripts/parse-indic-positional-category.js'); +parsers.parseIndicSyllabicCategory = require('./scripts/parse-indic-syllabic-category.js'); parsers.parseLineBreak = require('./scripts/parse-line-break.js'); parsers.parseScriptExtensions = require('./scripts/parse-script-extensions.js'); parsers.parseSpecialCasing = 
require('./scripts/parse-special-casing.js'); @@ -120,6 +122,21 @@ const generateData = function(version) { 'map': parsers.parseBidiBrackets(version), 'type': 'Bidi_Paired_Bracket_Type' })); + { + const InPCName = +version.split(".")[0] >= 8 ? 'Indic_Positional_Category' : 'Indic_Matra_Category'; + console.log('Parsing Unicode v%s `%s`…', version, InPCName); + extend(dirMap, utils.writeFiles({ + 'version': version, + 'map': parsers.parseIndicPositionalCategory(version), + 'type': InPCName + })); + } + console.log('Parsing Unicode v%s `Indic_Syllabic_Category`…', version); + extend(dirMap, utils.writeFiles({ + 'version': version, + 'map': parsers.parseIndicSyllabicCategory(version), + 'type': 'Indic_Syllabic_Category' + })); console.log('Parsing Unicode v%s `Line_Break`…', version); extend(dirMap, utils.writeFiles({ 'version': version, diff --git a/scripts/download.js b/scripts/download.js index a79a1cc..f35a861 100644 --- a/scripts/download.js +++ b/scripts/download.js @@ -41,6 +41,8 @@ const TYPES = [ 'special-casing', 'bidi-mirroring', 'bidi-brackets', + 'indic-positional-category', + 'indic-syllabic-category', 'line-break', 'grapheme-cluster-break', 'word-break', diff --git a/scripts/parse-indic-positional-category.js b/scripts/parse-indic-positional-category.js new file mode 100644 index 0000000..54a963a --- /dev/null +++ b/scripts/parse-indic-positional-category.js @@ -0,0 +1,43 @@ +'use strict'; + +const utils = require('./utils.js'); +const regenerate = require('regenerate'); + +const parseIndicPositionalCategory = function(version) { + const source = utils.readDataFile(version, 'indic-positional-category'); + if (!source) { + return; + } + const NAKey = +version.split(".")[0] >= 17 ? 'Not_Applicable' : 'NA'; + const map = { + // All code points not explicitly listed for Indic_Positional_Category have the value Not_Applicable (NA). 
+ [NAKey]: regenerate().addRange(0, 0x10FFFF) + }; + const lines = source.split('\n'); + for (const line of lines) { + if (!line || /^#/.test(line)) { + continue; + } + const data = line.trim().split(';'); + const charRange = data[0].replace('..', '-').trim(); + const rangeParts = charRange.split('-'); + const value = data[1].split('#')[0].trim(); + const propertyValue = value; + map[propertyValue] ??= regenerate(); + if (rangeParts.length == 2) { + const [from, to] = [ + parseInt(rangeParts[0], 16), + parseInt(rangeParts[1], 16), + ]; + map[NAKey].removeRange(from, to); + map[propertyValue].addRange(from, to); + } else { + const codePoint = parseInt(charRange, 16); + map[NAKey].remove(codePoint); + map[propertyValue].add(codePoint); + } + } + return map; +}; + +module.exports = parseIndicPositionalCategory; diff --git a/scripts/parse-indic-syllabic-category.js b/scripts/parse-indic-syllabic-category.js new file mode 100644 index 0000000..7784fd5 --- /dev/null +++ b/scripts/parse-indic-syllabic-category.js @@ -0,0 +1,42 @@ +'use strict'; + +const utils = require('./utils.js'); +const regenerate = require('regenerate'); + +const parseIndicSyllabicCategory = function(version) { + const source = utils.readDataFile(version, 'indic-syllabic-category'); + if (!source) { + return; + } + const map = { + // All code points not explicitly listed for Indic_Syllabic_Category have the value Other. 
+ 'Other': regenerate().addRange(0, 0x10FFFF) + }; + const lines = source.split('\n'); + for (const line of lines) { + if (!line || /^#/.test(line)) { + continue; + } + const data = line.trim().split(';'); + const charRange = data[0].replace('..', '-').trim(); + const rangeParts = charRange.split('-'); + const value = data[1].split('#')[0].trim(); + const propertyValue = value; + map[propertyValue] ??= regenerate(); + if (rangeParts.length == 2) { + const [from, to] = [ + parseInt(rangeParts[0], 16), + parseInt(rangeParts[1], 16), + ]; + map['Other'].removeRange(from, to); + map[propertyValue].addRange(from, to); + } else { + const codePoint = parseInt(charRange, 16); + map['Other'].remove(codePoint); + map[propertyValue].add(codePoint); + } + } + return map; +}; + +module.exports = parseIndicSyllabicCategory;