* Added a unicode directory containing files from unicode.org

as well as extractors for the data.
This commit is contained in:
Abdulaziz Ghuloum 2007-05-19 22:09:30 -04:00
parent caa5eed9a0
commit a1879ccc57
32 changed files with 122092 additions and 24 deletions

Binary file not shown.

View File

@ -13,15 +13,31 @@
(define $write-char
(lambda (c p)
(let ([idx (port-output-index p)])
(if ($fx< idx ($port-output-size p))
(let ([b ($char->fixnum c)])
(if ($fx< b 128)
(begin
($bytevector-set! ($port-output-buffer p) idx b)
($set-port-output-index! p ($fxadd1 idx)))
(($port-handler p) 'write-char c p)))
(($port-handler p) 'write-char c p)))))
(let ([b ($char->fixnum c)])
(cond
[($fx<= b #x7F)
($write-byte b p)]
[($fx<= b #x7FF)
($write-byte
($fxlogor #b11000000 ($fxsra b 6)) p)
($write-byte
($fxlogor #b10000000 ($fxlogand b #b111111)) p)]
[($fx<= b #xFFFF)
($write-byte
($fxlogor #b11100000 ($fxsra b 12)) p)
($write-byte
($fxlogor #b10000000 ($fxlogand ($fxsra b 6) #b111111)) p)
($write-byte
($fxlogor #b10000000 ($fxlogand b #b111111)) p)]
[else
($write-byte
($fxlogor #b11110000 ($fxsra b 18)) p)
($write-byte
($fxlogor #b10000000 ($fxlogand ($fxsra b 12) #b111111)) p)
($write-byte
($fxlogor #b10000000 ($fxlogand ($fxsra b 6) #b111111)) p)
($write-byte
($fxlogor #b10000000 ($fxlogand b #b111111)) p)]))))
(define $write-byte
(lambda (b p)

View File

@ -105,20 +105,15 @@
(write-char #\8 p)
(write-char #\( p)
(let ([n ($bytevector-length x)])
(let ([i
(cond
[(fx> n 0)
(let f ([idx 1] [i (writer ($bytevector-u8-ref x 0) p m h i)])
(cond
[(fx= idx n)
i]
[else
(write-char #\space p)
(f (fxadd1 idx)
(writer (bytevector-u8-ref x idx) p m h i))]))]
[else i])])
(write-char #\) p)
i))))
(when (fx> n 0)
(write-fixnum ($bytevector-u8-ref x 0) p)
(let f ([idx 1] [n n] [x x] [p p])
(unless ($fx= idx n)
(write-char #\space p)
(write-fixnum ($bytevector-u8-ref x idx) p)
(f (fxadd1 idx) n x p)))))
(write-char #\) p)
i))
(define write-record
(lambda (x p m h i)
@ -270,7 +265,8 @@
[(in-map? b subsequents-map)
(write-char c p)]
[else
(write-inline-hex b p)]))))
(write-inline-hex b p)]))
(write-subsequent* str ($fxadd1 i) j p)))
(define write-symbol-hex-esc
(lambda (str p)

View File

@ -0,0 +1,338 @@
# ArabicShaping-5.0.0.txt
# Date: 2006-07-14, 11:23:00 PST [KW]
#
# This file is a normative contributory data file in the
# Unicode Character Database.
#
# Copyright (c) 1991-2006 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
#
# This file defines the shaping classes for Arabic and Syriac
# positional shaping, repeating in machine readable form the
# information printed in Tables 8-3, 8-7, 8-8, 8-11, 8-12, and
# 8-13 of The Unicode Standard, Version 4.0.
#
# See sections 8.2 and 8.3 of The Unicode Standard, Version 4.0
# for more information.
#
# Each line contains four fields, separated by a semicolon.
#
# Field 0: the code point, in 4-digit hexadecimal
# form, of an Arabic or Syriac character.
# Field 1: gives a short schematic name for that character,
# abbreviated from the normative Unicode character name.
# Field 2: defines the joining type (property name: Joining_Type)
# R Right_Joining
# L Left_Joining
# D Dual_Joining
# C Join_Causing
# U Non_Joining
# T Transparent
# See the Arabic block description for more information on these types.
# Field 3: defines the joining group (property name: Joining_Group)
#
# The values of the joining group are based schematically on character
# names. Where a schematic character name consists of two or more parts separated
# by spaces, the formal Joining_Group property value, as specified in
# PropertyValueAliases.txt, consists of the same name parts joined by
# underscores. Hence, the entry:
#
# 0629; TEH MARBUTA; R; TEH MARBUTA
#
# corresponds to [Joining_Group = Teh_Marbuta].
#
# Note: For historical reasons, the property value [Joining_Group = Hamza_On_Heh_Goal]
# is anachronistically named. It used to apply to both of the following characters
# in earlier versions of the standard:
#
# U+06C2 ARABIC LETTER HEH GOAL WITH HAMZA ABOVE
# U+06C3 ARABIC LETTER TEH MARBUTA GOAL
#
# However, it currently applies only to U+06C3, and *not* to U+06C2.
# To avoid destabilizing existing Joining_Group property aliases, the
# value Hamza_On_Heh_Goal has not been changed, despite the fact that it
# no longer applies to Hamza On Heh Goal, but only to Teh Marbuta Goal.
#
# Note: Code points that are not explicitly listed in this file are
# either of joining type T or U:
#
# - Those that are not explicitly listed and that are of General Category Mn, Me, or Cf
# have joining type T.
# - All others not explicitly listed have type U.
#
# For an explicit listing of characters of joining type T, see
# the derived property file DerivedJoiningType.txt.
#
# There are currently no characters of type L defined in Unicode.
#
# #############################################################
# Unicode; Schematic Name; Joining Type; Joining Group
# Arabic characters
0600; ARABIC NUMBER SIGN; U; No_Joining_Group
0601; ARABIC SIGN SANAH; U; No_Joining_Group
0602; ARABIC FOOTNOTE MARKER; U; No_Joining_Group
0603; ARABIC SIGN SAFHA; U; No_Joining_Group
060B; AFGHANI SIGN; U; No_Joining_Group
0621; HAMZA; U; No_Joining_Group
0622; MADDA ON ALEF; R; ALEF
0623; HAMZA ON ALEF; R; ALEF
0624; HAMZA ON WAW; R; WAW
0625; HAMZA UNDER ALEF; R; ALEF
0626; HAMZA ON YEH; D; YEH
0627; ALEF; R; ALEF
0628; BEH; D; BEH
0629; TEH MARBUTA; R; TEH MARBUTA
062A; TEH; D; BEH
062B; THEH; D; BEH
062C; JEEM; D; HAH
062D; HAH; D; HAH
062E; KHAH; D; HAH
062F; DAL; R; DAL
0630; THAL; R; DAL
0631; REH; R; REH
0632; ZAIN; R; REH
0633; SEEN; D; SEEN
0634; SHEEN; D; SEEN
0635; SAD; D; SAD
0636; DAD; D; SAD
0637; TAH; D; TAH
0638; ZAH; D; TAH
0639; AIN; D; AIN
063A; GHAIN; D; AIN
0640; TATWEEL; C; No_Joining_Group
0641; FEH; D; FEH
0642; QAF; D; QAF
0643; KAF; D; KAF
0644; LAM; D; LAM
0645; MEEM; D; MEEM
0646; NOON; D; NOON
0647; HEH; D; HEH
0648; WAW; R; WAW
0649; ALEF MAKSURA; D; YEH
064A; YEH; D; YEH
066E; DOTLESS BEH; D; BEH
066F; DOTLESS QAF; D; QAF
0671; HAMZAT WASL ON ALEF; R; ALEF
0672; WAVY HAMZA ON ALEF; R; ALEF
0673; WAVY HAMZA UNDER ALEF; R; ALEF
0674; HIGH HAMZA; U; No_Joining_Group
0675; HIGH HAMZA ALEF; R; ALEF
0676; HIGH HAMZA WAW; R; WAW
0677; HIGH HAMZA WAW WITH DAMMA; R; WAW
0678; HIGH HAMZA YEH; D; YEH
0679; TEH WITH SMALL TAH; D; BEH
067A; TEH WITH 2 DOTS VERTICAL ABOVE; D; BEH
067B; BEH WITH 2 DOTS VERTICAL BELOW; D; BEH
067C; TEH WITH RING; D; BEH
067D; TEH WITH 3 DOTS ABOVE DOWNWARD; D; BEH
067E; TEH WITH 3 DOTS BELOW; D; BEH
067F; TEH WITH 4 DOTS ABOVE; D; BEH
0680; BEH WITH 4 DOTS BELOW; D; BEH
0681; HAMZA ON HAH; D; HAH
0682; HAH WITH 2 DOTS VERTICAL ABOVE; D; HAH
0683; HAH WITH MIDDLE 2 DOTS; D; HAH
0684; HAH WITH MIDDLE 2 DOTS VERTICAL; D; HAH
0685; HAH WITH 3 DOTS ABOVE; D; HAH
0686; HAH WITH MIDDLE 3 DOTS DOWNWARD; D; HAH
0687; HAH WITH MIDDLE 4 DOTS; D; HAH
0688; DAL WITH SMALL TAH; R; DAL
0689; DAL WITH RING; R; DAL
068A; DAL WITH DOT BELOW; R; DAL
068B; DAL WITH DOT BELOW AND SMALL TAH; R; DAL
068C; DAL WITH 2 DOTS ABOVE; R; DAL
068D; DAL WITH 2 DOTS BELOW; R; DAL
068E; DAL WITH 3 DOTS ABOVE; R; DAL
068F; DAL WITH 3 DOTS ABOVE DOWNWARD; R; DAL
0690; DAL WITH 4 DOTS ABOVE; R; DAL
0691; REH WITH SMALL TAH; R; REH
0692; REH WITH SMALL V; R; REH
0693; REH WITH RING; R; REH
0694; REH WITH DOT BELOW; R; REH
0695; REH WITH SMALL V BELOW; R; REH
0696; REH WITH DOT BELOW AND DOT ABOVE; R; REH
0697; REH WITH 2 DOTS ABOVE; R; REH
0698; REH WITH 3 DOTS ABOVE; R; REH
0699; REH WITH 4 DOTS ABOVE; R; REH
069A; SEEN WITH DOT BELOW AND DOT ABOVE; D; SEEN
069B; SEEN WITH 3 DOTS BELOW; D; SEEN
069C; SEEN WITH 3 DOTS BELOW AND 3 DOTS ABOVE; D; SEEN
069D; SAD WITH 2 DOTS BELOW; D; SAD
069E; SAD WITH 3 DOTS ABOVE; D; SAD
069F; TAH WITH 3 DOTS ABOVE; D; TAH
06A0; AIN WITH 3 DOTS ABOVE; D; AIN
06A1; DOTLESS FEH; D; FEH
06A2; FEH WITH DOT MOVED BELOW; D; FEH
06A3; FEH WITH DOT BELOW; D; FEH
06A4; FEH WITH 3 DOTS ABOVE; D; FEH
06A5; FEH WITH 3 DOTS BELOW; D; FEH
06A6; FEH WITH 4 DOTS ABOVE; D; FEH
06A7; QAF WITH DOT ABOVE; D; QAF
06A8; QAF WITH 3 DOTS ABOVE; D; QAF
06A9; KEHEH; D; GAF
06AA; SWASH KAF; D; SWASH KAF
06AB; KAF WITH RING; D; GAF
06AC; KAF WITH DOT ABOVE; D; KAF
06AD; KAF WITH 3 DOTS ABOVE; D; KAF
06AE; KAF WITH 3 DOTS BELOW; D; KAF
06AF; GAF; D; GAF
06B0; GAF WITH RING; D; GAF
06B1; GAF WITH 2 DOTS ABOVE; D; GAF
06B2; GAF WITH 2 DOTS BELOW; D; GAF
06B3; GAF WITH 2 DOTS VERTICAL BELOW; D; GAF
06B4; GAF WITH 3 DOTS ABOVE; D; GAF
06B5; LAM WITH SMALL V; D; LAM
06B6; LAM WITH DOT ABOVE; D; LAM
06B7; LAM WITH 3 DOTS ABOVE; D; LAM
06B8; LAM WITH 3 DOTS BELOW; D; LAM
06B9; NOON WITH DOT BELOW; D; NOON
06BA; DOTLESS NOON; D; NOON
06BB; DOTLESS NOON WITH SMALL TAH; D; NOON
06BC; NOON WITH RING; D; NOON
06BD; NOON WITH 3 DOTS ABOVE; D; NOON
06BE; KNOTTED HEH; D; KNOTTED HEH
06BF; HAH WITH MIDDLE 3 DOTS DOWNWARD AND DOT ABOVE; D; HAH
06C0; HAMZA ON HEH; R; TEH MARBUTA
06C1; HEH GOAL; D; HEH GOAL
06C2; HAMZA ON HEH GOAL; D; HEH GOAL
06C3; TEH MARBUTA GOAL; R; HAMZA ON HEH GOAL
06C4; WAW WITH RING; R; WAW
06C5; WAW WITH BAR; R; WAW
06C6; WAW WITH SMALL V; R; WAW
06C7; WAW WITH DAMMA; R; WAW
06C8; WAW WITH ALEF ABOVE; R; WAW
06C9; WAW WITH INVERTED SMALL V; R; WAW
06CA; WAW WITH 2 DOTS ABOVE; R; WAW
06CB; WAW WITH 3 DOTS ABOVE; R; WAW
06CC; DOTLESS YEH; D; YEH
06CD; YEH WITH TAIL; R; YEH WITH TAIL
06CE; YEH WITH SMALL V; D; YEH
06CF; WAW WITH DOT ABOVE; R; WAW
06D0; YEH WITH 2 DOTS VERTICAL BELOW; D; YEH
06D1; YEH WITH 3 DOTS BELOW; D; YEH
06D2; YEH BARREE; R; YEH BARREE
06D3; HAMZA ON YEH BARREE; R; YEH BARREE
06D5; AE; R; TEH MARBUTA
06DD; ARABIC END OF AYAH; U; No_Joining_Group
06EE; DAL WITH INVERTED V; R; DAL
06EF; REH WITH INVERTED V; R; REH
06FA; SEEN WITH DOT BELOW AND 3 DOTS ABOVE; D; SEEN
06FB; DAD WITH DOT BELOW; D; SAD
06FC; GHAIN WITH DOT BELOW; D; AIN
06FF; HEH WITH INVERTED V; D; KNOTTED HEH
# Syriac characters
0710; ALAPH; R; ALAPH
0712; BETH; D; BETH
0713; GAMAL; D; GAMAL
0714; GAMAL GARSHUNI; D; GAMAL
0715; DALATH; R; DALATH RISH
0716; DOTLESS DALATH RISH; R; DALATH RISH
0717; HE; R; HE
0718; WAW; R; SYRIAC WAW
0719; ZAIN; R; ZAIN
071A; HETH; D; HETH
071B; TETH; D; TETH
071C; TETH GARSHUNI; D; TETH
071D; YUDH; D; YUDH
071E; YUDH HE; R; YUDH HE
071F; KAPH; D; KAPH
0720; LAMADH; D; LAMADH
0721; MIM; D; MIM
0722; NUN; D; NUN
0723; SEMKATH; D; SEMKATH
0724; FINAL SEMKATH; D; FINAL SEMKATH
0725; E; D; E
0726; PE; D; PE
0727; REVERSED PE; D; REVERSED PE
0728; SADHE; R; SADHE
0729; QAPH; D; QAPH
072A; RISH; R; DALATH RISH
072B; SHIN; D; SHIN
072C; TAW; R; TAW
072D; PERSIAN BHETH; D; BETH
072E; PERSIAN GHAMAL; D; GAMAL
072F; PERSIAN DHALATH; R; DALATH RISH
074D; SOGDIAN ZHAIN; R; ZHAIN
074E; SOGDIAN KHAPH; D; KHAPH
074F; SOGDIAN FE; D; FE
# Arabic supplement characters
0750; BEH WITH 3 DOTS HORIZONTALLY BELOW; D; BEH
0751; BEH WITH DOT BELOW AND 3 DOTS ABOVE; D; BEH
0752; BEH WITH 3 DOTS POINTING UPWARDS BELOW; D; BEH
0753; BEH WITH 3 DOTS POINTING UPWARDS BELOW AND 2 DOTS ABOVE; D; BEH
0754; BEH WITH 2 DOTS BELOW AND DOT ABOVE; D; BEH
0755; BEH WITH INVERTED SMALL V BELOW; D; BEH
0756; BEH WITH SMALL V; D; BEH
0757; HAH WITH 2 DOTS ABOVE; D; HAH
0758; HAH WITH 3 DOTS POINTING UPWARDS BELOW; D; HAH
0759; DAL WITH 2 DOTS VERTICALLY BELOW AND SMALL TAH; R; DAL
075A; DAL WITH INVERTED SMALL V BELOW; R; DAL
075B; REH WITH STROKE; R; REH
075C; SEEN WITH 4 DOTS ABOVE; D; SEEN
075D; AIN WITH 2 DOTS ABOVE; D; AIN
075E; AIN WITH 3 DOTS POINTING DOWNWARDS ABOVE; D; AIN
075F; AIN WITH 2 DOTS VERTICALLY ABOVE; D; AIN
0760; FEH WITH 2 DOTS BELOW; D; FEH
0761; FEH WITH 3 DOTS POINTING UPWARDS BELOW; D; FEH
0762; KEHEH WITH DOT ABOVE; D; GAF
0763; KEHEH WITH 3 DOTS ABOVE; D; GAF
0764; KEHEH WITH 3 DOTS POINTING UPWARDS BELOW; D; GAF
0765; MEEM WITH DOT ABOVE; D; MEEM
0766; MEEM WITH DOT BELOW; D; MEEM
0767; NOON WITH 2 DOTS BELOW; D; NOON
0768; NOON WITH SMALL TAH; D; NOON
0769; NOON WITH SMALL V; D; NOON
076A; LAM WITH BAR; D; LAM
076B; REH WITH 2 DOTS VERTICALLY ABOVE; R; REH
076C; REH WITH HAMZA ABOVE; R; REH
076D; SEEN WITH 2 DOTS VERTICALLY ABOVE; D; SEEN
# N'Ko Characters
07CA; NKO A; D; No_Joining_Group
07CB; NKO EE; D; No_Joining_Group
07CC; NKO I; D; No_Joining_Group
07CD; NKO E; D; No_Joining_Group
07CE; NKO U; D; No_Joining_Group
07CF; NKO OO; D; No_Joining_Group
07D0; NKO O; D; No_Joining_Group
07D1; NKO DAGBASINNA; D; No_Joining_Group
07D2; NKO N; D; No_Joining_Group
07D3; NKO BA; D; No_Joining_Group
07D4; NKO PA; D; No_Joining_Group
07D5; NKO TA; D; No_Joining_Group
07D6; NKO JA; D; No_Joining_Group
07D7; NKO CHA; D; No_Joining_Group
07D8; NKO DA; D; No_Joining_Group
07D9; NKO RA; D; No_Joining_Group
07DA; NKO RRA; D; No_Joining_Group
07DB; NKO SA; D; No_Joining_Group
07DC; NKO GBA; D; No_Joining_Group
07DD; NKO FA; D; No_Joining_Group
07DE; NKO KA; D; No_Joining_Group
07DF; NKO LA; D; No_Joining_Group
07E0; NKO NA WOLOSO; D; No_Joining_Group
07E1; NKO MA; D; No_Joining_Group
07E2; NKO NYA; D; No_Joining_Group
07E3; NKO NA; D; No_Joining_Group
07E4; NKO HA; D; No_Joining_Group
07E5; NKO WA; D; No_Joining_Group
07E6; NKO YA; D; No_Joining_Group
07E7; NKO NYA WOLOSO; D; No_Joining_Group
07E8; NKO JONA JA; D; No_Joining_Group
07E9; NKO JONA CHA; D; No_Joining_Group
07EA; NKO JONA RA; D; No_Joining_Group
07FA; NKO LAJANYALAN; C; No_Joining_Group
# Other
200D; ZERO WIDTH JOINER; C; No_Joining_Group
200C; ZERO WIDTH NON-JOINER; U; No_Joining_Group
# EOF

View File

@ -0,0 +1,582 @@
# BidiMirroring-5.0.0.txt
# Date: 2006-02-16, 16:11:00 PST [KW]
#
# Bidi_Mirroring_Glyph Property
#
# This file is an informative contributory data file in the
# Unicode Character Database.
#
# Copyright (c) 1991-2006 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
#
# This data file lists characters that have the mirrored property
# where there is another Unicode character that typically has a glyph
# that is the mirror image of the original character's glyph.
# The repertoire covered by the file is Unicode 5.0.0.
#
# The file contains a list of lines with mappings from one code point
# to another one for character-based mirroring.
# Note that for "real" mirroring, a rendering engine needs to select
# appropriate alternative glyphs, and that many Unicode characters do not
# have a mirror-image Unicode character.
#
# Each mapping line contains two fields, separated by a semicolon (';').
# Each of the two fields contains a code point represented as a
# variable-length hexadecimal value with 4 to 6 digits.
# A comment indicates where the characters are "BEST FIT" mirroring.
#
# Code points with the "mirrored" property but no appropriate mirrors are
# listed as comments at the end of the file.
#
# For information on bidi mirroring, see UAX #9: Bidirectional Algorithm,
# at http://www.unicode.org/unicode/reports/tr9/
#
# This file was originally created by Markus Scherer.
# Extended for Unicode 3.2, 4.0, 4.1, and 5.0 by Ken Whistler.
#
# ############################################################
0028; 0029 # LEFT PARENTHESIS
0029; 0028 # RIGHT PARENTHESIS
003C; 003E # LESS-THAN SIGN
003E; 003C # GREATER-THAN SIGN
005B; 005D # LEFT SQUARE BRACKET
005D; 005B # RIGHT SQUARE BRACKET
007B; 007D # LEFT CURLY BRACKET
007D; 007B # RIGHT CURLY BRACKET
00AB; 00BB # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
00BB; 00AB # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
0F3A; 0F3B # TIBETAN MARK GUG RTAGS GYON
0F3B; 0F3A # TIBETAN MARK GUG RTAGS GYAS
0F3C; 0F3D # TIBETAN MARK ANG KHANG GYON
0F3D; 0F3C # TIBETAN MARK ANG KHANG GYAS
169B; 169C # OGHAM FEATHER MARK
169C; 169B # OGHAM REVERSED FEATHER MARK
2018; 2019 # [BEST FIT] LEFT SINGLE QUOTATION MARK
2019; 2018 # [BEST FIT] RIGHT SINGLE QUOTATION MARK
201C; 201D # [BEST FIT] LEFT DOUBLE QUOTATION MARK
201D; 201C # [BEST FIT] RIGHT DOUBLE QUOTATION MARK
2039; 203A # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
203A; 2039 # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
2045; 2046 # LEFT SQUARE BRACKET WITH QUILL
2046; 2045 # RIGHT SQUARE BRACKET WITH QUILL
207D; 207E # SUPERSCRIPT LEFT PARENTHESIS
207E; 207D # SUPERSCRIPT RIGHT PARENTHESIS
208D; 208E # SUBSCRIPT LEFT PARENTHESIS
208E; 208D # SUBSCRIPT RIGHT PARENTHESIS
2208; 220B # ELEMENT OF
2209; 220C # NOT AN ELEMENT OF
220A; 220D # SMALL ELEMENT OF
220B; 2208 # CONTAINS AS MEMBER
220C; 2209 # DOES NOT CONTAIN AS MEMBER
220D; 220A # SMALL CONTAINS AS MEMBER
2215; 29F5 # DIVISION SLASH
223C; 223D # TILDE OPERATOR
223D; 223C # REVERSED TILDE
2243; 22CD # ASYMPTOTICALLY EQUAL TO
2252; 2253 # APPROXIMATELY EQUAL TO OR THE IMAGE OF
2253; 2252 # IMAGE OF OR APPROXIMATELY EQUAL TO
2254; 2255 # COLON EQUALS
2255; 2254 # EQUALS COLON
2264; 2265 # LESS-THAN OR EQUAL TO
2265; 2264 # GREATER-THAN OR EQUAL TO
2266; 2267 # LESS-THAN OVER EQUAL TO
2267; 2266 # GREATER-THAN OVER EQUAL TO
2268; 2269 # [BEST FIT] LESS-THAN BUT NOT EQUAL TO
2269; 2268 # [BEST FIT] GREATER-THAN BUT NOT EQUAL TO
226A; 226B # MUCH LESS-THAN
226B; 226A # MUCH GREATER-THAN
226E; 226F # [BEST FIT] NOT LESS-THAN
226F; 226E # [BEST FIT] NOT GREATER-THAN
2270; 2271 # [BEST FIT] NEITHER LESS-THAN NOR EQUAL TO
2271; 2270 # [BEST FIT] NEITHER GREATER-THAN NOR EQUAL TO
2272; 2273 # [BEST FIT] LESS-THAN OR EQUIVALENT TO
2273; 2272 # [BEST FIT] GREATER-THAN OR EQUIVALENT TO
2274; 2275 # [BEST FIT] NEITHER LESS-THAN NOR EQUIVALENT TO
2275; 2274 # [BEST FIT] NEITHER GREATER-THAN NOR EQUIVALENT TO
2276; 2277 # LESS-THAN OR GREATER-THAN
2277; 2276 # GREATER-THAN OR LESS-THAN
2278; 2279 # NEITHER LESS-THAN NOR GREATER-THAN
2279; 2278 # NEITHER GREATER-THAN NOR LESS-THAN
227A; 227B # PRECEDES
227B; 227A # SUCCEEDS
227C; 227D # PRECEDES OR EQUAL TO
227D; 227C # SUCCEEDS OR EQUAL TO
227E; 227F # [BEST FIT] PRECEDES OR EQUIVALENT TO
227F; 227E # [BEST FIT] SUCCEEDS OR EQUIVALENT TO
2280; 2281 # [BEST FIT] DOES NOT PRECEDE
2281; 2280 # [BEST FIT] DOES NOT SUCCEED
2282; 2283 # SUBSET OF
2283; 2282 # SUPERSET OF
2284; 2285 # [BEST FIT] NOT A SUBSET OF
2285; 2284 # [BEST FIT] NOT A SUPERSET OF
2286; 2287 # SUBSET OF OR EQUAL TO
2287; 2286 # SUPERSET OF OR EQUAL TO
2288; 2289 # [BEST FIT] NEITHER A SUBSET OF NOR EQUAL TO
2289; 2288 # [BEST FIT] NEITHER A SUPERSET OF NOR EQUAL TO
228A; 228B # [BEST FIT] SUBSET OF WITH NOT EQUAL TO
228B; 228A # [BEST FIT] SUPERSET OF WITH NOT EQUAL TO
228F; 2290 # SQUARE IMAGE OF
2290; 228F # SQUARE ORIGINAL OF
2291; 2292 # SQUARE IMAGE OF OR EQUAL TO
2292; 2291 # SQUARE ORIGINAL OF OR EQUAL TO
2298; 29B8 # CIRCLED DIVISION SLASH
22A2; 22A3 # RIGHT TACK
22A3; 22A2 # LEFT TACK
22A6; 2ADE # ASSERTION
22A8; 2AE4 # TRUE
22A9; 2AE3 # FORCES
22AB; 2AE5 # DOUBLE VERTICAL BAR DOUBLE RIGHT TURNSTILE
22B0; 22B1 # PRECEDES UNDER RELATION
22B1; 22B0 # SUCCEEDS UNDER RELATION
22B2; 22B3 # NORMAL SUBGROUP OF
22B3; 22B2 # CONTAINS AS NORMAL SUBGROUP
22B4; 22B5 # NORMAL SUBGROUP OF OR EQUAL TO
22B5; 22B4 # CONTAINS AS NORMAL SUBGROUP OR EQUAL TO
22B6; 22B7 # ORIGINAL OF
22B7; 22B6 # IMAGE OF
22C9; 22CA # LEFT NORMAL FACTOR SEMIDIRECT PRODUCT
22CA; 22C9 # RIGHT NORMAL FACTOR SEMIDIRECT PRODUCT
22CB; 22CC # LEFT SEMIDIRECT PRODUCT
22CC; 22CB # RIGHT SEMIDIRECT PRODUCT
22CD; 2243 # REVERSED TILDE EQUALS
22D0; 22D1 # DOUBLE SUBSET
22D1; 22D0 # DOUBLE SUPERSET
22D6; 22D7 # LESS-THAN WITH DOT
22D7; 22D6 # GREATER-THAN WITH DOT
22D8; 22D9 # VERY MUCH LESS-THAN
22D9; 22D8 # VERY MUCH GREATER-THAN
22DA; 22DB # LESS-THAN EQUAL TO OR GREATER-THAN
22DB; 22DA # GREATER-THAN EQUAL TO OR LESS-THAN
22DC; 22DD # EQUAL TO OR LESS-THAN
22DD; 22DC # EQUAL TO OR GREATER-THAN
22DE; 22DF # EQUAL TO OR PRECEDES
22DF; 22DE # EQUAL TO OR SUCCEEDS
22E0; 22E1 # [BEST FIT] DOES NOT PRECEDE OR EQUAL
22E1; 22E0 # [BEST FIT] DOES NOT SUCCEED OR EQUAL
22E2; 22E3 # [BEST FIT] NOT SQUARE IMAGE OF OR EQUAL TO
22E3; 22E2 # [BEST FIT] NOT SQUARE ORIGINAL OF OR EQUAL TO
22E4; 22E5 # [BEST FIT] SQUARE IMAGE OF OR NOT EQUAL TO
22E5; 22E4 # [BEST FIT] SQUARE ORIGINAL OF OR NOT EQUAL TO
22E6; 22E7 # [BEST FIT] LESS-THAN BUT NOT EQUIVALENT TO
22E7; 22E6 # [BEST FIT] GREATER-THAN BUT NOT EQUIVALENT TO
22E8; 22E9 # [BEST FIT] PRECEDES BUT NOT EQUIVALENT TO
22E9; 22E8 # [BEST FIT] SUCCEEDS BUT NOT EQUIVALENT TO
22EA; 22EB # [BEST FIT] NOT NORMAL SUBGROUP OF
22EB; 22EA # [BEST FIT] DOES NOT CONTAIN AS NORMAL SUBGROUP
22EC; 22ED # [BEST FIT] NOT NORMAL SUBGROUP OF OR EQUAL TO
22ED; 22EC # [BEST FIT] DOES NOT CONTAIN AS NORMAL SUBGROUP OR EQUAL
22F0; 22F1 # UP RIGHT DIAGONAL ELLIPSIS
22F1; 22F0 # DOWN RIGHT DIAGONAL ELLIPSIS
22F2; 22FA # ELEMENT OF WITH LONG HORIZONTAL STROKE
22F3; 22FB # ELEMENT OF WITH VERTICAL BAR AT END OF HORIZONTAL STROKE
22F4; 22FC # SMALL ELEMENT OF WITH VERTICAL BAR AT END OF HORIZONTAL STROKE
22F6; 22FD # ELEMENT OF WITH OVERBAR
22F7; 22FE # SMALL ELEMENT OF WITH OVERBAR
22FA; 22F2 # CONTAINS WITH LONG HORIZONTAL STROKE
22FB; 22F3 # CONTAINS WITH VERTICAL BAR AT END OF HORIZONTAL STROKE
22FC; 22F4 # SMALL CONTAINS WITH VERTICAL BAR AT END OF HORIZONTAL STROKE
22FD; 22F6 # CONTAINS WITH OVERBAR
22FE; 22F7 # SMALL CONTAINS WITH OVERBAR
2308; 2309 # LEFT CEILING
2309; 2308 # RIGHT CEILING
230A; 230B # LEFT FLOOR
230B; 230A # RIGHT FLOOR
2329; 232A # LEFT-POINTING ANGLE BRACKET
232A; 2329 # RIGHT-POINTING ANGLE BRACKET
2768; 2769 # MEDIUM LEFT PARENTHESIS ORNAMENT
2769; 2768 # MEDIUM RIGHT PARENTHESIS ORNAMENT
276A; 276B # MEDIUM FLATTENED LEFT PARENTHESIS ORNAMENT
276B; 276A # MEDIUM FLATTENED RIGHT PARENTHESIS ORNAMENT
276C; 276D # MEDIUM LEFT-POINTING ANGLE BRACKET ORNAMENT
276D; 276C # MEDIUM RIGHT-POINTING ANGLE BRACKET ORNAMENT
276E; 276F # HEAVY LEFT-POINTING ANGLE QUOTATION MARK ORNAMENT
276F; 276E # HEAVY RIGHT-POINTING ANGLE QUOTATION MARK ORNAMENT
2770; 2771 # HEAVY LEFT-POINTING ANGLE BRACKET ORNAMENT
2771; 2770 # HEAVY RIGHT-POINTING ANGLE BRACKET ORNAMENT
2772; 2773 # LIGHT LEFT TORTOISE SHELL BRACKET
2773; 2772 # LIGHT RIGHT TORTOISE SHELL BRACKET
2774; 2775 # MEDIUM LEFT CURLY BRACKET ORNAMENT
2775; 2774 # MEDIUM RIGHT CURLY BRACKET ORNAMENT
27C3; 27C4 # OPEN SUBSET
27C4; 27C3 # OPEN SUPERSET
27C5; 27C6 # LEFT S-SHAPED BAG DELIMITER
27C6; 27C5 # RIGHT S-SHAPED BAG DELIMITER
27D5; 27D6 # LEFT OUTER JOIN
27D6; 27D5 # RIGHT OUTER JOIN
27DD; 27DE # LONG RIGHT TACK
27DE; 27DD # LONG LEFT TACK
27E2; 27E3 # WHITE CONCAVE-SIDED DIAMOND WITH LEFTWARDS TICK
27E3; 27E2 # WHITE CONCAVE-SIDED DIAMOND WITH RIGHTWARDS TICK
27E4; 27E5 # WHITE SQUARE WITH LEFTWARDS TICK
27E5; 27E4 # WHITE SQUARE WITH RIGHTWARDS TICK
27E6; 27E7 # MATHEMATICAL LEFT WHITE SQUARE BRACKET
27E7; 27E6 # MATHEMATICAL RIGHT WHITE SQUARE BRACKET
27E8; 27E9 # MATHEMATICAL LEFT ANGLE BRACKET
27E9; 27E8 # MATHEMATICAL RIGHT ANGLE BRACKET
27EA; 27EB # MATHEMATICAL LEFT DOUBLE ANGLE BRACKET
27EB; 27EA # MATHEMATICAL RIGHT DOUBLE ANGLE BRACKET
2983; 2984 # LEFT WHITE CURLY BRACKET
2984; 2983 # RIGHT WHITE CURLY BRACKET
2985; 2986 # LEFT WHITE PARENTHESIS
2986; 2985 # RIGHT WHITE PARENTHESIS
2987; 2988 # Z NOTATION LEFT IMAGE BRACKET
2988; 2987 # Z NOTATION RIGHT IMAGE BRACKET
2989; 298A # Z NOTATION LEFT BINDING BRACKET
298A; 2989 # Z NOTATION RIGHT BINDING BRACKET
298B; 298C # LEFT SQUARE BRACKET WITH UNDERBAR
298C; 298B # RIGHT SQUARE BRACKET WITH UNDERBAR
298D; 2990 # LEFT SQUARE BRACKET WITH TICK IN TOP CORNER
298E; 298F # RIGHT SQUARE BRACKET WITH TICK IN BOTTOM CORNER
298F; 298E # LEFT SQUARE BRACKET WITH TICK IN BOTTOM CORNER
2990; 298D # RIGHT SQUARE BRACKET WITH TICK IN TOP CORNER
2991; 2992 # LEFT ANGLE BRACKET WITH DOT
2992; 2991 # RIGHT ANGLE BRACKET WITH DOT
2993; 2994 # LEFT ARC LESS-THAN BRACKET
2994; 2993 # RIGHT ARC GREATER-THAN BRACKET
2995; 2996 # DOUBLE LEFT ARC GREATER-THAN BRACKET
2996; 2995 # DOUBLE RIGHT ARC LESS-THAN BRACKET
2997; 2998 # LEFT BLACK TORTOISE SHELL BRACKET
2998; 2997 # RIGHT BLACK TORTOISE SHELL BRACKET
29B8; 2298 # CIRCLED REVERSE SOLIDUS
29C0; 29C1 # CIRCLED LESS-THAN
29C1; 29C0 # CIRCLED GREATER-THAN
29C4; 29C5 # SQUARED RISING DIAGONAL SLASH
29C5; 29C4 # SQUARED FALLING DIAGONAL SLASH
29CF; 29D0 # LEFT TRIANGLE BESIDE VERTICAL BAR
29D0; 29CF # VERTICAL BAR BESIDE RIGHT TRIANGLE
29D1; 29D2 # BOWTIE WITH LEFT HALF BLACK
29D2; 29D1 # BOWTIE WITH RIGHT HALF BLACK
29D4; 29D5 # TIMES WITH LEFT HALF BLACK
29D5; 29D4 # TIMES WITH RIGHT HALF BLACK
29D8; 29D9 # LEFT WIGGLY FENCE
29D9; 29D8 # RIGHT WIGGLY FENCE
29DA; 29DB # LEFT DOUBLE WIGGLY FENCE
29DB; 29DA # RIGHT DOUBLE WIGGLY FENCE
29F5; 2215 # REVERSE SOLIDUS OPERATOR
29F8; 29F9 # BIG SOLIDUS
29F9; 29F8 # BIG REVERSE SOLIDUS
29FC; 29FD # LEFT-POINTING CURVED ANGLE BRACKET
29FD; 29FC # RIGHT-POINTING CURVED ANGLE BRACKET
2A2B; 2A2C # MINUS SIGN WITH FALLING DOTS
2A2C; 2A2B # MINUS SIGN WITH RISING DOTS
2A2D; 2A2E # PLUS SIGN IN LEFT HALF CIRCLE
2A2E; 2A2D # PLUS SIGN IN RIGHT HALF CIRCLE
2A34; 2A35 # MULTIPLICATION SIGN IN LEFT HALF CIRCLE
2A35; 2A34 # MULTIPLICATION SIGN IN RIGHT HALF CIRCLE
2A3C; 2A3D # INTERIOR PRODUCT
2A3D; 2A3C # RIGHTHAND INTERIOR PRODUCT
2A64; 2A65 # Z NOTATION DOMAIN ANTIRESTRICTION
2A65; 2A64 # Z NOTATION RANGE ANTIRESTRICTION
2A79; 2A7A # LESS-THAN WITH CIRCLE INSIDE
2A7A; 2A79 # GREATER-THAN WITH CIRCLE INSIDE
2A7D; 2A7E # LESS-THAN OR SLANTED EQUAL TO
2A7E; 2A7D # GREATER-THAN OR SLANTED EQUAL TO
2A7F; 2A80 # LESS-THAN OR SLANTED EQUAL TO WITH DOT INSIDE
2A80; 2A7F # GREATER-THAN OR SLANTED EQUAL TO WITH DOT INSIDE
2A81; 2A82 # LESS-THAN OR SLANTED EQUAL TO WITH DOT ABOVE
2A82; 2A81 # GREATER-THAN OR SLANTED EQUAL TO WITH DOT ABOVE
2A83; 2A84 # LESS-THAN OR SLANTED EQUAL TO WITH DOT ABOVE RIGHT
2A84; 2A83 # GREATER-THAN OR SLANTED EQUAL TO WITH DOT ABOVE LEFT
2A8B; 2A8C # LESS-THAN ABOVE DOUBLE-LINE EQUAL ABOVE GREATER-THAN
2A8C; 2A8B # GREATER-THAN ABOVE DOUBLE-LINE EQUAL ABOVE LESS-THAN
2A91; 2A92 # LESS-THAN ABOVE GREATER-THAN ABOVE DOUBLE-LINE EQUAL
2A92; 2A91 # GREATER-THAN ABOVE LESS-THAN ABOVE DOUBLE-LINE EQUAL
2A93; 2A94 # LESS-THAN ABOVE SLANTED EQUAL ABOVE GREATER-THAN ABOVE SLANTED EQUAL
2A94; 2A93 # GREATER-THAN ABOVE SLANTED EQUAL ABOVE LESS-THAN ABOVE SLANTED EQUAL
2A95; 2A96 # SLANTED EQUAL TO OR LESS-THAN
2A96; 2A95 # SLANTED EQUAL TO OR GREATER-THAN
2A97; 2A98 # SLANTED EQUAL TO OR LESS-THAN WITH DOT INSIDE
2A98; 2A97 # SLANTED EQUAL TO OR GREATER-THAN WITH DOT INSIDE
2A99; 2A9A # DOUBLE-LINE EQUAL TO OR LESS-THAN
2A9A; 2A99 # DOUBLE-LINE EQUAL TO OR GREATER-THAN
2A9B; 2A9C # DOUBLE-LINE SLANTED EQUAL TO OR LESS-THAN
2A9C; 2A9B # DOUBLE-LINE SLANTED EQUAL TO OR GREATER-THAN
2AA1; 2AA2 # DOUBLE NESTED LESS-THAN
2AA2; 2AA1 # DOUBLE NESTED GREATER-THAN
2AA6; 2AA7 # LESS-THAN CLOSED BY CURVE
2AA7; 2AA6 # GREATER-THAN CLOSED BY CURVE
2AA8; 2AA9 # LESS-THAN CLOSED BY CURVE ABOVE SLANTED EQUAL
2AA9; 2AA8 # GREATER-THAN CLOSED BY CURVE ABOVE SLANTED EQUAL
2AAA; 2AAB # SMALLER THAN
2AAB; 2AAA # LARGER THAN
2AAC; 2AAD # SMALLER THAN OR EQUAL TO
2AAD; 2AAC # LARGER THAN OR EQUAL TO
2AAF; 2AB0 # PRECEDES ABOVE SINGLE-LINE EQUALS SIGN
2AB0; 2AAF # SUCCEEDS ABOVE SINGLE-LINE EQUALS SIGN
2AB3; 2AB4 # PRECEDES ABOVE EQUALS SIGN
2AB4; 2AB3 # SUCCEEDS ABOVE EQUALS SIGN
2ABB; 2ABC # DOUBLE PRECEDES
2ABC; 2ABB # DOUBLE SUCCEEDS
2ABD; 2ABE # SUBSET WITH DOT
2ABE; 2ABD # SUPERSET WITH DOT
2ABF; 2AC0 # SUBSET WITH PLUS SIGN BELOW
2AC0; 2ABF # SUPERSET WITH PLUS SIGN BELOW
2AC1; 2AC2 # SUBSET WITH MULTIPLICATION SIGN BELOW
2AC2; 2AC1 # SUPERSET WITH MULTIPLICATION SIGN BELOW
2AC3; 2AC4 # SUBSET OF OR EQUAL TO WITH DOT ABOVE
2AC4; 2AC3 # SUPERSET OF OR EQUAL TO WITH DOT ABOVE
2AC5; 2AC6 # SUBSET OF ABOVE EQUALS SIGN
2AC6; 2AC5 # SUPERSET OF ABOVE EQUALS SIGN
2ACD; 2ACE # SQUARE LEFT OPEN BOX OPERATOR
2ACE; 2ACD # SQUARE RIGHT OPEN BOX OPERATOR
2ACF; 2AD0 # CLOSED SUBSET
2AD0; 2ACF # CLOSED SUPERSET
2AD1; 2AD2 # CLOSED SUBSET OR EQUAL TO
2AD2; 2AD1 # CLOSED SUPERSET OR EQUAL TO
2AD3; 2AD4 # SUBSET ABOVE SUPERSET
2AD4; 2AD3 # SUPERSET ABOVE SUBSET
2AD5; 2AD6 # SUBSET ABOVE SUBSET
2AD6; 2AD5 # SUPERSET ABOVE SUPERSET
2ADE; 22A6 # SHORT LEFT TACK
2AE3; 22A9 # DOUBLE VERTICAL BAR LEFT TURNSTILE
2AE4; 22A8 # VERTICAL BAR DOUBLE LEFT TURNSTILE
2AE5; 22AB # DOUBLE VERTICAL BAR DOUBLE LEFT TURNSTILE
2AEC; 2AED # DOUBLE STROKE NOT SIGN
2AED; 2AEC # REVERSED DOUBLE STROKE NOT SIGN
2AF7; 2AF8 # TRIPLE NESTED LESS-THAN
2AF8; 2AF7 # TRIPLE NESTED GREATER-THAN
2AF9; 2AFA # DOUBLE-LINE SLANTED LESS-THAN OR EQUAL TO
2AFA; 2AF9 # DOUBLE-LINE SLANTED GREATER-THAN OR EQUAL TO
2E02; 2E03 # LEFT SUBSTITUTION BRACKET
2E03; 2E02 # RIGHT SUBSTITUTION BRACKET
2E04; 2E05 # LEFT DOTTED SUBSTITUTION BRACKET
2E05; 2E04 # RIGHT DOTTED SUBSTITUTION BRACKET
2E09; 2E0A # LEFT TRANSPOSITION BRACKET
2E0A; 2E09 # RIGHT TRANSPOSITION BRACKET
2E0C; 2E0D # LEFT RAISED OMISSION BRACKET
2E0D; 2E0C # RIGHT RAISED OMISSION BRACKET
2E1C; 2E1D # LEFT LOW PARAPHRASE BRACKET
2E1D; 2E1C # RIGHT LOW PARAPHRASE BRACKET
3008; 3009 # LEFT ANGLE BRACKET
3009; 3008 # RIGHT ANGLE BRACKET
300A; 300B # LEFT DOUBLE ANGLE BRACKET
300B; 300A # RIGHT DOUBLE ANGLE BRACKET
300C; 300D # [BEST FIT] LEFT CORNER BRACKET
300D; 300C # [BEST FIT] RIGHT CORNER BRACKET
300E; 300F # [BEST FIT] LEFT WHITE CORNER BRACKET
300F; 300E # [BEST FIT] RIGHT WHITE CORNER BRACKET
3010; 3011 # LEFT BLACK LENTICULAR BRACKET
3011; 3010 # RIGHT BLACK LENTICULAR BRACKET
3014; 3015 # LEFT TORTOISE SHELL BRACKET
3015; 3014 # RIGHT TORTOISE SHELL BRACKET
3016; 3017 # LEFT WHITE LENTICULAR BRACKET
3017; 3016 # RIGHT WHITE LENTICULAR BRACKET
3018; 3019 # LEFT WHITE TORTOISE SHELL BRACKET
3019; 3018 # RIGHT WHITE TORTOISE SHELL BRACKET
301A; 301B # LEFT WHITE SQUARE BRACKET
301B; 301A # RIGHT WHITE SQUARE BRACKET
301D; 301E # REVERSED DOUBLE PRIME QUOTATION MARK
301E; 301D # DOUBLE PRIME QUOTATION MARK
FE59; FE5A # SMALL LEFT PARENTHESIS
FE5A; FE59 # SMALL RIGHT PARENTHESIS
FE5B; FE5C # SMALL LEFT CURLY BRACKET
FE5C; FE5B # SMALL RIGHT CURLY BRACKET
FE5D; FE5E # SMALL LEFT TORTOISE SHELL BRACKET
FE5E; FE5D # SMALL RIGHT TORTOISE SHELL BRACKET
FE64; FE65 # SMALL LESS-THAN SIGN
FE65; FE64 # SMALL GREATER-THAN SIGN
FF08; FF09 # FULLWIDTH LEFT PARENTHESIS
FF09; FF08 # FULLWIDTH RIGHT PARENTHESIS
FF1C; FF1E # FULLWIDTH LESS-THAN SIGN
FF1E; FF1C # FULLWIDTH GREATER-THAN SIGN
FF3B; FF3D # FULLWIDTH LEFT SQUARE BRACKET
FF3D; FF3B # FULLWIDTH RIGHT SQUARE BRACKET
FF5B; FF5D # FULLWIDTH LEFT CURLY BRACKET
FF5D; FF5B # FULLWIDTH RIGHT CURLY BRACKET
FF5F; FF60 # FULLWIDTH LEFT WHITE PARENTHESIS
FF60; FF5F # FULLWIDTH RIGHT WHITE PARENTHESIS
FF62; FF63 # [BEST FIT] HALFWIDTH LEFT CORNER BRACKET
FF63; FF62 # [BEST FIT] HALFWIDTH RIGHT CORNER BRACKET
# The following characters have no appropriate mirroring character.
# For these characters it is up to the rendering system
# to provide mirrored glyphs.
# 201A; SINGLE LOW-9 QUOTATION MARK
# 201B; SINGLE HIGH-REVERSED-9 QUOTATION MARK
# 201E; DOUBLE LOW-9 QUOTATION MARK
# 201F; DOUBLE HIGH-REVERSED-9 QUOTATION MARK
# 2140; DOUBLE-STRUCK N-ARY SUMMATION
# 2201; COMPLEMENT
# 2202; PARTIAL DIFFERENTIAL
# 2203; THERE EXISTS
# 2204; THERE DOES NOT EXIST
# 2211; N-ARY SUMMATION
# 2216; SET MINUS
# 221A; SQUARE ROOT
# 221B; CUBE ROOT
# 221C; FOURTH ROOT
# 221D; PROPORTIONAL TO
# 221F; RIGHT ANGLE
# 2220; ANGLE
# 2221; MEASURED ANGLE
# 2222; SPHERICAL ANGLE
# 2224; DOES NOT DIVIDE
# 2226; NOT PARALLEL TO
# 222B; INTEGRAL
# 222C; DOUBLE INTEGRAL
# 222D; TRIPLE INTEGRAL
# 222E; CONTOUR INTEGRAL
# 222F; SURFACE INTEGRAL
# 2230; VOLUME INTEGRAL
# 2231; CLOCKWISE INTEGRAL
# 2232; CLOCKWISE CONTOUR INTEGRAL
# 2233; ANTICLOCKWISE CONTOUR INTEGRAL
# 2239; EXCESS
# 223B; HOMOTHETIC
# 223E; INVERTED LAZY S
# 223F; SINE WAVE
# 2240; WREATH PRODUCT
# 2241; NOT TILDE
# 2242; MINUS TILDE
# 2244; NOT ASYMPTOTICALLY EQUAL TO
# 2245; APPROXIMATELY EQUAL TO
# 2246; APPROXIMATELY BUT NOT ACTUALLY EQUAL TO
# 2247; NEITHER APPROXIMATELY NOR ACTUALLY EQUAL TO
# 2248; ALMOST EQUAL TO
# 2249; NOT ALMOST EQUAL TO
# 224A; ALMOST EQUAL OR EQUAL TO
# 224B; TRIPLE TILDE
# 224C; ALL EQUAL TO
# 225F; QUESTIONED EQUAL TO
# 2260; NOT EQUAL TO
# 2262; NOT IDENTICAL TO
# 228C; MULTISET
# 22A7; MODELS
# 22AA; TRIPLE VERTICAL BAR RIGHT TURNSTILE
# 22AC; DOES NOT PROVE
# 22AD; NOT TRUE
# 22AE; DOES NOT FORCE
# 22AF; NEGATED DOUBLE VERTICAL BAR DOUBLE RIGHT TURNSTILE
# 22B8; MULTIMAP
# 22BE; RIGHT ANGLE WITH ARC
# 22BF; RIGHT TRIANGLE
# 22F5; ELEMENT OF WITH DOT ABOVE
# 22F8; ELEMENT OF WITH UNDERBAR
# 22F9; ELEMENT OF WITH TWO HORIZONTAL STROKES
# 22FF; Z NOTATION BAG MEMBERSHIP
# 2320; TOP HALF INTEGRAL
# 2321; BOTTOM HALF INTEGRAL
# 27C0; THREE DIMENSIONAL ANGLE
# 27D3; LOWER RIGHT CORNER WITH DOT
# 27D4; UPPER LEFT CORNER WITH DOT
# 27DC; LEFT MULTIMAP
# 299B; MEASURED ANGLE OPENING LEFT
# 299C; RIGHT ANGLE VARIANT WITH SQUARE
# 299D; MEASURED RIGHT ANGLE WITH DOT
# 299E; ANGLE WITH S INSIDE
# 299F; ACUTE ANGLE
# 29A0; SPHERICAL ANGLE OPENING LEFT
# 29A1; SPHERICAL ANGLE OPENING UP
# 29A2; TURNED ANGLE
# 29A3; REVERSED ANGLE
# 29A4; ANGLE WITH UNDERBAR
# 29A5; REVERSED ANGLE WITH UNDERBAR
# 29A6; OBLIQUE ANGLE OPENING UP
# 29A7; OBLIQUE ANGLE OPENING DOWN
# 29A8; MEASURED ANGLE WITH OPEN ARM ENDING IN ARROW POINTING UP AND RIGHT
# 29A9; MEASURED ANGLE WITH OPEN ARM ENDING IN ARROW POINTING UP AND LEFT
# 29AA; MEASURED ANGLE WITH OPEN ARM ENDING IN ARROW POINTING DOWN AND RIGHT
# 29AB; MEASURED ANGLE WITH OPEN ARM ENDING IN ARROW POINTING DOWN AND LEFT
# 29AC; MEASURED ANGLE WITH OPEN ARM ENDING IN ARROW POINTING RIGHT AND UP
# 29AD; MEASURED ANGLE WITH OPEN ARM ENDING IN ARROW POINTING LEFT AND UP
# 29AE; MEASURED ANGLE WITH OPEN ARM ENDING IN ARROW POINTING RIGHT AND DOWN
# 29AF; MEASURED ANGLE WITH OPEN ARM ENDING IN ARROW POINTING LEFT AND DOWN
# 29C2; CIRCLE WITH SMALL CIRCLE TO THE RIGHT
# 29C3; CIRCLE WITH TWO HORIZONTAL STROKES TO THE RIGHT
# 29C9; TWO JOINED SQUARES
# 29CE; RIGHT TRIANGLE ABOVE LEFT TRIANGLE
# 29DC; INCOMPLETE INFINITY
# 29E1; INCREASES AS
# 29E3; EQUALS SIGN AND SLANTED PARALLEL
# 29E4; EQUALS SIGN AND SLANTED PARALLEL WITH TILDE ABOVE
# 29E5; IDENTICAL TO AND SLANTED PARALLEL
# 29E8; DOWN-POINTING TRIANGLE WITH LEFT HALF BLACK
# 29E9; DOWN-POINTING TRIANGLE WITH RIGHT HALF BLACK
# 29F4; RULE-DELAYED
# 29F6; SOLIDUS WITH OVERBAR
# 29F7; REVERSE SOLIDUS WITH HORIZONTAL STROKE
# 2A0A; MODULO TWO SUM
# 2A0B; SUMMATION WITH INTEGRAL
# 2A0C; QUADRUPLE INTEGRAL OPERATOR
# 2A0D; FINITE PART INTEGRAL
# 2A0E; INTEGRAL WITH DOUBLE STROKE
# 2A0F; INTEGRAL AVERAGE WITH SLASH
# 2A10; CIRCULATION FUNCTION
# 2A11; ANTICLOCKWISE INTEGRATION
# 2A12; LINE INTEGRATION WITH RECTANGULAR PATH AROUND POLE
# 2A13; LINE INTEGRATION WITH SEMICIRCULAR PATH AROUND POLE
# 2A14; LINE INTEGRATION NOT INCLUDING THE POLE
# 2A15; INTEGRAL AROUND A POINT OPERATOR
# 2A16; QUATERNION INTEGRAL OPERATOR
# 2A17; INTEGRAL WITH LEFTWARDS ARROW WITH HOOK
# 2A18; INTEGRAL WITH TIMES SIGN
# 2A19; INTEGRAL WITH INTERSECTION
# 2A1A; INTEGRAL WITH UNION
# 2A1B; INTEGRAL WITH OVERBAR
# 2A1C; INTEGRAL WITH UNDERBAR
# 2A1E; LARGE LEFT TRIANGLE OPERATOR
# 2A1F; Z NOTATION SCHEMA COMPOSITION
# 2A20; Z NOTATION SCHEMA PIPING
# 2A21; Z NOTATION SCHEMA PROJECTION
# 2A24; PLUS SIGN WITH TILDE ABOVE
# 2A26; PLUS SIGN WITH TILDE BELOW
# 2A29; MINUS SIGN WITH COMMA ABOVE
# 2A3E; Z NOTATION RELATIONAL COMPOSITION
# 2A57; SLOPING LARGE OR
# 2A58; SLOPING LARGE AND
# 2A6A; TILDE OPERATOR WITH DOT ABOVE
# 2A6B; TILDE OPERATOR WITH RISING DOTS
# 2A6C; SIMILAR MINUS SIMILAR
# 2A6D; CONGRUENT WITH DOT ABOVE
# 2A6F; ALMOST EQUAL TO WITH CIRCUMFLEX ACCENT
# 2A70; APPROXIMATELY EQUAL OR EQUAL TO
# 2A73; EQUALS SIGN ABOVE TILDE OPERATOR
# 2A74; DOUBLE COLON EQUAL
# 2A7B; LESS-THAN WITH QUESTION MARK ABOVE
# 2A7C; GREATER-THAN WITH QUESTION MARK ABOVE
# 2A85; LESS-THAN OR APPROXIMATE
# 2A86; GREATER-THAN OR APPROXIMATE
# 2A87; LESS-THAN AND SINGLE-LINE NOT EQUAL TO
# 2A88; GREATER-THAN AND SINGLE-LINE NOT EQUAL TO
# 2A89; LESS-THAN AND NOT APPROXIMATE
# 2A8A; GREATER-THAN AND NOT APPROXIMATE
# 2A8D; LESS-THAN ABOVE SIMILAR OR EQUAL
# 2A8E; GREATER-THAN ABOVE SIMILAR OR EQUAL
# 2A8F; LESS-THAN ABOVE SIMILAR ABOVE GREATER-THAN
# 2A90; GREATER-THAN ABOVE SIMILAR ABOVE LESS-THAN
# 2A9D; SIMILAR OR LESS-THAN
# 2A9E; SIMILAR OR GREATER-THAN
# 2A9F; SIMILAR ABOVE LESS-THAN ABOVE EQUALS SIGN
# 2AA0; SIMILAR ABOVE GREATER-THAN ABOVE EQUALS SIGN
# 2AA3; DOUBLE NESTED LESS-THAN WITH UNDERBAR
# 2AB1; PRECEDES ABOVE SINGLE-LINE NOT EQUAL TO
# 2AB2; SUCCEEDS ABOVE SINGLE-LINE NOT EQUAL TO
# 2AB5; PRECEDES ABOVE NOT EQUAL TO
# 2AB6; SUCCEEDS ABOVE NOT EQUAL TO
# 2AB7; PRECEDES ABOVE ALMOST EQUAL TO
# 2AB8; SUCCEEDS ABOVE ALMOST EQUAL TO
# 2AB9; PRECEDES ABOVE NOT ALMOST EQUAL TO
# 2ABA; SUCCEEDS ABOVE NOT ALMOST EQUAL TO
# 2AC7; SUBSET OF ABOVE TILDE OPERATOR
# 2AC8; SUPERSET OF ABOVE TILDE OPERATOR
# 2AC9; SUBSET OF ABOVE ALMOST EQUAL TO
# 2ACA; SUPERSET OF ABOVE ALMOST EQUAL TO
# 2ACB; SUBSET OF ABOVE NOT EQUAL TO
# 2ACC; SUPERSET OF ABOVE NOT EQUAL TO
# 2ADC; FORKING
# 2AE2; VERTICAL BAR TRIPLE RIGHT TURNSTILE
# 2AE6; LONG DASH FROM LEFT MEMBER OF DOUBLE VERTICAL
# 2AEE; DOES NOT DIVIDE WITH REVERSED NEGATION SLASH
# 2AF3; PARALLEL WITH TILDE OPERATOR
# 2AFB; TRIPLE SOLIDUS BINARY RELATION
# 2AFD; DOUBLE SOLIDUS OPERATOR
# 301F; LOW DOUBLE PRIME QUOTATION MARK
# 1D6DB; MATHEMATICAL BOLD PARTIAL DIFFERENTIAL
# 1D715; MATHEMATICAL ITALIC PARTIAL DIFFERENTIAL
# 1D74F; MATHEMATICAL BOLD ITALIC PARTIAL DIFFERENTIAL
# 1D789; MATHEMATICAL SANS-SERIF BOLD PARTIAL DIFFERENTIAL
# 1D7C3; MATHEMATICAL SANS-SERIF BOLD ITALIC PARTIAL DIFFERENTIAL
# EOF

View File

@ -0,0 +1,185 @@
# Blocks-5.0.0.txt
# Date: 2006-02-15, 15:40:00 [KW]
#
# Unicode Character Database
# Copyright (c) 1991-2006 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
# For documentation, see UCD.html
#
# Note: The casing of block names is not normative.
# For example, "Basic Latin" and "BASIC LATIN" are equivalent.
#
# Format:
# Start Code..End Code; Block Name
# ================================================
# Note: When comparing block names, casing, whitespace, hyphens,
# and underbars are ignored.
# For example, "Latin Extended-A" and "latin extended a" are equivalent.
# For more information on the comparison of property values,
# see UCD.html.
#
# All code points not explicitly listed for Block
# have the value No_Block.
# Property: Block
#
# @missing: 0000..10FFFF; No_Block
0000..007F; Basic Latin
0080..00FF; Latin-1 Supplement
0100..017F; Latin Extended-A
0180..024F; Latin Extended-B
0250..02AF; IPA Extensions
02B0..02FF; Spacing Modifier Letters
0300..036F; Combining Diacritical Marks
0370..03FF; Greek and Coptic
0400..04FF; Cyrillic
0500..052F; Cyrillic Supplement
0530..058F; Armenian
0590..05FF; Hebrew
0600..06FF; Arabic
0700..074F; Syriac
0750..077F; Arabic Supplement
0780..07BF; Thaana
07C0..07FF; NKo
0900..097F; Devanagari
0980..09FF; Bengali
0A00..0A7F; Gurmukhi
0A80..0AFF; Gujarati
0B00..0B7F; Oriya
0B80..0BFF; Tamil
0C00..0C7F; Telugu
0C80..0CFF; Kannada
0D00..0D7F; Malayalam
0D80..0DFF; Sinhala
0E00..0E7F; Thai
0E80..0EFF; Lao
0F00..0FFF; Tibetan
1000..109F; Myanmar
10A0..10FF; Georgian
1100..11FF; Hangul Jamo
1200..137F; Ethiopic
1380..139F; Ethiopic Supplement
13A0..13FF; Cherokee
1400..167F; Unified Canadian Aboriginal Syllabics
1680..169F; Ogham
16A0..16FF; Runic
1700..171F; Tagalog
1720..173F; Hanunoo
1740..175F; Buhid
1760..177F; Tagbanwa
1780..17FF; Khmer
1800..18AF; Mongolian
1900..194F; Limbu
1950..197F; Tai Le
1980..19DF; New Tai Lue
19E0..19FF; Khmer Symbols
1A00..1A1F; Buginese
1B00..1B7F; Balinese
1D00..1D7F; Phonetic Extensions
1D80..1DBF; Phonetic Extensions Supplement
1DC0..1DFF; Combining Diacritical Marks Supplement
1E00..1EFF; Latin Extended Additional
1F00..1FFF; Greek Extended
2000..206F; General Punctuation
2070..209F; Superscripts and Subscripts
20A0..20CF; Currency Symbols
20D0..20FF; Combining Diacritical Marks for Symbols
2100..214F; Letterlike Symbols
2150..218F; Number Forms
2190..21FF; Arrows
2200..22FF; Mathematical Operators
2300..23FF; Miscellaneous Technical
2400..243F; Control Pictures
2440..245F; Optical Character Recognition
2460..24FF; Enclosed Alphanumerics
2500..257F; Box Drawing
2580..259F; Block Elements
25A0..25FF; Geometric Shapes
2600..26FF; Miscellaneous Symbols
2700..27BF; Dingbats
27C0..27EF; Miscellaneous Mathematical Symbols-A
27F0..27FF; Supplemental Arrows-A
2800..28FF; Braille Patterns
2900..297F; Supplemental Arrows-B
2980..29FF; Miscellaneous Mathematical Symbols-B
2A00..2AFF; Supplemental Mathematical Operators
2B00..2BFF; Miscellaneous Symbols and Arrows
2C00..2C5F; Glagolitic
2C60..2C7F; Latin Extended-C
2C80..2CFF; Coptic
2D00..2D2F; Georgian Supplement
2D30..2D7F; Tifinagh
2D80..2DDF; Ethiopic Extended
2E00..2E7F; Supplemental Punctuation
2E80..2EFF; CJK Radicals Supplement
2F00..2FDF; Kangxi Radicals
2FF0..2FFF; Ideographic Description Characters
3000..303F; CJK Symbols and Punctuation
3040..309F; Hiragana
30A0..30FF; Katakana
3100..312F; Bopomofo
3130..318F; Hangul Compatibility Jamo
3190..319F; Kanbun
31A0..31BF; Bopomofo Extended
31C0..31EF; CJK Strokes
31F0..31FF; Katakana Phonetic Extensions
3200..32FF; Enclosed CJK Letters and Months
3300..33FF; CJK Compatibility
3400..4DBF; CJK Unified Ideographs Extension A
4DC0..4DFF; Yijing Hexagram Symbols
4E00..9FFF; CJK Unified Ideographs
A000..A48F; Yi Syllables
A490..A4CF; Yi Radicals
A700..A71F; Modifier Tone Letters
A720..A7FF; Latin Extended-D
A800..A82F; Syloti Nagri
A840..A87F; Phags-pa
AC00..D7AF; Hangul Syllables
D800..DB7F; High Surrogates
DB80..DBFF; High Private Use Surrogates
DC00..DFFF; Low Surrogates
E000..F8FF; Private Use Area
F900..FAFF; CJK Compatibility Ideographs
FB00..FB4F; Alphabetic Presentation Forms
FB50..FDFF; Arabic Presentation Forms-A
FE00..FE0F; Variation Selectors
FE10..FE1F; Vertical Forms
FE20..FE2F; Combining Half Marks
FE30..FE4F; CJK Compatibility Forms
FE50..FE6F; Small Form Variants
FE70..FEFF; Arabic Presentation Forms-B
FF00..FFEF; Halfwidth and Fullwidth Forms
FFF0..FFFF; Specials
10000..1007F; Linear B Syllabary
10080..100FF; Linear B Ideograms
10100..1013F; Aegean Numbers
10140..1018F; Ancient Greek Numbers
10300..1032F; Old Italic
10330..1034F; Gothic
10380..1039F; Ugaritic
103A0..103DF; Old Persian
10400..1044F; Deseret
10450..1047F; Shavian
10480..104AF; Osmanya
10800..1083F; Cypriot Syllabary
10900..1091F; Phoenician
10A00..10A5F; Kharoshthi
12000..123FF; Cuneiform
12400..1247F; Cuneiform Numbers and Punctuation
1D000..1D0FF; Byzantine Musical Symbols
1D100..1D1FF; Musical Symbols
1D200..1D24F; Ancient Greek Musical Notation
1D300..1D35F; Tai Xuan Jing Symbols
1D360..1D37F; Counting Rod Numerals
1D400..1D7FF; Mathematical Alphanumeric Symbols
20000..2A6DF; CJK Unified Ideographs Extension B
2F800..2FA1F; CJK Compatibility Ideographs Supplement
E0000..E007F; Tags
E0100..E01EF; Variation Selectors Supplement
F0000..FFFFF; Supplementary Private Use Area-A
100000..10FFFF; Supplementary Private Use Area-B
# EOF

File diff suppressed because it is too large Load Diff

View File

@ -0,0 +1,197 @@
# CompositionExclusions-5.0.0.txt
# Date: 2006-05-23, 12:42:00 PST [KW]
#
# This file lists the characters for the Composition Exclusion Table
# defined in UAX #15, Unicode Normalization Forms.
#
# This file is a normative contributory data file in the
# Unicode Character Database.
#
# Copyright (c) 1991-2006 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
#
# For more information, see
# http://www.unicode.org/unicode/reports/tr15/#Primary Exclusion List Table
#
# For a full derivation of composition exclusions, see the derived property
# Full_Composition_Exclusion in DerivedNormalizationProps.txt
#
# ================================================
# (1) Script Specifics
#
# This list of characters cannot be derived from the UnicodeData.txt file.
# ================================================
0958 # DEVANAGARI LETTER QA
0959 # DEVANAGARI LETTER KHHA
095A # DEVANAGARI LETTER GHHA
095B # DEVANAGARI LETTER ZA
095C # DEVANAGARI LETTER DDDHA
095D # DEVANAGARI LETTER RHA
095E # DEVANAGARI LETTER FA
095F # DEVANAGARI LETTER YYA
09DC # BENGALI LETTER RRA
09DD # BENGALI LETTER RHA
09DF # BENGALI LETTER YYA
0A33 # GURMUKHI LETTER LLA
0A36 # GURMUKHI LETTER SHA
0A59 # GURMUKHI LETTER KHHA
0A5A # GURMUKHI LETTER GHHA
0A5B # GURMUKHI LETTER ZA
0A5E # GURMUKHI LETTER FA
0B5C # ORIYA LETTER RRA
0B5D # ORIYA LETTER RHA
0F43 # TIBETAN LETTER GHA
0F4D # TIBETAN LETTER DDHA
0F52 # TIBETAN LETTER DHA
0F57 # TIBETAN LETTER BHA
0F5C # TIBETAN LETTER DZHA
0F69 # TIBETAN LETTER KSSA
0F76 # TIBETAN VOWEL SIGN VOCALIC R
0F78 # TIBETAN VOWEL SIGN VOCALIC L
0F93 # TIBETAN SUBJOINED LETTER GHA
0F9D # TIBETAN SUBJOINED LETTER DDHA
0FA2 # TIBETAN SUBJOINED LETTER DHA
0FA7 # TIBETAN SUBJOINED LETTER BHA
0FAC # TIBETAN SUBJOINED LETTER DZHA
0FB9 # TIBETAN SUBJOINED LETTER KSSA
FB1D # HEBREW LETTER YOD WITH HIRIQ
FB1F # HEBREW LIGATURE YIDDISH YOD YOD PATAH
FB2A # HEBREW LETTER SHIN WITH SHIN DOT
FB2B # HEBREW LETTER SHIN WITH SIN DOT
FB2C # HEBREW LETTER SHIN WITH DAGESH AND SHIN DOT
FB2D # HEBREW LETTER SHIN WITH DAGESH AND SIN DOT
FB2E # HEBREW LETTER ALEF WITH PATAH
FB2F # HEBREW LETTER ALEF WITH QAMATS
FB30 # HEBREW LETTER ALEF WITH MAPIQ
FB31 # HEBREW LETTER BET WITH DAGESH
FB32 # HEBREW LETTER GIMEL WITH DAGESH
FB33 # HEBREW LETTER DALET WITH DAGESH
FB34 # HEBREW LETTER HE WITH MAPIQ
FB35 # HEBREW LETTER VAV WITH DAGESH
FB36 # HEBREW LETTER ZAYIN WITH DAGESH
FB38 # HEBREW LETTER TET WITH DAGESH
FB39 # HEBREW LETTER YOD WITH DAGESH
FB3A # HEBREW LETTER FINAL KAF WITH DAGESH
FB3B # HEBREW LETTER KAF WITH DAGESH
FB3C # HEBREW LETTER LAMED WITH DAGESH
FB3E # HEBREW LETTER MEM WITH DAGESH
FB40 # HEBREW LETTER NUN WITH DAGESH
FB41 # HEBREW LETTER SAMEKH WITH DAGESH
FB43 # HEBREW LETTER FINAL PE WITH DAGESH
FB44 # HEBREW LETTER PE WITH DAGESH
FB46 # HEBREW LETTER TSADI WITH DAGESH
FB47 # HEBREW LETTER QOF WITH DAGESH
FB48 # HEBREW LETTER RESH WITH DAGESH
FB49 # HEBREW LETTER SHIN WITH DAGESH
FB4A # HEBREW LETTER TAV WITH DAGESH
FB4B # HEBREW LETTER VAV WITH HOLAM
FB4C # HEBREW LETTER BET WITH RAFE
FB4D # HEBREW LETTER KAF WITH RAFE
FB4E # HEBREW LETTER PE WITH RAFE
# Total code points: 67
# ================================================
# (2) Post Composition Version precomposed characters
#
# These characters cannot be derived solely from the UnicodeData.txt file
# in this version of Unicode.
#
# Note that characters added to the standard after the
# Composition Version and which have canonical decomposition mappings
# are not automatically added to this list of Post Composition
# Version precomposed characters.
# ================================================
2ADC # FORKING
1D15E # MUSICAL SYMBOL HALF NOTE
1D15F # MUSICAL SYMBOL QUARTER NOTE
1D160 # MUSICAL SYMBOL EIGHTH NOTE
1D161 # MUSICAL SYMBOL SIXTEENTH NOTE
1D162 # MUSICAL SYMBOL THIRTY-SECOND NOTE
1D163 # MUSICAL SYMBOL SIXTY-FOURTH NOTE
1D164 # MUSICAL SYMBOL ONE HUNDRED TWENTY-EIGHTH NOTE
1D1BB # MUSICAL SYMBOL MINIMA
1D1BC # MUSICAL SYMBOL MINIMA BLACK
1D1BD # MUSICAL SYMBOL SEMIMINIMA WHITE
1D1BE # MUSICAL SYMBOL SEMIMINIMA BLACK
1D1BF # MUSICAL SYMBOL FUSA WHITE
1D1C0 # MUSICAL SYMBOL FUSA BLACK
# Total code points: 14
# ================================================
# (3) Singleton Decompositions
#
# These characters can be derived from the UnicodeData.txt file
# by including all characters whose canonical decomposition
# consists of a single character.
#
# These characters are simply quoted here for reference.
# See also Full_Composition_Exclusion in DerivedNormalizationProps.txt
# ================================================
# 0340..0341 [2] COMBINING GRAVE TONE MARK..COMBINING ACUTE TONE MARK
# 0343 COMBINING GREEK KORONIS
# 0374 GREEK NUMERAL SIGN
# 037E GREEK QUESTION MARK
# 0387 GREEK ANO TELEIA
# 1F71 GREEK SMALL LETTER ALPHA WITH OXIA
# 1F73 GREEK SMALL LETTER EPSILON WITH OXIA
# 1F75 GREEK SMALL LETTER ETA WITH OXIA
# 1F77 GREEK SMALL LETTER IOTA WITH OXIA
# 1F79 GREEK SMALL LETTER OMICRON WITH OXIA
# 1F7B GREEK SMALL LETTER UPSILON WITH OXIA
# 1F7D GREEK SMALL LETTER OMEGA WITH OXIA
# 1FBB GREEK CAPITAL LETTER ALPHA WITH OXIA
# 1FBE GREEK PROSGEGRAMMENI
# 1FC9 GREEK CAPITAL LETTER EPSILON WITH OXIA
# 1FCB GREEK CAPITAL LETTER ETA WITH OXIA
# 1FD3 GREEK SMALL LETTER IOTA WITH DIALYTIKA AND OXIA
# 1FDB GREEK CAPITAL LETTER IOTA WITH OXIA
# 1FE3 GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND OXIA
# 1FEB GREEK CAPITAL LETTER UPSILON WITH OXIA
# 1FEE..1FEF [2] GREEK DIALYTIKA AND OXIA..GREEK VARIA
# 1FF9 GREEK CAPITAL LETTER OMICRON WITH OXIA
# 1FFB GREEK CAPITAL LETTER OMEGA WITH OXIA
# 1FFD GREEK OXIA
# 2000..2001 [2] EN QUAD..EM QUAD
# 2126 OHM SIGN
# 212A..212B [2] KELVIN SIGN..ANGSTROM SIGN
# 2329 LEFT-POINTING ANGLE BRACKET
# 232A RIGHT-POINTING ANGLE BRACKET
# F900..FA0D [270] CJK COMPATIBILITY IDEOGRAPH-F900..CJK COMPATIBILITY IDEOGRAPH-FA0D
# FA10 CJK COMPATIBILITY IDEOGRAPH-FA10
# FA12 CJK COMPATIBILITY IDEOGRAPH-FA12
# FA15..FA1E [10] CJK COMPATIBILITY IDEOGRAPH-FA15..CJK COMPATIBILITY IDEOGRAPH-FA1E
# FA20 CJK COMPATIBILITY IDEOGRAPH-FA20
# FA22 CJK COMPATIBILITY IDEOGRAPH-FA22
# FA25..FA26 [2] CJK COMPATIBILITY IDEOGRAPH-FA25..CJK COMPATIBILITY IDEOGRAPH-FA26
# FA2A..FA2D [4] CJK COMPATIBILITY IDEOGRAPH-FA2A..CJK COMPATIBILITY IDEOGRAPH-FA2D
# FA30..FA6A [59] CJK COMPATIBILITY IDEOGRAPH-FA30..CJK COMPATIBILITY IDEOGRAPH-FA6A
# FA70..FAD9 [106] CJK COMPATIBILITY IDEOGRAPH-FA70..CJK COMPATIBILITY IDEOGRAPH-FAD9
# 2F800..2FA1D [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D
# Total code points: 924
# ================================================
# (4) Non-Starter Decompositions
#
# These characters can be derived from the UnicodeData file
# by including all characters whose canonical decomposition consists
# of a sequence of characters, the first of which has a non-zero
# combining class.
#
# These characters are simply quoted here for reference.
# See also Full_Composition_Exclusion in DerivedNormalizationProps.txt
# ================================================
# 0344 COMBINING GREEK DIALYTIKA TONOS
# 0F73 TIBETAN VOWEL SIGN II
# 0F75 TIBETAN VOWEL SIGN UU
# 0F81 TIBETAN VOWEL SIGN REVERSED II
# Total code points: 4

View File

@ -0,0 +1,867 @@
# DerivedAge-5.0.0.txt
# Date: 2006-07-14, 17:25:00 PST [MD/KW]
#
# Unicode Character Database
# Copyright (c) 1991-2006 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
# For documentation, see UCD.html
#
# Unicode Character Database: Derived Property Data
# This file shows when various code points were first assigned in Unicode.
#
# Caution: When using the Age *property*, all assigned code points
# in each version are included, not just the newly assigned code points.
# For more information, see http://www.unicode.org/reports/tr18/
#
# Notes:
#
# - The term 'assigned' means that a previously reserved code point was assigned
# to be a character (graphic, format, control, or private-use);
# a noncharacter code point; or a surrogate code point.
# For more information, see The Unicode Standard Section 2.4
#
# - Versions are only tracked from 1.1 onwards, since version 1.0
# predated changes required by the ISO 10646 merger.
#
# - The Hangul Syllables that were removed from 2.0 are not included in the 1.1 listing.
#
# - The supplementary private use code points and the non-character code points
# were assigned in version 2.0, but not specifically listed in the UCD
# until versions 3.0 and 3.1 respectively.
#
# - Contiguous ranges are broken into separate lines where they would cross code point
# types: graphic, format, control, private-use, surrogate, noncharacter
#
# For details on the contents of each version, see
# http://www.unicode.org/versions/enumeratedversions.html.
# ================================================
# Property: Age
# All code points not explicitly listed for Age
# have the value unassigned.
# @missing: 0000..10FFFF; unassigned
# ================================================
# Assigned as of Unicode 1.1.0 (June, 1993)
# [excluding removed Hangul Syllables]
0000..001F ; 1.1 # [32] <control-0000>..<control-001F>
0020..007E ; 1.1 # [95] SPACE..TILDE
007F..009F ; 1.1 # [33] <control-007F>..<control-009F>
00A0..00AC ; 1.1 # [13] NO-BREAK SPACE..NOT SIGN
00AD ; 1.1 # SOFT HYPHEN
00AE..01F5 ; 1.1 # [328] REGISTERED SIGN..LATIN SMALL LETTER G WITH ACUTE
01FA..0217 ; 1.1 # [30] LATIN CAPITAL LETTER A WITH RING ABOVE AND ACUTE..LATIN SMALL LETTER U WITH INVERTED BREVE
0250..02A8 ; 1.1 # [89] LATIN SMALL LETTER TURNED A..LATIN SMALL LETTER TC DIGRAPH WITH CURL
02B0..02DE ; 1.1 # [47] MODIFIER LETTER SMALL H..MODIFIER LETTER RHOTIC HOOK
02E0..02E9 ; 1.1 # [10] MODIFIER LETTER SMALL GAMMA..MODIFIER LETTER EXTRA-LOW TONE BAR
0300..0345 ; 1.1 # [70] COMBINING GRAVE ACCENT..COMBINING GREEK YPOGEGRAMMENI
0360..0361 ; 1.1 # [2] COMBINING DOUBLE TILDE..COMBINING DOUBLE INVERTED BREVE
0374..0375 ; 1.1 # [2] GREEK NUMERAL SIGN..GREEK LOWER NUMERAL SIGN
037A ; 1.1 # GREEK YPOGEGRAMMENI
037E ; 1.1 # GREEK QUESTION MARK
0384..038A ; 1.1 # [7] GREEK TONOS..GREEK CAPITAL LETTER IOTA WITH TONOS
038C ; 1.1 # GREEK CAPITAL LETTER OMICRON WITH TONOS
038E..03A1 ; 1.1 # [20] GREEK CAPITAL LETTER UPSILON WITH TONOS..GREEK CAPITAL LETTER RHO
03A3..03CE ; 1.1 # [44] GREEK CAPITAL LETTER SIGMA..GREEK SMALL LETTER OMEGA WITH TONOS
03D0..03D6 ; 1.1 # [7] GREEK BETA SYMBOL..GREEK PI SYMBOL
03DA ; 1.1 # GREEK LETTER STIGMA
03DC ; 1.1 # GREEK LETTER DIGAMMA
03DE ; 1.1 # GREEK LETTER KOPPA
03E0 ; 1.1 # GREEK LETTER SAMPI
03E2..03F3 ; 1.1 # [18] COPTIC CAPITAL LETTER SHEI..GREEK LETTER YOT
0401..040C ; 1.1 # [12] CYRILLIC CAPITAL LETTER IO..CYRILLIC CAPITAL LETTER KJE
040E..044F ; 1.1 # [66] CYRILLIC CAPITAL LETTER SHORT U..CYRILLIC SMALL LETTER YA
0451..045C ; 1.1 # [12] CYRILLIC SMALL LETTER IO..CYRILLIC SMALL LETTER KJE
045E..0486 ; 1.1 # [41] CYRILLIC SMALL LETTER SHORT U..COMBINING CYRILLIC PSILI PNEUMATA
0490..04C4 ; 1.1 # [53] CYRILLIC CAPITAL LETTER GHE WITH UPTURN..CYRILLIC SMALL LETTER KA WITH HOOK
04C7..04C8 ; 1.1 # [2] CYRILLIC CAPITAL LETTER EN WITH HOOK..CYRILLIC SMALL LETTER EN WITH HOOK
04CB..04CC ; 1.1 # [2] CYRILLIC CAPITAL LETTER KHAKASSIAN CHE..CYRILLIC SMALL LETTER KHAKASSIAN CHE
04D0..04EB ; 1.1 # [28] CYRILLIC CAPITAL LETTER A WITH BREVE..CYRILLIC SMALL LETTER BARRED O WITH DIAERESIS
04EE..04F5 ; 1.1 # [8] CYRILLIC CAPITAL LETTER U WITH MACRON..CYRILLIC SMALL LETTER CHE WITH DIAERESIS
04F8..04F9 ; 1.1 # [2] CYRILLIC CAPITAL LETTER YERU WITH DIAERESIS..CYRILLIC SMALL LETTER YERU WITH DIAERESIS
0531..0556 ; 1.1 # [38] ARMENIAN CAPITAL LETTER AYB..ARMENIAN CAPITAL LETTER FEH
0559..055F ; 1.1 # [7] ARMENIAN MODIFIER LETTER LEFT HALF RING..ARMENIAN ABBREVIATION MARK
0561..0587 ; 1.1 # [39] ARMENIAN SMALL LETTER AYB..ARMENIAN SMALL LIGATURE ECH YIWN
0589 ; 1.1 # ARMENIAN FULL STOP
05B0..05B9 ; 1.1 # [10] HEBREW POINT SHEVA..HEBREW POINT HOLAM
05BB..05C3 ; 1.1 # [9] HEBREW POINT QUBUTS..HEBREW PUNCTUATION SOF PASUQ
05D0..05EA ; 1.1 # [27] HEBREW LETTER ALEF..HEBREW LETTER TAV
05F0..05F4 ; 1.1 # [5] HEBREW LIGATURE YIDDISH DOUBLE VAV..HEBREW PUNCTUATION GERSHAYIM
060C ; 1.1 # ARABIC COMMA
061B ; 1.1 # ARABIC SEMICOLON
061F ; 1.1 # ARABIC QUESTION MARK
0621..063A ; 1.1 # [26] ARABIC LETTER HAMZA..ARABIC LETTER GHAIN
0640..0652 ; 1.1 # [19] ARABIC TATWEEL..ARABIC SUKUN
0660..066D ; 1.1 # [14] ARABIC-INDIC DIGIT ZERO..ARABIC FIVE POINTED STAR
0670..06B7 ; 1.1 # [72] ARABIC LETTER SUPERSCRIPT ALEF..ARABIC LETTER LAM WITH THREE DOTS ABOVE
06BA..06BE ; 1.1 # [5] ARABIC LETTER NOON GHUNNA..ARABIC LETTER HEH DOACHASHMEE
06C0..06CE ; 1.1 # [15] ARABIC LETTER HEH WITH YEH ABOVE..ARABIC LETTER YEH WITH SMALL V
06D0..06DC ; 1.1 # [13] ARABIC LETTER E..ARABIC SMALL HIGH SEEN
06DD ; 1.1 # ARABIC END OF AYAH
06DE..06ED ; 1.1 # [16] ARABIC START OF RUB EL HIZB..ARABIC SMALL LOW MEEM
06F0..06F9 ; 1.1 # [10] EXTENDED ARABIC-INDIC DIGIT ZERO..EXTENDED ARABIC-INDIC DIGIT NINE
0901..0903 ; 1.1 # [3] DEVANAGARI SIGN CANDRABINDU..DEVANAGARI SIGN VISARGA
0905..0939 ; 1.1 # [53] DEVANAGARI LETTER A..DEVANAGARI LETTER HA
093C..094D ; 1.1 # [18] DEVANAGARI SIGN NUKTA..DEVANAGARI SIGN VIRAMA
0950..0954 ; 1.1 # [5] DEVANAGARI OM..DEVANAGARI ACUTE ACCENT
0958..0970 ; 1.1 # [25] DEVANAGARI LETTER QA..DEVANAGARI ABBREVIATION SIGN
0981..0983 ; 1.1 # [3] BENGALI SIGN CANDRABINDU..BENGALI SIGN VISARGA
0985..098C ; 1.1 # [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L
098F..0990 ; 1.1 # [2] BENGALI LETTER E..BENGALI LETTER AI
0993..09A8 ; 1.1 # [22] BENGALI LETTER O..BENGALI LETTER NA
09AA..09B0 ; 1.1 # [7] BENGALI LETTER PA..BENGALI LETTER RA
09B2 ; 1.1 # BENGALI LETTER LA
09B6..09B9 ; 1.1 # [4] BENGALI LETTER SHA..BENGALI LETTER HA
09BC ; 1.1 # BENGALI SIGN NUKTA
09BE..09C4 ; 1.1 # [7] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN VOCALIC RR
09C7..09C8 ; 1.1 # [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI
09CB..09CD ; 1.1 # [3] BENGALI VOWEL SIGN O..BENGALI SIGN VIRAMA
09D7 ; 1.1 # BENGALI AU LENGTH MARK
09DC..09DD ; 1.1 # [2] BENGALI LETTER RRA..BENGALI LETTER RHA
09DF..09E3 ; 1.1 # [5] BENGALI LETTER YYA..BENGALI VOWEL SIGN VOCALIC LL
09E6..09FA ; 1.1 # [21] BENGALI DIGIT ZERO..BENGALI ISSHAR
0A02 ; 1.1 # GURMUKHI SIGN BINDI
0A05..0A0A ; 1.1 # [6] GURMUKHI LETTER A..GURMUKHI LETTER UU
0A0F..0A10 ; 1.1 # [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI
0A13..0A28 ; 1.1 # [22] GURMUKHI LETTER OO..GURMUKHI LETTER NA
0A2A..0A30 ; 1.1 # [7] GURMUKHI LETTER PA..GURMUKHI LETTER RA
0A32..0A33 ; 1.1 # [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA
0A35..0A36 ; 1.1 # [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA
0A38..0A39 ; 1.1 # [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA
0A3C ; 1.1 # GURMUKHI SIGN NUKTA
0A3E..0A42 ; 1.1 # [5] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN UU
0A47..0A48 ; 1.1 # [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI
0A4B..0A4D ; 1.1 # [3] GURMUKHI VOWEL SIGN OO..GURMUKHI SIGN VIRAMA
0A59..0A5C ; 1.1 # [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA
0A5E ; 1.1 # GURMUKHI LETTER FA
0A66..0A74 ; 1.1 # [15] GURMUKHI DIGIT ZERO..GURMUKHI EK ONKAR
0A81..0A83 ; 1.1 # [3] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN VISARGA
0A85..0A8B ; 1.1 # [7] GUJARATI LETTER A..GUJARATI LETTER VOCALIC R
0A8D ; 1.1 # GUJARATI VOWEL CANDRA E
0A8F..0A91 ; 1.1 # [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O
0A93..0AA8 ; 1.1 # [22] GUJARATI LETTER O..GUJARATI LETTER NA
0AAA..0AB0 ; 1.1 # [7] GUJARATI LETTER PA..GUJARATI LETTER RA
0AB2..0AB3 ; 1.1 # [2] GUJARATI LETTER LA..GUJARATI LETTER LLA
0AB5..0AB9 ; 1.1 # [5] GUJARATI LETTER VA..GUJARATI LETTER HA
0ABC..0AC5 ; 1.1 # [10] GUJARATI SIGN NUKTA..GUJARATI VOWEL SIGN CANDRA E
0AC7..0AC9 ; 1.1 # [3] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN CANDRA O
0ACB..0ACD ; 1.1 # [3] GUJARATI VOWEL SIGN O..GUJARATI SIGN VIRAMA
0AD0 ; 1.1 # GUJARATI OM
0AE0 ; 1.1 # GUJARATI LETTER VOCALIC RR
0AE6..0AEF ; 1.1 # [10] GUJARATI DIGIT ZERO..GUJARATI DIGIT NINE
0B01..0B03 ; 1.1 # [3] ORIYA SIGN CANDRABINDU..ORIYA SIGN VISARGA
0B05..0B0C ; 1.1 # [8] ORIYA LETTER A..ORIYA LETTER VOCALIC L
0B0F..0B10 ; 1.1 # [2] ORIYA LETTER E..ORIYA LETTER AI
0B13..0B28 ; 1.1 # [22] ORIYA LETTER O..ORIYA LETTER NA
0B2A..0B30 ; 1.1 # [7] ORIYA LETTER PA..ORIYA LETTER RA
0B32..0B33 ; 1.1 # [2] ORIYA LETTER LA..ORIYA LETTER LLA
0B36..0B39 ; 1.1 # [4] ORIYA LETTER SHA..ORIYA LETTER HA
0B3C..0B43 ; 1.1 # [8] ORIYA SIGN NUKTA..ORIYA VOWEL SIGN VOCALIC R
0B47..0B48 ; 1.1 # [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI
0B4B..0B4D ; 1.1 # [3] ORIYA VOWEL SIGN O..ORIYA SIGN VIRAMA
0B56..0B57 ; 1.1 # [2] ORIYA AI LENGTH MARK..ORIYA AU LENGTH MARK
0B5C..0B5D ; 1.1 # [2] ORIYA LETTER RRA..ORIYA LETTER RHA
0B5F..0B61 ; 1.1 # [3] ORIYA LETTER YYA..ORIYA LETTER VOCALIC LL
0B66..0B70 ; 1.1 # [11] ORIYA DIGIT ZERO..ORIYA ISSHAR
0B82..0B83 ; 1.1 # [2] TAMIL SIGN ANUSVARA..TAMIL SIGN VISARGA
0B85..0B8A ; 1.1 # [6] TAMIL LETTER A..TAMIL LETTER UU
0B8E..0B90 ; 1.1 # [3] TAMIL LETTER E..TAMIL LETTER AI
0B92..0B95 ; 1.1 # [4] TAMIL LETTER O..TAMIL LETTER KA
0B99..0B9A ; 1.1 # [2] TAMIL LETTER NGA..TAMIL LETTER CA
0B9C ; 1.1 # TAMIL LETTER JA
0B9E..0B9F ; 1.1 # [2] TAMIL LETTER NYA..TAMIL LETTER TTA
0BA3..0BA4 ; 1.1 # [2] TAMIL LETTER NNA..TAMIL LETTER TA
0BA8..0BAA ; 1.1 # [3] TAMIL LETTER NA..TAMIL LETTER PA
0BAE..0BB5 ; 1.1 # [8] TAMIL LETTER MA..TAMIL LETTER VA
0BB7..0BB9 ; 1.1 # [3] TAMIL LETTER SSA..TAMIL LETTER HA
0BBE..0BC2 ; 1.1 # [5] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN UU
0BC6..0BC8 ; 1.1 # [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI
0BCA..0BCD ; 1.1 # [4] TAMIL VOWEL SIGN O..TAMIL SIGN VIRAMA
0BD7 ; 1.1 # TAMIL AU LENGTH MARK
0BE7..0BF2 ; 1.1 # [12] TAMIL DIGIT ONE..TAMIL NUMBER ONE THOUSAND
0C01..0C03 ; 1.1 # [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN VISARGA
0C05..0C0C ; 1.1 # [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L
0C0E..0C10 ; 1.1 # [3] TELUGU LETTER E..TELUGU LETTER AI
0C12..0C28 ; 1.1 # [23] TELUGU LETTER O..TELUGU LETTER NA
0C2A..0C33 ; 1.1 # [10] TELUGU LETTER PA..TELUGU LETTER LLA
0C35..0C39 ; 1.1 # [5] TELUGU LETTER VA..TELUGU LETTER HA
0C3E..0C44 ; 1.1 # [7] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN VOCALIC RR
0C46..0C48 ; 1.1 # [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI
0C4A..0C4D ; 1.1 # [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA
0C55..0C56 ; 1.1 # [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK
0C60..0C61 ; 1.1 # [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL
0C66..0C6F ; 1.1 # [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE
0C82..0C83 ; 1.1 # [2] KANNADA SIGN ANUSVARA..KANNADA SIGN VISARGA
0C85..0C8C ; 1.1 # [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L
0C8E..0C90 ; 1.1 # [3] KANNADA LETTER E..KANNADA LETTER AI
0C92..0CA8 ; 1.1 # [23] KANNADA LETTER O..KANNADA LETTER NA
0CAA..0CB3 ; 1.1 # [10] KANNADA LETTER PA..KANNADA LETTER LLA
0CB5..0CB9 ; 1.1 # [5] KANNADA LETTER VA..KANNADA LETTER HA
0CBE..0CC4 ; 1.1 # [7] KANNADA VOWEL SIGN AA..KANNADA VOWEL SIGN VOCALIC RR
0CC6..0CC8 ; 1.1 # [3] KANNADA VOWEL SIGN E..KANNADA VOWEL SIGN AI
0CCA..0CCD ; 1.1 # [4] KANNADA VOWEL SIGN O..KANNADA SIGN VIRAMA
0CD5..0CD6 ; 1.1 # [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK
0CDE ; 1.1 # KANNADA LETTER FA
0CE0..0CE1 ; 1.1 # [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL
0CE6..0CEF ; 1.1 # [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE
0D02..0D03 ; 1.1 # [2] MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA
0D05..0D0C ; 1.1 # [8] MALAYALAM LETTER A..MALAYALAM LETTER VOCALIC L
0D0E..0D10 ; 1.1 # [3] MALAYALAM LETTER E..MALAYALAM LETTER AI
0D12..0D28 ; 1.1 # [23] MALAYALAM LETTER O..MALAYALAM LETTER NA
0D2A..0D39 ; 1.1 # [16] MALAYALAM LETTER PA..MALAYALAM LETTER HA
0D3E..0D43 ; 1.1 # [6] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN VOCALIC R
0D46..0D48 ; 1.1 # [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI
0D4A..0D4D ; 1.1 # [4] MALAYALAM VOWEL SIGN O..MALAYALAM SIGN VIRAMA
0D57 ; 1.1 # MALAYALAM AU LENGTH MARK
0D60..0D61 ; 1.1 # [2] MALAYALAM LETTER VOCALIC RR..MALAYALAM LETTER VOCALIC LL
0D66..0D6F ; 1.1 # [10] MALAYALAM DIGIT ZERO..MALAYALAM DIGIT NINE
0E01..0E3A ; 1.1 # [58] THAI CHARACTER KO KAI..THAI CHARACTER PHINTHU
0E3F..0E5B ; 1.1 # [29] THAI CURRENCY SYMBOL BAHT..THAI CHARACTER KHOMUT
0E81..0E82 ; 1.1 # [2] LAO LETTER KO..LAO LETTER KHO SUNG
0E84 ; 1.1 # LAO LETTER KHO TAM
0E87..0E88 ; 1.1 # [2] LAO LETTER NGO..LAO LETTER CO
0E8A ; 1.1 # LAO LETTER SO TAM
0E8D ; 1.1 # LAO LETTER NYO
0E94..0E97 ; 1.1 # [4] LAO LETTER DO..LAO LETTER THO TAM
0E99..0E9F ; 1.1 # [7] LAO LETTER NO..LAO LETTER FO SUNG
0EA1..0EA3 ; 1.1 # [3] LAO LETTER MO..LAO LETTER LO LING
0EA5 ; 1.1 # LAO LETTER LO LOOT
0EA7 ; 1.1 # LAO LETTER WO
0EAA..0EAB ; 1.1 # [2] LAO LETTER SO SUNG..LAO LETTER HO SUNG
0EAD..0EB9 ; 1.1 # [13] LAO LETTER O..LAO VOWEL SIGN UU
0EBB..0EBD ; 1.1 # [3] LAO VOWEL SIGN MAI KON..LAO SEMIVOWEL SIGN NYO
0EC0..0EC4 ; 1.1 # [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI
0EC6 ; 1.1 # LAO KO LA
0EC8..0ECD ; 1.1 # [6] LAO TONE MAI EK..LAO NIGGAHITA
0ED0..0ED9 ; 1.1 # [10] LAO DIGIT ZERO..LAO DIGIT NINE
0EDC..0EDD ; 1.1 # [2] LAO HO NO..LAO HO MO
10A0..10C5 ; 1.1 # [38] GEORGIAN CAPITAL LETTER AN..GEORGIAN CAPITAL LETTER HOE
10D0..10F6 ; 1.1 # [39] GEORGIAN LETTER AN..GEORGIAN LETTER FI
10FB ; 1.1 # GEORGIAN PARAGRAPH SEPARATOR
1100..1159 ; 1.1 # [90] HANGUL CHOSEONG KIYEOK..HANGUL CHOSEONG YEORINHIEUH
115F..11A2 ; 1.1 # [68] HANGUL CHOSEONG FILLER..HANGUL JUNGSEONG SSANGARAEA
11A8..11F9 ; 1.1 # [82] HANGUL JONGSEONG KIYEOK..HANGUL JONGSEONG YEORINHIEUH
1E00..1E9A ; 1.1 # [155] LATIN CAPITAL LETTER A WITH RING BELOW..LATIN SMALL LETTER A WITH RIGHT HALF RING
1EA0..1EF9 ; 1.1 # [90] LATIN CAPITAL LETTER A WITH DOT BELOW..LATIN SMALL LETTER Y WITH TILDE
1F00..1F15 ; 1.1 # [22] GREEK SMALL LETTER ALPHA WITH PSILI..GREEK SMALL LETTER EPSILON WITH DASIA AND OXIA
1F18..1F1D ; 1.1 # [6] GREEK CAPITAL LETTER EPSILON WITH PSILI..GREEK CAPITAL LETTER EPSILON WITH DASIA AND OXIA
1F20..1F45 ; 1.1 # [38] GREEK SMALL LETTER ETA WITH PSILI..GREEK SMALL LETTER OMICRON WITH DASIA AND OXIA
1F48..1F4D ; 1.1 # [6] GREEK CAPITAL LETTER OMICRON WITH PSILI..GREEK CAPITAL LETTER OMICRON WITH DASIA AND OXIA
1F50..1F57 ; 1.1 # [8] GREEK SMALL LETTER UPSILON WITH PSILI..GREEK SMALL LETTER UPSILON WITH DASIA AND PERISPOMENI
1F59 ; 1.1 # GREEK CAPITAL LETTER UPSILON WITH DASIA
1F5B ; 1.1 # GREEK CAPITAL LETTER UPSILON WITH DASIA AND VARIA
1F5D ; 1.1 # GREEK CAPITAL LETTER UPSILON WITH DASIA AND OXIA
1F5F..1F7D ; 1.1 # [31] GREEK CAPITAL LETTER UPSILON WITH DASIA AND PERISPOMENI..GREEK SMALL LETTER OMEGA WITH OXIA
1F80..1FB4 ; 1.1 # [53] GREEK SMALL LETTER ALPHA WITH PSILI AND YPOGEGRAMMENI..GREEK SMALL LETTER ALPHA WITH OXIA AND YPOGEGRAMMENI
1FB6..1FC4 ; 1.1 # [15] GREEK SMALL LETTER ALPHA WITH PERISPOMENI..GREEK SMALL LETTER ETA WITH OXIA AND YPOGEGRAMMENI
1FC6..1FD3 ; 1.1 # [14] GREEK SMALL LETTER ETA WITH PERISPOMENI..GREEK SMALL LETTER IOTA WITH DIALYTIKA AND OXIA
1FD6..1FDB ; 1.1 # [6] GREEK SMALL LETTER IOTA WITH PERISPOMENI..GREEK CAPITAL LETTER IOTA WITH OXIA
1FDD..1FEF ; 1.1 # [19] GREEK DASIA AND VARIA..GREEK VARIA
1FF2..1FF4 ; 1.1 # [3] GREEK SMALL LETTER OMEGA WITH VARIA AND YPOGEGRAMMENI..GREEK SMALL LETTER OMEGA WITH OXIA AND YPOGEGRAMMENI
1FF6..1FFE ; 1.1 # [9] GREEK SMALL LETTER OMEGA WITH PERISPOMENI..GREEK DASIA
2000..200A ; 1.1 # [11] EN QUAD..HAIR SPACE
200B..200F ; 1.1 # [5] ZERO WIDTH SPACE..RIGHT-TO-LEFT MARK
2010..2027 ; 1.1 # [24] HYPHEN..HYPHENATION POINT
2028..202E ; 1.1 # [7] LINE SEPARATOR..RIGHT-TO-LEFT OVERRIDE
2030..2046 ; 1.1 # [23] PER MILLE SIGN..RIGHT SQUARE BRACKET WITH QUILL
206A..206F ; 1.1 # [6] INHIBIT SYMMETRIC SWAPPING..NOMINAL DIGIT SHAPES
2070 ; 1.1 # SUPERSCRIPT ZERO
2074..208E ; 1.1 # [27] SUPERSCRIPT FOUR..SUBSCRIPT RIGHT PARENTHESIS
20A0..20AA ; 1.1 # [11] EURO-CURRENCY SIGN..NEW SHEQEL SIGN
20D0..20E1 ; 1.1 # [18] COMBINING LEFT HARPOON ABOVE..COMBINING LEFT RIGHT ARROW ABOVE
2100..2138 ; 1.1 # [57] ACCOUNT OF..DALET SYMBOL
2153..2182 ; 1.1 # [48] VULGAR FRACTION ONE THIRD..ROMAN NUMERAL TEN THOUSAND
2190..21EA ; 1.1 # [91] LEFTWARDS ARROW..UPWARDS WHITE ARROW FROM BAR
2200..22F1 ; 1.1 # [242] FOR ALL..DOWN RIGHT DIAGONAL ELLIPSIS
2300 ; 1.1 # DIAMETER SIGN
2302..237A ; 1.1 # [121] HOUSE..APL FUNCTIONAL SYMBOL ALPHA
2400..2424 ; 1.1 # [37] SYMBOL FOR NULL..SYMBOL FOR NEWLINE
2440..244A ; 1.1 # [11] OCR HOOK..OCR DOUBLE BACKSLASH
2460..24EA ; 1.1 # [139] CIRCLED DIGIT ONE..CIRCLED DIGIT ZERO
2500..2595 ; 1.1 # [150] BOX DRAWINGS LIGHT HORIZONTAL..RIGHT ONE EIGHTH BLOCK
25A0..25EF ; 1.1 # [80] BLACK SQUARE..LARGE CIRCLE
2600..2613 ; 1.1 # [20] BLACK SUN WITH RAYS..SALTIRE
261A..266F ; 1.1 # [86] BLACK LEFT POINTING INDEX..MUSIC SHARP SIGN
2701..2704 ; 1.1 # [4] UPPER BLADE SCISSORS..WHITE SCISSORS
2706..2709 ; 1.1 # [4] TELEPHONE LOCATION SIGN..ENVELOPE
270C..2727 ; 1.1 # [28] VICTORY HAND..WHITE FOUR POINTED STAR
2729..274B ; 1.1 # [35] STRESS OUTLINED WHITE STAR..HEAVY EIGHT TEARDROP-SPOKED PROPELLER ASTERISK
274D ; 1.1 # SHADOWED WHITE CIRCLE
274F..2752 ; 1.1 # [4] LOWER RIGHT DROP-SHADOWED WHITE SQUARE..UPPER RIGHT SHADOWED WHITE SQUARE
2756 ; 1.1 # BLACK DIAMOND MINUS WHITE X
2758..275E ; 1.1 # [7] LIGHT VERTICAL BAR..HEAVY DOUBLE COMMA QUOTATION MARK ORNAMENT
2761..2767 ; 1.1 # [7] CURVED STEM PARAGRAPH SIGN ORNAMENT..ROTATED FLORAL HEART BULLET
2776..2794 ; 1.1 # [31] DINGBAT NEGATIVE CIRCLED DIGIT ONE..HEAVY WIDE-HEADED RIGHTWARDS ARROW
2798..27AF ; 1.1 # [24] HEAVY SOUTH EAST ARROW..NOTCHED LOWER RIGHT-SHADOWED WHITE RIGHTWARDS ARROW
27B1..27BE ; 1.1 # [14] NOTCHED UPPER RIGHT-SHADOWED WHITE RIGHTWARDS ARROW..OPEN-OUTLINED RIGHTWARDS ARROW
3000..3037 ; 1.1 # [56] IDEOGRAPHIC SPACE..IDEOGRAPHIC TELEGRAPH LINE FEED SEPARATOR SYMBOL
303F ; 1.1 # IDEOGRAPHIC HALF FILL SPACE
3041..3094 ; 1.1 # [84] HIRAGANA LETTER SMALL A..HIRAGANA LETTER VU
3099..309E ; 1.1 # [6] COMBINING KATAKANA-HIRAGANA VOICED SOUND MARK..HIRAGANA VOICED ITERATION MARK
30A1..30FE ; 1.1 # [94] KATAKANA LETTER SMALL A..KATAKANA VOICED ITERATION MARK
3105..312C ; 1.1 # [40] BOPOMOFO LETTER B..BOPOMOFO LETTER GN
3131..318E ; 1.1 # [94] HANGUL LETTER KIYEOK..HANGUL LETTER ARAEAE
3190..319F ; 1.1 # [16] IDEOGRAPHIC ANNOTATION LINKING MARK..IDEOGRAPHIC ANNOTATION MAN MARK
3200..321C ; 1.1 # [29] PARENTHESIZED HANGUL KIYEOK..PARENTHESIZED HANGUL CIEUC U
3220..3243 ; 1.1 # [36] PARENTHESIZED IDEOGRAPH ONE..PARENTHESIZED IDEOGRAPH REACH
3260..327B ; 1.1 # [28] CIRCLED HANGUL KIYEOK..CIRCLED HANGUL HIEUH A
327F..32B0 ; 1.1 # [50] KOREAN STANDARD SYMBOL..CIRCLED IDEOGRAPH NIGHT
32C0..32CB ; 1.1 # [12] IDEOGRAPHIC TELEGRAPH SYMBOL FOR JANUARY..IDEOGRAPHIC TELEGRAPH SYMBOL FOR DECEMBER
32D0..32FE ; 1.1 # [47] CIRCLED KATAKANA A..CIRCLED KATAKANA WO
3300..3376 ; 1.1 # [119] SQUARE APAATO..SQUARE PC
337B..33DD ; 1.1 # [99] SQUARE ERA NAME HEISEI..SQUARE WB
33E0..33FE ; 1.1 # [31] IDEOGRAPHIC TELEGRAPH SYMBOL FOR DAY ONE..IDEOGRAPHIC TELEGRAPH SYMBOL FOR DAY THIRTY-ONE
4E00..9FA5 ; 1.1 # [20902] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FA5
E000..F8FF ; 1.1 # [6400] <private-use-E000>..<private-use-F8FF>
F900..FA2D ; 1.1 # [302] CJK COMPATIBILITY IDEOGRAPH-F900..CJK COMPATIBILITY IDEOGRAPH-FA2D
FB00..FB06 ; 1.1 # [7] LATIN SMALL LIGATURE FF..LATIN SMALL LIGATURE ST
FB13..FB17 ; 1.1 # [5] ARMENIAN SMALL LIGATURE MEN NOW..ARMENIAN SMALL LIGATURE MEN XEH
FB1E..FB36 ; 1.1 # [25] HEBREW POINT JUDEO-SPANISH VARIKA..HEBREW LETTER ZAYIN WITH DAGESH
FB38..FB3C ; 1.1 # [5] HEBREW LETTER TET WITH DAGESH..HEBREW LETTER LAMED WITH DAGESH
FB3E ; 1.1 # HEBREW LETTER MEM WITH DAGESH
FB40..FB41 ; 1.1 # [2] HEBREW LETTER NUN WITH DAGESH..HEBREW LETTER SAMEKH WITH DAGESH
FB43..FB44 ; 1.1 # [2] HEBREW LETTER FINAL PE WITH DAGESH..HEBREW LETTER PE WITH DAGESH
FB46..FBB1 ; 1.1 # [108] HEBREW LETTER TSADI WITH DAGESH..ARABIC LETTER YEH BARREE WITH HAMZA ABOVE FINAL FORM
FBD3..FD3F ; 1.1 # [365] ARABIC LETTER NG ISOLATED FORM..ORNATE RIGHT PARENTHESIS
FD50..FD8F ; 1.1 # [64] ARABIC LIGATURE TEH WITH JEEM WITH MEEM INITIAL FORM..ARABIC LIGATURE MEEM WITH KHAH WITH MEEM INITIAL FORM
FD92..FDC7 ; 1.1 # [54] ARABIC LIGATURE MEEM WITH JEEM WITH KHAH INITIAL FORM..ARABIC LIGATURE NOON WITH JEEM WITH YEH FINAL FORM
FDF0..FDFB ; 1.1 # [12] ARABIC LIGATURE SALLA USED AS KORANIC STOP SIGN ISOLATED FORM..ARABIC LIGATURE JALLAJALALOUHOU
FE20..FE23 ; 1.1 # [4] COMBINING LIGATURE LEFT HALF..COMBINING DOUBLE TILDE RIGHT HALF
FE30..FE44 ; 1.1 # [21] PRESENTATION FORM FOR VERTICAL TWO DOT LEADER..PRESENTATION FORM FOR VERTICAL RIGHT WHITE CORNER BRACKET
FE49..FE52 ; 1.1 # [10] DASHED OVERLINE..SMALL FULL STOP
FE54..FE66 ; 1.1 # [19] SMALL SEMICOLON..SMALL EQUALS SIGN
FE68..FE6B ; 1.1 # [4] SMALL REVERSE SOLIDUS..SMALL COMMERCIAL AT
FE70..FE72 ; 1.1 # [3] ARABIC FATHATAN ISOLATED FORM..ARABIC DAMMATAN ISOLATED FORM
FE74 ; 1.1 # ARABIC KASRATAN ISOLATED FORM
FE76..FEFC ; 1.1 # [135] ARABIC FATHA ISOLATED FORM..ARABIC LIGATURE LAM WITH ALEF FINAL FORM
FEFF ; 1.1 # ZERO WIDTH NO-BREAK SPACE
FF01..FF5E ; 1.1 # [94] FULLWIDTH EXCLAMATION MARK..FULLWIDTH TILDE
FF61..FFBE ; 1.1 # [94] HALFWIDTH IDEOGRAPHIC FULL STOP..HALFWIDTH HANGUL LETTER HIEUH
FFC2..FFC7 ; 1.1 # [6] HALFWIDTH HANGUL LETTER A..HALFWIDTH HANGUL LETTER E
FFCA..FFCF ; 1.1 # [6] HALFWIDTH HANGUL LETTER YEO..HALFWIDTH HANGUL LETTER OE
FFD2..FFD7 ; 1.1 # [6] HALFWIDTH HANGUL LETTER YO..HALFWIDTH HANGUL LETTER YU
FFDA..FFDC ; 1.1 # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I
FFE0..FFE6 ; 1.1 # [7] FULLWIDTH CENT SIGN..FULLWIDTH WON SIGN
FFE8..FFEE ; 1.1 # [7] HALFWIDTH FORMS LIGHT VERTICAL..HALFWIDTH WHITE CIRCLE
FFFD ; 1.1 # REPLACEMENT CHARACTER
FFFE..FFFF ; 1.1 # [2] <noncharacter-FFFE>..<noncharacter-FFFF>
# Total code points: 33979
# ================================================
# Newly assigned in Unicode 2.0.0 (July, 1996)
0591..05A1 ; 2.0 # [17] HEBREW ACCENT ETNAHTA..HEBREW ACCENT PAZER
05A3..05AF ; 2.0 # [13] HEBREW ACCENT MUNAH..HEBREW MARK MASORA CIRCLE
05C4 ; 2.0 # HEBREW MARK UPPER DOT
0F00..0F47 ; 2.0 # [72] TIBETAN SYLLABLE OM..TIBETAN LETTER JA
0F49..0F69 ; 2.0 # [33] TIBETAN LETTER NYA..TIBETAN LETTER KSSA
0F71..0F8B ; 2.0 # [27] TIBETAN VOWEL SIGN AA..TIBETAN SIGN GRU MED RGYINGS
0F90..0F95 ; 2.0 # [6] TIBETAN SUBJOINED LETTER KA..TIBETAN SUBJOINED LETTER CA
0F97 ; 2.0 # TIBETAN SUBJOINED LETTER JA
0F99..0FAD ; 2.0 # [21] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER WA
0FB1..0FB7 ; 2.0 # [7] TIBETAN SUBJOINED LETTER YA..TIBETAN SUBJOINED LETTER HA
0FB9 ; 2.0 # TIBETAN SUBJOINED LETTER KSSA
1E9B ; 2.0 # LATIN SMALL LETTER LONG S WITH DOT ABOVE
20AB ; 2.0 # DONG SIGN
AC00..D7A3 ; 2.0 # [11172] HANGUL SYLLABLE GA..HANGUL SYLLABLE HIH
D800..DFFF ; 2.0 # [2048] <surrogate-D800>..<surrogate-DFFF>
1FFFE..1FFFF ; 2.0 # [2] <noncharacter-1FFFE>..<noncharacter-1FFFF>
2FFFE..2FFFF ; 2.0 # [2] <noncharacter-2FFFE>..<noncharacter-2FFFF>
3FFFE..3FFFF ; 2.0 # [2] <noncharacter-3FFFE>..<noncharacter-3FFFF>
4FFFE..4FFFF ; 2.0 # [2] <noncharacter-4FFFE>..<noncharacter-4FFFF>
5FFFE..5FFFF ; 2.0 # [2] <noncharacter-5FFFE>..<noncharacter-5FFFF>
6FFFE..6FFFF ; 2.0 # [2] <noncharacter-6FFFE>..<noncharacter-6FFFF>
7FFFE..7FFFF ; 2.0 # [2] <noncharacter-7FFFE>..<noncharacter-7FFFF>
8FFFE..8FFFF ; 2.0 # [2] <noncharacter-8FFFE>..<noncharacter-8FFFF>
9FFFE..9FFFF ; 2.0 # [2] <noncharacter-9FFFE>..<noncharacter-9FFFF>
AFFFE..AFFFF ; 2.0 # [2] <noncharacter-AFFFE>..<noncharacter-AFFFF>
BFFFE..BFFFF ; 2.0 # [2] <noncharacter-BFFFE>..<noncharacter-BFFFF>
CFFFE..CFFFF ; 2.0 # [2] <noncharacter-CFFFE>..<noncharacter-CFFFF>
DFFFE..DFFFF ; 2.0 # [2] <noncharacter-DFFFE>..<noncharacter-DFFFF>
EFFFE..EFFFF ; 2.0 # [2] <noncharacter-EFFFE>..<noncharacter-EFFFF>
F0000..FFFFD ; 2.0 # [65534] <private-use-F0000>..<private-use-FFFFD>
FFFFE..FFFFF ; 2.0 # [2] <noncharacter-FFFFE>..<noncharacter-FFFFF>
100000..10FFFD; 2.0 # [65534] <private-use-100000>..<private-use-10FFFD>
10FFFE..10FFFF; 2.0 # [2] <noncharacter-10FFFE>..<noncharacter-10FFFF>
# Total code points: 144521
# ================================================
# Newly assigned in Unicode 2.1.2 (May, 1998)
20AC ; 2.1 # EURO SIGN
FFFC ; 2.1 # OBJECT REPLACEMENT CHARACTER
# Total code points: 2
# ================================================
# Newly assigned in Unicode 3.0.0 (September, 1999)
01F6..01F9 ; 3.0 # [4] LATIN CAPITAL LETTER HWAIR..LATIN SMALL LETTER N WITH GRAVE
0218..021F ; 3.0 # [8] LATIN CAPITAL LETTER S WITH COMMA BELOW..LATIN SMALL LETTER H WITH CARON
0222..0233 ; 3.0 # [18] LATIN CAPITAL LETTER OU..LATIN SMALL LETTER Y WITH MACRON
02A9..02AD ; 3.0 # [5] LATIN SMALL LETTER FENG DIGRAPH..LATIN LETTER BIDENTAL PERCUSSIVE
02DF ; 3.0 # MODIFIER LETTER CROSS ACCENT
02EA..02EE ; 3.0 # [5] MODIFIER LETTER YIN DEPARTING TONE MARK..MODIFIER LETTER DOUBLE APOSTROPHE
0346..034E ; 3.0 # [9] COMBINING BRIDGE ABOVE..COMBINING UPWARDS ARROW BELOW
0362 ; 3.0 # COMBINING DOUBLE RIGHTWARDS ARROW BELOW
03D7 ; 3.0 # GREEK KAI SYMBOL
03DB ; 3.0 # GREEK SMALL LETTER STIGMA
03DD ; 3.0 # GREEK SMALL LETTER DIGAMMA
03DF ; 3.0 # GREEK SMALL LETTER KOPPA
03E1 ; 3.0 # GREEK SMALL LETTER SAMPI
0400 ; 3.0 # CYRILLIC CAPITAL LETTER IE WITH GRAVE
040D ; 3.0 # CYRILLIC CAPITAL LETTER I WITH GRAVE
0450 ; 3.0 # CYRILLIC SMALL LETTER IE WITH GRAVE
045D ; 3.0 # CYRILLIC SMALL LETTER I WITH GRAVE
0488..0489 ; 3.0 # [2] COMBINING CYRILLIC HUNDRED THOUSANDS SIGN..COMBINING CYRILLIC MILLIONS SIGN
048C..048F ; 3.0 # [4] CYRILLIC CAPITAL LETTER SEMISOFT SIGN..CYRILLIC SMALL LETTER ER WITH TICK
04EC..04ED ; 3.0 # [2] CYRILLIC CAPITAL LETTER E WITH DIAERESIS..CYRILLIC SMALL LETTER E WITH DIAERESIS
058A ; 3.0 # ARMENIAN HYPHEN
0653..0655 ; 3.0 # [3] ARABIC MADDAH ABOVE..ARABIC HAMZA BELOW
06B8..06B9 ; 3.0 # [2] ARABIC LETTER LAM WITH THREE DOTS BELOW..ARABIC LETTER NOON WITH DOT BELOW
06BF ; 3.0 # ARABIC LETTER TCHEH WITH DOT ABOVE
06CF ; 3.0 # ARABIC LETTER WAW WITH DOT ABOVE
06FA..06FE ; 3.0 # [5] ARABIC LETTER SHEEN WITH DOT BELOW..ARABIC SIGN SINDHI POSTPOSITION MEN
0700..070D ; 3.0 # [14] SYRIAC END OF PARAGRAPH..SYRIAC HARKLEAN ASTERISCUS
070F ; 3.0 # SYRIAC ABBREVIATION MARK
0710..072C ; 3.0 # [29] SYRIAC LETTER ALAPH..SYRIAC LETTER TAW
0730..074A ; 3.0 # [27] SYRIAC PTHAHA ABOVE..SYRIAC BARREKH
0780..07B0 ; 3.0 # [49] THAANA LETTER HAA..THAANA SUKUN
0D82..0D83 ; 3.0 # [2] SINHALA SIGN ANUSVARAYA..SINHALA SIGN VISARGAYA
0D85..0D96 ; 3.0 # [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA
0D9A..0DB1 ; 3.0 # [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA
0DB3..0DBB ; 3.0 # [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA
0DBD ; 3.0 # SINHALA LETTER DANTAJA LAYANNA
0DC0..0DC6 ; 3.0 # [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA
0DCA ; 3.0 # SINHALA SIGN AL-LAKUNA
0DCF..0DD4 ; 3.0 # [6] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA
0DD6 ; 3.0 # SINHALA VOWEL SIGN DIGA PAA-PILLA
0DD8..0DDF ; 3.0 # [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA
0DF2..0DF4 ; 3.0 # [3] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA PUNCTUATION KUNDDALIYA
0F6A ; 3.0 # TIBETAN LETTER FIXED-FORM RA
0F96 ; 3.0 # TIBETAN SUBJOINED LETTER CHA
0FAE..0FB0 ; 3.0 # [3] TIBETAN SUBJOINED LETTER ZHA..TIBETAN SUBJOINED LETTER -A
0FB8 ; 3.0 # TIBETAN SUBJOINED LETTER A
0FBA..0FBC ; 3.0 # [3] TIBETAN SUBJOINED LETTER FIXED-FORM WA..TIBETAN SUBJOINED LETTER FIXED-FORM RA
0FBE..0FCC ; 3.0 # [15] TIBETAN KU RU KHA..TIBETAN SYMBOL NOR BU BZHI -KHYIL
0FCF ; 3.0 # TIBETAN SIGN RDEL NAG GSUM
1000..1021 ; 3.0 # [34] MYANMAR LETTER KA..MYANMAR LETTER A
1023..1027 ; 3.0 # [5] MYANMAR LETTER I..MYANMAR LETTER E
1029..102A ; 3.0 # [2] MYANMAR LETTER O..MYANMAR LETTER AU
102C..1032 ; 3.0 # [7] MYANMAR VOWEL SIGN AA..MYANMAR VOWEL SIGN AI
1036..1039 ; 3.0 # [4] MYANMAR SIGN ANUSVARA..MYANMAR SIGN VIRAMA
1040..1059 ; 3.0 # [26] MYANMAR DIGIT ZERO..MYANMAR VOWEL SIGN VOCALIC LL
1200..1206 ; 3.0 # [7] ETHIOPIC SYLLABLE HA..ETHIOPIC SYLLABLE HO
1208..1246 ; 3.0 # [63] ETHIOPIC SYLLABLE LA..ETHIOPIC SYLLABLE QO
1248 ; 3.0 # ETHIOPIC SYLLABLE QWA
124A..124D ; 3.0 # [4] ETHIOPIC SYLLABLE QWI..ETHIOPIC SYLLABLE QWE
1250..1256 ; 3.0 # [7] ETHIOPIC SYLLABLE QHA..ETHIOPIC SYLLABLE QHO
1258 ; 3.0 # ETHIOPIC SYLLABLE QHWA
125A..125D ; 3.0 # [4] ETHIOPIC SYLLABLE QHWI..ETHIOPIC SYLLABLE QHWE
1260..1286 ; 3.0 # [39] ETHIOPIC SYLLABLE BA..ETHIOPIC SYLLABLE XO
1288 ; 3.0 # ETHIOPIC SYLLABLE XWA
128A..128D ; 3.0 # [4] ETHIOPIC SYLLABLE XWI..ETHIOPIC SYLLABLE XWE
1290..12AE ; 3.0 # [31] ETHIOPIC SYLLABLE NA..ETHIOPIC SYLLABLE KO
12B0 ; 3.0 # ETHIOPIC SYLLABLE KWA
12B2..12B5 ; 3.0 # [4] ETHIOPIC SYLLABLE KWI..ETHIOPIC SYLLABLE KWE
12B8..12BE ; 3.0 # [7] ETHIOPIC SYLLABLE KXA..ETHIOPIC SYLLABLE KXO
12C0 ; 3.0 # ETHIOPIC SYLLABLE KXWA
12C2..12C5 ; 3.0 # [4] ETHIOPIC SYLLABLE KXWI..ETHIOPIC SYLLABLE KXWE
12C8..12CE ; 3.0 # [7] ETHIOPIC SYLLABLE WA..ETHIOPIC SYLLABLE WO
12D0..12D6 ; 3.0 # [7] ETHIOPIC SYLLABLE PHARYNGEAL A..ETHIOPIC SYLLABLE PHARYNGEAL O
12D8..12EE ; 3.0 # [23] ETHIOPIC SYLLABLE ZA..ETHIOPIC SYLLABLE YO
12F0..130E ; 3.0 # [31] ETHIOPIC SYLLABLE DA..ETHIOPIC SYLLABLE GO
1310 ; 3.0 # ETHIOPIC SYLLABLE GWA
1312..1315 ; 3.0 # [4] ETHIOPIC SYLLABLE GWI..ETHIOPIC SYLLABLE GWE
1318..131E ; 3.0 # [7] ETHIOPIC SYLLABLE GGA..ETHIOPIC SYLLABLE GGO
1320..1346 ; 3.0 # [39] ETHIOPIC SYLLABLE THA..ETHIOPIC SYLLABLE TZO
1348..135A ; 3.0 # [19] ETHIOPIC SYLLABLE FA..ETHIOPIC SYLLABLE FYA
1361..137C ; 3.0 # [28] ETHIOPIC WORDSPACE..ETHIOPIC NUMBER TEN THOUSAND
13A0..13F4 ; 3.0 # [85] CHEROKEE LETTER A..CHEROKEE LETTER YV
1401..1676 ; 3.0 # [630] CANADIAN SYLLABICS E..CANADIAN SYLLABICS NNGAA
1680..169C ; 3.0 # [29] OGHAM SPACE MARK..OGHAM REVERSED FEATHER MARK
16A0..16F0 ; 3.0 # [81] RUNIC LETTER FEHU FEOH FE F..RUNIC BELGTHOR SYMBOL
1780..17B3 ; 3.0 # [52] KHMER LETTER KA..KHMER INDEPENDENT VOWEL QAU
17B4..17B5 ; 3.0 # [2] KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA
17B6..17DC ; 3.0 # [39] KHMER VOWEL SIGN AA..KHMER SIGN AVAKRAHASANYA
17E0..17E9 ; 3.0 # [10] KHMER DIGIT ZERO..KHMER DIGIT NINE
1800..180E ; 3.0 # [15] MONGOLIAN BIRGA..MONGOLIAN VOWEL SEPARATOR
1810..1819 ; 3.0 # [10] MONGOLIAN DIGIT ZERO..MONGOLIAN DIGIT NINE
1820..1877 ; 3.0 # [88] MONGOLIAN LETTER A..MONGOLIAN LETTER MANCHU ZHA
1880..18A9 ; 3.0 # [42] MONGOLIAN LETTER ALI GALI ANUSVARA ONE..MONGOLIAN LETTER ALI GALI DAGALGA
202F ; 3.0 # NARROW NO-BREAK SPACE
2048..204D ; 3.0 # [6] QUESTION EXCLAMATION MARK..BLACK RIGHTWARDS BULLET
20AD..20AF ; 3.0 # [3] KIP SIGN..DRACHMA SIGN
20E2..20E3 ; 3.0 # [2] COMBINING ENCLOSING SCREEN..COMBINING ENCLOSING KEYCAP
2139..213A ; 3.0 # [2] INFORMATION SOURCE..ROTATED CAPITAL Q
2183 ; 3.0 # ROMAN NUMERAL REVERSED ONE HUNDRED
21EB..21F3 ; 3.0 # [9] UPWARDS WHITE ARROW ON PEDESTAL..UP DOWN WHITE ARROW
2301 ; 3.0 # ELECTRIC ARROW
237B ; 3.0 # NOT CHECK MARK
237D..239A ; 3.0 # [30] SHOULDERED OPEN BOX..CLEAR SCREEN SYMBOL
2425..2426 ; 3.0 # [2] SYMBOL FOR DELETE FORM TWO..SYMBOL FOR SUBSTITUTE FORM TWO
25F0..25F7 ; 3.0 # [8] WHITE SQUARE WITH UPPER LEFT QUADRANT..WHITE CIRCLE WITH UPPER RIGHT QUADRANT
2619 ; 3.0 # REVERSED ROTATED FLORAL HEART BULLET
2670..2671 ; 3.0 # [2] WEST SYRIAC CROSS..EAST SYRIAC CROSS
2800..28FF ; 3.0 # [256] BRAILLE PATTERN BLANK..BRAILLE PATTERN DOTS-12345678
2E80..2E99 ; 3.0 # [26] CJK RADICAL REPEAT..CJK RADICAL RAP
2E9B..2EF3 ; 3.0 # [89] CJK RADICAL CHOKE..CJK RADICAL C-SIMPLIFIED TURTLE
2F00..2FD5 ; 3.0 # [214] KANGXI RADICAL ONE..KANGXI RADICAL FLUTE
2FF0..2FFB ; 3.0 # [12] IDEOGRAPHIC DESCRIPTION CHARACTER LEFT TO RIGHT..IDEOGRAPHIC DESCRIPTION CHARACTER OVERLAID
3038..303A ; 3.0 # [3] HANGZHOU NUMERAL TEN..HANGZHOU NUMERAL THIRTY
303E ; 3.0 # IDEOGRAPHIC VARIATION INDICATOR
31A0..31B7 ; 3.0 # [24] BOPOMOFO LETTER BU..BOPOMOFO FINAL LETTER H
3400..4DB5 ; 3.0 # [6582] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DB5
A000..A48C ; 3.0 # [1165] YI SYLLABLE IT..YI SYLLABLE YYR
A490..A4A1 ; 3.0 # [18] YI RADICAL QOT..YI RADICAL GA
A4A4..A4B3 ; 3.0 # [16] YI RADICAL DDUR..YI RADICAL JO
A4B5..A4C0 ; 3.0 # [12] YI RADICAL JJY..YI RADICAL SHAT
A4C2..A4C4 ; 3.0 # [3] YI RADICAL SHOP..YI RADICAL ZZIET
A4C6 ; 3.0 # YI RADICAL KE
FB1D ; 3.0 # HEBREW LETTER YOD WITH HIRIQ
FFF9..FFFB ; 3.0 # [3] INTERLINEAR ANNOTATION ANCHOR..INTERLINEAR ANNOTATION TERMINATOR
# Total code points: 10307
# ================================================
# Newly assigned in Unicode 3.1.0 (March, 2001)
03F4..03F5 ; 3.1 # [2] GREEK CAPITAL THETA SYMBOL..GREEK LUNATE EPSILON SYMBOL
FDD0..FDEF ; 3.1 # [32] <noncharacter-FDD0>..<noncharacter-FDEF>
10300..1031E ; 3.1 # [31] OLD ITALIC LETTER A..OLD ITALIC LETTER UU
10320..10323 ; 3.1 # [4] OLD ITALIC NUMERAL ONE..OLD ITALIC NUMERAL FIFTY
10330..1034A ; 3.1 # [27] GOTHIC LETTER AHSA..GOTHIC LETTER NINE HUNDRED
10400..10425 ; 3.1 # [38] DESERET CAPITAL LETTER LONG I..DESERET CAPITAL LETTER ENG
10428..1044D ; 3.1 # [38] DESERET SMALL LETTER LONG I..DESERET SMALL LETTER ENG
1D000..1D0F5 ; 3.1 # [246] BYZANTINE MUSICAL SYMBOL PSILI..BYZANTINE MUSICAL SYMBOL GORGON NEO KATO
1D100..1D126 ; 3.1 # [39] MUSICAL SYMBOL SINGLE BARLINE..MUSICAL SYMBOL DRUM CLEF-2
1D12A..1D172 ; 3.1 # [73] MUSICAL SYMBOL DOUBLE SHARP..MUSICAL SYMBOL COMBINING FLAG-5
1D173..1D17A ; 3.1 # [8] MUSICAL SYMBOL BEGIN BEAM..MUSICAL SYMBOL END PHRASE
1D17B..1D1DD ; 3.1 # [99] MUSICAL SYMBOL COMBINING ACCENT..MUSICAL SYMBOL PES SUBPUNCTIS
1D400..1D454 ; 3.1 # [85] MATHEMATICAL BOLD CAPITAL A..MATHEMATICAL ITALIC SMALL G
1D456..1D49C ; 3.1 # [71] MATHEMATICAL ITALIC SMALL I..MATHEMATICAL SCRIPT CAPITAL A
1D49E..1D49F ; 3.1 # [2] MATHEMATICAL SCRIPT CAPITAL C..MATHEMATICAL SCRIPT CAPITAL D
1D4A2 ; 3.1 # MATHEMATICAL SCRIPT CAPITAL G
1D4A5..1D4A6 ; 3.1 # [2] MATHEMATICAL SCRIPT CAPITAL J..MATHEMATICAL SCRIPT CAPITAL K
1D4A9..1D4AC ; 3.1 # [4] MATHEMATICAL SCRIPT CAPITAL N..MATHEMATICAL SCRIPT CAPITAL Q
1D4AE..1D4B9 ; 3.1 # [12] MATHEMATICAL SCRIPT CAPITAL S..MATHEMATICAL SCRIPT SMALL D
1D4BB ; 3.1 # MATHEMATICAL SCRIPT SMALL F
1D4BD..1D4C0 ; 3.1 # [4] MATHEMATICAL SCRIPT SMALL H..MATHEMATICAL SCRIPT SMALL K
1D4C2..1D4C3 ; 3.1 # [2] MATHEMATICAL SCRIPT SMALL M..MATHEMATICAL SCRIPT SMALL N
1D4C5..1D505 ; 3.1 # [65] MATHEMATICAL SCRIPT SMALL P..MATHEMATICAL FRAKTUR CAPITAL B
1D507..1D50A ; 3.1 # [4] MATHEMATICAL FRAKTUR CAPITAL D..MATHEMATICAL FRAKTUR CAPITAL G
1D50D..1D514 ; 3.1 # [8] MATHEMATICAL FRAKTUR CAPITAL J..MATHEMATICAL FRAKTUR CAPITAL Q
1D516..1D51C ; 3.1 # [7] MATHEMATICAL FRAKTUR CAPITAL S..MATHEMATICAL FRAKTUR CAPITAL Y
1D51E..1D539 ; 3.1 # [28] MATHEMATICAL FRAKTUR SMALL A..MATHEMATICAL DOUBLE-STRUCK CAPITAL B
1D53B..1D53E ; 3.1 # [4] MATHEMATICAL DOUBLE-STRUCK CAPITAL D..MATHEMATICAL DOUBLE-STRUCK CAPITAL G
1D540..1D544 ; 3.1 # [5] MATHEMATICAL DOUBLE-STRUCK CAPITAL I..MATHEMATICAL DOUBLE-STRUCK CAPITAL M
1D546 ; 3.1 # MATHEMATICAL DOUBLE-STRUCK CAPITAL O
1D54A..1D550 ; 3.1 # [7] MATHEMATICAL DOUBLE-STRUCK CAPITAL S..MATHEMATICAL DOUBLE-STRUCK CAPITAL Y
1D552..1D6A3 ; 3.1 # [338] MATHEMATICAL DOUBLE-STRUCK SMALL A..MATHEMATICAL MONOSPACE SMALL Z
1D6A8..1D7C9 ; 3.1 # [290] MATHEMATICAL BOLD CAPITAL ALPHA..MATHEMATICAL SANS-SERIF BOLD ITALIC PI SYMBOL
1D7CE..1D7FF ; 3.1 # [50] MATHEMATICAL BOLD DIGIT ZERO..MATHEMATICAL MONOSPACE DIGIT NINE
20000..2A6D6 ; 3.1 # [42711] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6D6
2F800..2FA1D ; 3.1 # [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D
E0001 ; 3.1 # LANGUAGE TAG
E0020..E007F ; 3.1 # [96] TAG SPACE..CANCEL TAG
# Total code points: 44978
# ================================================
# Newly assigned in Unicode 3.2.0 (March, 2002)
0220 ; 3.2 # LATIN CAPITAL LETTER N WITH LONG RIGHT LEG
034F ; 3.2 # COMBINING GRAPHEME JOINER
0363..036F ; 3.2 # [13] COMBINING LATIN SMALL LETTER A..COMBINING LATIN SMALL LETTER X
03D8..03D9 ; 3.2 # [2] GREEK LETTER ARCHAIC KOPPA..GREEK SMALL LETTER ARCHAIC KOPPA
03F6 ; 3.2 # GREEK REVERSED LUNATE EPSILON SYMBOL
048A..048B ; 3.2 # [2] CYRILLIC CAPITAL LETTER SHORT I WITH TAIL..CYRILLIC SMALL LETTER SHORT I WITH TAIL
04C5..04C6 ; 3.2 # [2] CYRILLIC CAPITAL LETTER EL WITH TAIL..CYRILLIC SMALL LETTER EL WITH TAIL
04C9..04CA ; 3.2 # [2] CYRILLIC CAPITAL LETTER EN WITH TAIL..CYRILLIC SMALL LETTER EN WITH TAIL
04CD..04CE ; 3.2 # [2] CYRILLIC CAPITAL LETTER EM WITH TAIL..CYRILLIC SMALL LETTER EM WITH TAIL
0500..050F ; 3.2 # [16] CYRILLIC CAPITAL LETTER KOMI DE..CYRILLIC SMALL LETTER KOMI TJE
066E..066F ; 3.2 # [2] ARABIC LETTER DOTLESS BEH..ARABIC LETTER DOTLESS QAF
07B1 ; 3.2 # THAANA LETTER NAA
10F7..10F8 ; 3.2 # [2] GEORGIAN LETTER YN..GEORGIAN LETTER ELIFI
1700..170C ; 3.2 # [13] TAGALOG LETTER A..TAGALOG LETTER YA
170E..1714 ; 3.2 # [7] TAGALOG LETTER LA..TAGALOG SIGN VIRAMA
1720..1736 ; 3.2 # [23] HANUNOO LETTER A..PHILIPPINE DOUBLE PUNCTUATION
1740..1753 ; 3.2 # [20] BUHID LETTER A..BUHID VOWEL SIGN U
1760..176C ; 3.2 # [13] TAGBANWA LETTER A..TAGBANWA LETTER YA
176E..1770 ; 3.2 # [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA
1772..1773 ; 3.2 # [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U
2047 ; 3.2 # DOUBLE QUESTION MARK
204E..2052 ; 3.2 # [5] LOW ASTERISK..COMMERCIAL MINUS SIGN
2057 ; 3.2 # QUADRUPLE PRIME
205F ; 3.2 # MEDIUM MATHEMATICAL SPACE
2060..2063 ; 3.2 # [4] WORD JOINER..INVISIBLE SEPARATOR
2071 ; 3.2 # SUPERSCRIPT LATIN SMALL LETTER I
20B0..20B1 ; 3.2 # [2] GERMAN PENNY SIGN..PESO SIGN
20E4..20EA ; 3.2 # [7] COMBINING ENCLOSING UPWARD POINTING TRIANGLE..COMBINING LEFTWARDS ARROW OVERLAY
213D..214B ; 3.2 # [15] DOUBLE-STRUCK SMALL GAMMA..TURNED AMPERSAND
21F4..21FF ; 3.2 # [12] RIGHT ARROW WITH SMALL CIRCLE..LEFT RIGHT OPEN-HEADED ARROW
22F2..22FF ; 3.2 # [14] ELEMENT OF WITH LONG HORIZONTAL STROKE..Z NOTATION BAG MEMBERSHIP
237C ; 3.2 # RIGHT ANGLE WITH DOWNWARDS ZIGZAG ARROW
239B..23CE ; 3.2 # [52] LEFT PARENTHESIS UPPER HOOK..RETURN SYMBOL
24EB..24FE ; 3.2 # [20] NEGATIVE CIRCLED NUMBER ELEVEN..DOUBLE CIRCLED NUMBER TEN
2596..259F ; 3.2 # [10] QUADRANT LOWER LEFT..QUADRANT UPPER RIGHT AND LOWER LEFT AND LOWER RIGHT
25F8..25FF ; 3.2 # [8] UPPER LEFT TRIANGLE..LOWER RIGHT TRIANGLE
2616..2617 ; 3.2 # [2] WHITE SHOGI PIECE..BLACK SHOGI PIECE
2672..267D ; 3.2 # [12] UNIVERSAL RECYCLING SYMBOL..PARTIALLY-RECYCLED PAPER SYMBOL
2680..2689 ; 3.2 # [10] DIE FACE-1..BLACK CIRCLE WITH TWO WHITE DOTS
2768..2775 ; 3.2 # [14] MEDIUM LEFT PARENTHESIS ORNAMENT..MEDIUM RIGHT CURLY BRACKET ORNAMENT
27D0..27EB ; 3.2 # [28] WHITE DIAMOND WITH CENTRED DOT..MATHEMATICAL RIGHT DOUBLE ANGLE BRACKET
27F0..27FF ; 3.2 # [16] UPWARDS QUADRUPLE ARROW..LONG RIGHTWARDS SQUIGGLE ARROW
2900..2AFF ; 3.2 # [512] RIGHTWARDS TWO-HEADED ARROW WITH VERTICAL STROKE..N-ARY WHITE VERTICAL BAR
303B..303D ; 3.2 # [3] VERTICAL IDEOGRAPHIC ITERATION MARK..PART ALTERNATION MARK
3095..3096 ; 3.2 # [2] HIRAGANA LETTER SMALL KA..HIRAGANA LETTER SMALL KE
309F..30A0 ; 3.2 # [2] HIRAGANA DIGRAPH YORI..KATAKANA-HIRAGANA DOUBLE HYPHEN
30FF ; 3.2 # KATAKANA DIGRAPH KOTO
31F0..31FF ; 3.2 # [16] KATAKANA LETTER SMALL KU..KATAKANA LETTER SMALL RO
3251..325F ; 3.2 # [15] CIRCLED NUMBER TWENTY ONE..CIRCLED NUMBER THIRTY FIVE
32B1..32BF ; 3.2 # [15] CIRCLED NUMBER THIRTY SIX..CIRCLED NUMBER FIFTY
A4A2..A4A3 ; 3.2 # [2] YI RADICAL ZUP..YI RADICAL CYT
A4B4 ; 3.2 # YI RADICAL NZUP
A4C1 ; 3.2 # YI RADICAL ZUR
A4C5 ; 3.2 # YI RADICAL NBIE
FA30..FA6A ; 3.2 # [59] CJK COMPATIBILITY IDEOGRAPH-FA30..CJK COMPATIBILITY IDEOGRAPH-FA6A
FDFC ; 3.2 # RIAL SIGN
FE00..FE0F ; 3.2 # [16] VARIATION SELECTOR-1..VARIATION SELECTOR-16
FE45..FE46 ; 3.2 # [2] SESAME DOT..WHITE SESAME DOT
FE73 ; 3.2 # ARABIC TAIL FRAGMENT
FF5F..FF60 ; 3.2 # [2] FULLWIDTH LEFT WHITE PARENTHESIS..FULLWIDTH RIGHT WHITE PARENTHESIS
# Total code points: 1016
# ================================================
# Newly assigned in Unicode 4.0.0 (April, 2003)
0221 ; 4.0 # LATIN SMALL LETTER D WITH CURL
0234..0236 ; 4.0 # [3] LATIN SMALL LETTER L WITH CURL..LATIN SMALL LETTER T WITH CURL
02AE..02AF ; 4.0 # [2] LATIN SMALL LETTER TURNED H WITH FISHHOOK..LATIN SMALL LETTER TURNED H WITH FISHHOOK AND TAIL
02EF..02FF ; 4.0 # [17] MODIFIER LETTER LOW DOWN ARROWHEAD..MODIFIER LETTER LOW LEFT ARROW
0350..0357 ; 4.0 # [8] COMBINING RIGHT ARROWHEAD ABOVE..COMBINING RIGHT HALF RING ABOVE
035D..035F ; 4.0 # [3] COMBINING DOUBLE BREVE..COMBINING DOUBLE MACRON BELOW
03F7..03FB ; 4.0 # [5] GREEK CAPITAL LETTER SHO..GREEK SMALL LETTER SAN
0600..0603 ; 4.0 # [4] ARABIC NUMBER SIGN..ARABIC SIGN SAFHA
060D..0615 ; 4.0 # [9] ARABIC DATE SEPARATOR..ARABIC SMALL HIGH TAH
0656..0658 ; 4.0 # [3] ARABIC SUBSCRIPT ALEF..ARABIC MARK NOON GHUNNA
06EE..06EF ; 4.0 # [2] ARABIC LETTER DAL WITH INVERTED V..ARABIC LETTER REH WITH INVERTED V
06FF ; 4.0 # ARABIC LETTER HEH WITH INVERTED V
072D..072F ; 4.0 # [3] SYRIAC LETTER PERSIAN BHETH..SYRIAC LETTER PERSIAN DHALATH
074D..074F ; 4.0 # [3] SYRIAC LETTER SOGDIAN ZHAIN..SYRIAC LETTER SOGDIAN FE
0904 ; 4.0 # DEVANAGARI LETTER SHORT A
09BD ; 4.0 # BENGALI SIGN AVAGRAHA
0A01 ; 4.0 # GURMUKHI SIGN ADAK BINDI
0A03 ; 4.0 # GURMUKHI SIGN VISARGA
0A8C ; 4.0 # GUJARATI LETTER VOCALIC L
0AE1..0AE3 ; 4.0 # [3] GUJARATI LETTER VOCALIC LL..GUJARATI VOWEL SIGN VOCALIC LL
0AF1 ; 4.0 # GUJARATI RUPEE SIGN
0B35 ; 4.0 # ORIYA LETTER VA
0B71 ; 4.0 # ORIYA LETTER WA
0BF3..0BFA ; 4.0 # [8] TAMIL DAY SIGN..TAMIL NUMBER SIGN
0CBC..0CBD ; 4.0 # [2] KANNADA SIGN NUKTA..KANNADA SIGN AVAGRAHA
17DD ; 4.0 # KHMER SIGN ATTHACAN
17F0..17F9 ; 4.0 # [10] KHMER SYMBOL LEK ATTAK SON..KHMER SYMBOL LEK ATTAK PRAM-BUON
1900..191C ; 4.0 # [29] LIMBU VOWEL-CARRIER LETTER..LIMBU LETTER HA
1920..192B ; 4.0 # [12] LIMBU VOWEL SIGN A..LIMBU SUBJOINED LETTER WA
1930..193B ; 4.0 # [12] LIMBU SMALL LETTER KA..LIMBU SIGN SA-I
1940 ; 4.0 # LIMBU SIGN LOO
1944..196D ; 4.0 # [42] LIMBU EXCLAMATION MARK..TAI LE LETTER AI
1970..1974 ; 4.0 # [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6
19E0..19FF ; 4.0 # [32] KHMER SYMBOL PATHAMASAT..KHMER SYMBOL DAP-PRAM ROC
1D00..1D6B ; 4.0 # [108] LATIN LETTER SMALL CAPITAL A..LATIN SMALL LETTER UE
2053..2054 ; 4.0 # [2] SWUNG DASH..INVERTED UNDERTIE
213B ; 4.0 # FACSIMILE SIGN
23CF..23D0 ; 4.0 # [2] EJECT SYMBOL..VERTICAL LINE EXTENSION
24FF ; 4.0 # NEGATIVE CIRCLED DIGIT ZERO
2614..2615 ; 4.0 # [2] UMBRELLA WITH RAIN DROPS..HOT BEVERAGE
268A..2691 ; 4.0 # [8] MONOGRAM FOR YANG..BLACK FLAG
26A0..26A1 ; 4.0 # [2] WARNING SIGN..HIGH VOLTAGE SIGN
2B00..2B0D ; 4.0 # [14] NORTH EAST WHITE ARROW..UP DOWN BLACK ARROW
321D..321E ; 4.0 # [2] PARENTHESIZED KOREAN CHARACTER OJEON..PARENTHESIZED KOREAN CHARACTER O HU
3250 ; 4.0 # PARTNERSHIP SIGN
327C..327D ; 4.0 # [2] CIRCLED KOREAN CHARACTER CHAMKO..CIRCLED KOREAN CHARACTER JUEUI
32CC..32CF ; 4.0 # [4] SQUARE HG..LIMITED LIABILITY SIGN
3377..337A ; 4.0 # [4] SQUARE DM..SQUARE IU
33DE..33DF ; 4.0 # [2] SQUARE V OVER M..SQUARE A OVER M
33FF ; 4.0 # SQUARE GAL
4DC0..4DFF ; 4.0 # [64] HEXAGRAM FOR THE CREATIVE HEAVEN..HEXAGRAM FOR BEFORE COMPLETION
FDFD ; 4.0 # ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM
FE47..FE48 ; 4.0 # [2] PRESENTATION FORM FOR VERTICAL LEFT SQUARE BRACKET..PRESENTATION FORM FOR VERTICAL RIGHT SQUARE BRACKET
10000..1000B ; 4.0 # [12] LINEAR B SYLLABLE B008 A..LINEAR B SYLLABLE B046 JE
1000D..10026 ; 4.0 # [26] LINEAR B SYLLABLE B036 JO..LINEAR B SYLLABLE B032 QO
10028..1003A ; 4.0 # [19] LINEAR B SYLLABLE B060 RA..LINEAR B SYLLABLE B042 WO
1003C..1003D ; 4.0 # [2] LINEAR B SYLLABLE B017 ZA..LINEAR B SYLLABLE B074 ZE
1003F..1004D ; 4.0 # [15] LINEAR B SYLLABLE B020 ZO..LINEAR B SYLLABLE B091 TWO
10050..1005D ; 4.0 # [14] LINEAR B SYMBOL B018..LINEAR B SYMBOL B089
10080..100FA ; 4.0 # [123] LINEAR B IDEOGRAM B100 MAN..LINEAR B IDEOGRAM VESSEL B305
10100..10102 ; 4.0 # [3] AEGEAN WORD SEPARATOR LINE..AEGEAN CHECK MARK
10107..10133 ; 4.0 # [45] AEGEAN NUMBER ONE..AEGEAN NUMBER NINETY THOUSAND
10137..1013F ; 4.0 # [9] AEGEAN WEIGHT BASE UNIT..AEGEAN MEASURE THIRD SUBUNIT
10380..1039D ; 4.0 # [30] UGARITIC LETTER ALPA..UGARITIC LETTER SSU
1039F ; 4.0 # UGARITIC WORD DIVIDER
10426..10427 ; 4.0 # [2] DESERET CAPITAL LETTER OI..DESERET CAPITAL LETTER EW
1044E..1049D ; 4.0 # [80] DESERET SMALL LETTER OI..OSMANYA LETTER OO
104A0..104A9 ; 4.0 # [10] OSMANYA DIGIT ZERO..OSMANYA DIGIT NINE
10800..10805 ; 4.0 # [6] CYPRIOT SYLLABLE A..CYPRIOT SYLLABLE JA
10808 ; 4.0 # CYPRIOT SYLLABLE JO
1080A..10835 ; 4.0 # [44] CYPRIOT SYLLABLE KA..CYPRIOT SYLLABLE WO
10837..10838 ; 4.0 # [2] CYPRIOT SYLLABLE XA..CYPRIOT SYLLABLE XE
1083C ; 4.0 # CYPRIOT SYLLABLE ZA
1083F ; 4.0 # CYPRIOT SYLLABLE ZO
1D300..1D356 ; 4.0 # [87] MONOGRAM FOR EARTH..TETRAGRAM FOR FOSTERING
1D4C1 ; 4.0 # MATHEMATICAL SCRIPT SMALL L
E0100..E01EF ; 4.0 # [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256
# Total code points: 1226
# ================================================
# Newly assigned in Unicode 4.1.0 (March, 2005)
0237..0241 ; 4.1 # [11] LATIN SMALL LETTER DOTLESS J..LATIN CAPITAL LETTER GLOTTAL STOP
0358..035C ; 4.1 # [5] COMBINING DOT ABOVE RIGHT..COMBINING DOUBLE BREVE BELOW
03FC..03FF ; 4.1 # [4] GREEK RHO WITH STROKE SYMBOL..GREEK CAPITAL REVERSED DOTTED LUNATE SIGMA SYMBOL
04F6..04F7 ; 4.1 # [2] CYRILLIC CAPITAL LETTER GHE WITH DESCENDER..CYRILLIC SMALL LETTER GHE WITH DESCENDER
05A2 ; 4.1 # HEBREW ACCENT ATNAH HAFUKH
05C5..05C7 ; 4.1 # [3] HEBREW MARK LOWER DOT..HEBREW POINT QAMATS QATAN
060B ; 4.1 # AFGHANI SIGN
061E ; 4.1 # ARABIC TRIPLE DOT PUNCTUATION MARK
0659..065E ; 4.1 # [6] ARABIC ZWARAKAY..ARABIC FATHA WITH TWO DOTS
0750..076D ; 4.1 # [30] ARABIC LETTER BEH WITH THREE DOTS HORIZONTALLY BELOW..ARABIC LETTER SEEN WITH TWO DOTS VERTICALLY ABOVE
097D ; 4.1 # DEVANAGARI LETTER GLOTTAL STOP
09CE ; 4.1 # BENGALI LETTER KHANDA TA
0BB6 ; 4.1 # TAMIL LETTER SHA
0BE6 ; 4.1 # TAMIL DIGIT ZERO
0FD0..0FD1 ; 4.1 # [2] TIBETAN MARK BSKA- SHOG GI MGO RGYAN..TIBETAN MARK MNYAM YIG GI MGO RGYAN
10F9..10FA ; 4.1 # [2] GEORGIAN LETTER TURNED GAN..GEORGIAN LETTER AIN
10FC ; 4.1 # MODIFIER LETTER GEORGIAN NAR
1207 ; 4.1 # ETHIOPIC SYLLABLE HOA
1247 ; 4.1 # ETHIOPIC SYLLABLE QOA
1287 ; 4.1 # ETHIOPIC SYLLABLE XOA
12AF ; 4.1 # ETHIOPIC SYLLABLE KOA
12CF ; 4.1 # ETHIOPIC SYLLABLE WOA
12EF ; 4.1 # ETHIOPIC SYLLABLE YOA
130F ; 4.1 # ETHIOPIC SYLLABLE GOA
131F ; 4.1 # ETHIOPIC SYLLABLE GGWAA
1347 ; 4.1 # ETHIOPIC SYLLABLE TZOA
135F..1360 ; 4.1 # [2] ETHIOPIC COMBINING GEMINATION MARK..ETHIOPIC SECTION MARK
1380..1399 ; 4.1 # [26] ETHIOPIC SYLLABLE SEBATBEIT MWA..ETHIOPIC TONAL MARK KURT
1980..19A9 ; 4.1 # [42] NEW TAI LUE LETTER HIGH QA..NEW TAI LUE LETTER LOW XVA
19B0..19C9 ; 4.1 # [26] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE TONE MARK-2
19D0..19D9 ; 4.1 # [10] NEW TAI LUE DIGIT ZERO..NEW TAI LUE DIGIT NINE
19DE..19DF ; 4.1 # [2] NEW TAI LUE SIGN LAE..NEW TAI LUE SIGN LAEV
1A00..1A1B ; 4.1 # [28] BUGINESE LETTER KA..BUGINESE VOWEL SIGN AE
1A1E..1A1F ; 4.1 # [2] BUGINESE PALLAWA..BUGINESE END OF SECTION
1D6C..1DC3 ; 4.1 # [88] LATIN SMALL LETTER B WITH MIDDLE TILDE..COMBINING SUSPENSION MARK
2055..2056 ; 4.1 # [2] FLOWER PUNCTUATION MARK..THREE DOT PUNCTUATION
2058..205E ; 4.1 # [7] FOUR DOT PUNCTUATION..VERTICAL FOUR DOTS
2090..2094 ; 4.1 # [5] LATIN SUBSCRIPT SMALL LETTER A..LATIN SUBSCRIPT SMALL LETTER SCHWA
20B2..20B5 ; 4.1 # [4] GUARANI SIGN..CEDI SIGN
20EB ; 4.1 # COMBINING LONG DOUBLE SOLIDUS OVERLAY
213C ; 4.1 # DOUBLE-STRUCK SMALL PI
214C ; 4.1 # PER SIGN
23D1..23DB ; 4.1 # [11] METRICAL BREVE..FUSE
2618 ; 4.1 # SHAMROCK
267E..267F ; 4.1 # [2] PERMANENT PAPER SIGN..WHEELCHAIR SYMBOL
2692..269C ; 4.1 # [11] HAMMER AND PICK..FLEUR-DE-LIS
26A2..26B1 ; 4.1 # [16] DOUBLED FEMALE SIGN..FUNERAL URN
27C0..27C6 ; 4.1 # [7] THREE DIMENSIONAL ANGLE..RIGHT S-SHAPED BAG DELIMITER
2B0E..2B13 ; 4.1 # [6] RIGHTWARDS ARROW WITH TIP DOWNWARDS..SQUARE WITH BOTTOM HALF BLACK
2C00..2C2E ; 4.1 # [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE
2C30..2C5E ; 4.1 # [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE
2C80..2CEA ; 4.1 # [107] COPTIC CAPITAL LETTER ALFA..COPTIC SYMBOL SHIMA SIMA
2CF9..2D25 ; 4.1 # [45] COPTIC OLD NUBIAN FULL STOP..GEORGIAN SMALL LETTER HOE
2D30..2D65 ; 4.1 # [54] TIFINAGH LETTER YA..TIFINAGH LETTER YAZZ
2D6F ; 4.1 # TIFINAGH MODIFIER LETTER LABIALIZATION MARK
2D80..2D96 ; 4.1 # [23] ETHIOPIC SYLLABLE LOA..ETHIOPIC SYLLABLE GGWE
2DA0..2DA6 ; 4.1 # [7] ETHIOPIC SYLLABLE SSA..ETHIOPIC SYLLABLE SSO
2DA8..2DAE ; 4.1 # [7] ETHIOPIC SYLLABLE CCA..ETHIOPIC SYLLABLE CCO
2DB0..2DB6 ; 4.1 # [7] ETHIOPIC SYLLABLE ZZA..ETHIOPIC SYLLABLE ZZO
2DB8..2DBE ; 4.1 # [7] ETHIOPIC SYLLABLE CCHA..ETHIOPIC SYLLABLE CCHO
2DC0..2DC6 ; 4.1 # [7] ETHIOPIC SYLLABLE QYA..ETHIOPIC SYLLABLE QYO
2DC8..2DCE ; 4.1 # [7] ETHIOPIC SYLLABLE KYA..ETHIOPIC SYLLABLE KYO
2DD0..2DD6 ; 4.1 # [7] ETHIOPIC SYLLABLE XYA..ETHIOPIC SYLLABLE XYO
2DD8..2DDE ; 4.1 # [7] ETHIOPIC SYLLABLE GYA..ETHIOPIC SYLLABLE GYO
2E00..2E17 ; 4.1 # [24] RIGHT ANGLE SUBSTITUTION MARKER..DOUBLE OBLIQUE HYPHEN
2E1C..2E1D ; 4.1 # [2] LEFT LOW PARAPHRASE BRACKET..RIGHT LOW PARAPHRASE BRACKET
31C0..31CF ; 4.1 # [16] CJK STROKE T..CJK STROKE N
327E ; 4.1 # CIRCLED HANGUL IEUNG U
9FA6..9FBB ; 4.1 # [22] CJK UNIFIED IDEOGRAPH-9FA6..CJK UNIFIED IDEOGRAPH-9FBB
A700..A716 ; 4.1 # [23] MODIFIER LETTER CHINESE TONE YIN PING..MODIFIER LETTER EXTRA-LOW LEFT-STEM TONE BAR
A800..A82B ; 4.1 # [44] SYLOTI NAGRI LETTER A..SYLOTI NAGRI POETRY MARK-4
FA70..FAD9 ; 4.1 # [106] CJK COMPATIBILITY IDEOGRAPH-FA70..CJK COMPATIBILITY IDEOGRAPH-FAD9
FE10..FE19 ; 4.1 # [10] PRESENTATION FORM FOR VERTICAL COMMA..PRESENTATION FORM FOR VERTICAL HORIZONTAL ELLIPSIS
10140..1018A ; 4.1 # [75] GREEK ACROPHONIC ATTIC ONE QUARTER..GREEK ZERO SIGN
103A0..103C3 ; 4.1 # [36] OLD PERSIAN SIGN A..OLD PERSIAN SIGN HA
103C8..103D5 ; 4.1 # [14] OLD PERSIAN SIGN AURAMAZDAA..OLD PERSIAN NUMBER HUNDRED
10A00..10A03 ; 4.1 # [4] KHAROSHTHI LETTER A..KHAROSHTHI VOWEL SIGN VOCALIC R
10A05..10A06 ; 4.1 # [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O
10A0C..10A13 ; 4.1 # [8] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI LETTER GHA
10A15..10A17 ; 4.1 # [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA
10A19..10A33 ; 4.1 # [27] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER TTTHA
10A38..10A3A ; 4.1 # [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW
10A3F..10A47 ; 4.1 # [9] KHAROSHTHI VIRAMA..KHAROSHTHI NUMBER ONE THOUSAND
10A50..10A58 ; 4.1 # [9] KHAROSHTHI PUNCTUATION DOT..KHAROSHTHI PUNCTUATION LINES
1D200..1D245 ; 4.1 # [70] GREEK VOCAL NOTATION SYMBOL-1..GREEK MUSICAL LEIMMA
1D6A4..1D6A5 ; 4.1 # [2] MATHEMATICAL ITALIC SMALL DOTLESS I..MATHEMATICAL ITALIC SMALL DOTLESS J
# Total code points: 1273
# ================================================
# Newly assigned in Unicode 5.0.0 (July, 2006)
0242..024F ; 5.0 # [14] LATIN SMALL LETTER GLOTTAL STOP..LATIN SMALL LETTER Y WITH STROKE
037B..037D ; 5.0 # [3] GREEK SMALL REVERSED LUNATE SIGMA SYMBOL..GREEK SMALL REVERSED DOTTED LUNATE SIGMA SYMBOL
04CF ; 5.0 # CYRILLIC SMALL LETTER PALOCHKA
04FA..04FF ; 5.0 # [6] CYRILLIC CAPITAL LETTER GHE WITH STROKE AND HOOK..CYRILLIC SMALL LETTER HA WITH STROKE
0510..0513 ; 5.0 # [4] CYRILLIC CAPITAL LETTER REVERSED ZE..CYRILLIC SMALL LETTER EL WITH HOOK
05BA ; 5.0 # HEBREW POINT HOLAM HASER FOR VAV
07C0..07FA ; 5.0 # [59] NKO DIGIT ZERO..NKO LAJANYALAN
097B..097C ; 5.0 # [2] DEVANAGARI LETTER GGA..DEVANAGARI LETTER JJA
097E..097F ; 5.0 # [2] DEVANAGARI LETTER DDDA..DEVANAGARI LETTER BBA
0CE2..0CE3 ; 5.0 # [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL
0CF1..0CF2 ; 5.0 # [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA
1B00..1B4B ; 5.0 # [76] BALINESE SIGN ULU RICEM..BALINESE LETTER ASYURA SASAK
1B50..1B7C ; 5.0 # [45] BALINESE DIGIT ZERO..BALINESE MUSICAL SYMBOL LEFT-HAND OPEN PING
1DC4..1DCA ; 5.0 # [7] COMBINING MACRON-ACUTE..COMBINING LATIN SMALL LETTER R BELOW
1DFE..1DFF ; 5.0 # [2] COMBINING LEFT ARROWHEAD ABOVE..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW
20EC..20EF ; 5.0 # [4] COMBINING RIGHTWARDS HARPOON WITH BARB DOWNWARDS..COMBINING RIGHT ARROW BELOW
214D..214E ; 5.0 # [2] AKTIESELSKAB..TURNED SMALL F
2184 ; 5.0 # LATIN SMALL LETTER REVERSED C
23DC..23E7 ; 5.0 # [12] TOP PARENTHESIS..ELECTRICAL INTERSECTION
26B2 ; 5.0 # NEUTER
27C7..27CA ; 5.0 # [4] OR WITH DOT INSIDE..VERTICAL BAR WITH HORIZONTAL STROKE
2B14..2B1A ; 5.0 # [7] SQUARE WITH UPPER RIGHT DIAGONAL HALF BLACK..DOTTED SQUARE
2B20..2B23 ; 5.0 # [4] WHITE PENTAGON..HORIZONTAL BLACK HEXAGON
2C60..2C6C ; 5.0 # [13] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN SMALL LETTER Z WITH DESCENDER
2C74..2C77 ; 5.0 # [4] LATIN SMALL LETTER V WITH CURL..LATIN SMALL LETTER TAILLESS PHI
A717..A71A ; 5.0 # [4] MODIFIER LETTER DOT VERTICAL BAR..MODIFIER LETTER LOWER RIGHT CORNER ANGLE
A720..A721 ; 5.0 # [2] MODIFIER LETTER STRESS AND HIGH TONE..MODIFIER LETTER STRESS AND LOW TONE
A840..A877 ; 5.0 # [56] PHAGS-PA LETTER KA..PHAGS-PA MARK DOUBLE SHAD
10900..10919 ; 5.0 # [26] PHOENICIAN LETTER ALF..PHOENICIAN NUMBER ONE HUNDRED
1091F ; 5.0 # PHOENICIAN WORD SEPARATOR
12000..1236E ; 5.0 # [879] CUNEIFORM SIGN A..CUNEIFORM SIGN ZUM
12400..12462 ; 5.0 # [99] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN OLD ASSYRIAN ONE QUARTER
12470..12473 ; 5.0 # [4] CUNEIFORM PUNCTUATION SIGN OLD ASSYRIAN WORD DIVIDER..CUNEIFORM PUNCTUATION SIGN DIAGONAL TRICOLON
1D360..1D371 ; 5.0 # [18] COUNTING ROD UNIT DIGIT ONE..COUNTING ROD TENS DIGIT NINE
1D7CA..1D7CB ; 5.0 # [2] MATHEMATICAL BOLD CAPITAL DIGAMMA..MATHEMATICAL BOLD SMALL DIGAMMA
# Total code points: 1369
# EOF

File diff suppressed because it is too large Load Diff

File diff suppressed because it is too large Load Diff

File diff suppressed because it is too large Load Diff

View File

@ -0,0 +1,855 @@
# HangulSyllableType-5.0.0.txt
# Date: 2006-03-09, 23:14:14 GMT [MD]
#
# Unicode Character Database
# Copyright (c) 1991-2006 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
# For documentation, see UCD.html
# ================================================
# Property: Hangul_Syllable_Type
# All code points not explicitly listed for Hangul_Syllable_Type
# have the value Not_Applicable (NA).
# @missing: 0000..10FFFF; Not_Applicable
# ================================================
# Hangul_Syllable_Type=Leading_Jamo
1100..1159 ; L # Lo [90] HANGUL CHOSEONG KIYEOK..HANGUL CHOSEONG YEORINHIEUH
115F ; L # Lo HANGUL CHOSEONG FILLER
# Total code points: 91
# ================================================
# Hangul_Syllable_Type=Vowel_Jamo
1160..11A2 ; V # Lo [67] HANGUL JUNGSEONG FILLER..HANGUL JUNGSEONG SSANGARAEA
# Total code points: 67
# ================================================
# Hangul_Syllable_Type=Trailing_Jamo
11A8..11F9 ; T # Lo [82] HANGUL JONGSEONG KIYEOK..HANGUL JONGSEONG YEORINHIEUH
# Total code points: 82
# ================================================
# Hangul_Syllable_Type=LV_Syllable
AC00 ; LV # Lo HANGUL SYLLABLE GA
AC1C ; LV # Lo HANGUL SYLLABLE GAE
AC38 ; LV # Lo HANGUL SYLLABLE GYA
AC54 ; LV # Lo HANGUL SYLLABLE GYAE
AC70 ; LV # Lo HANGUL SYLLABLE GEO
AC8C ; LV # Lo HANGUL SYLLABLE GE
ACA8 ; LV # Lo HANGUL SYLLABLE GYEO
ACC4 ; LV # Lo HANGUL SYLLABLE GYE
ACE0 ; LV # Lo HANGUL SYLLABLE GO
ACFC ; LV # Lo HANGUL SYLLABLE GWA
AD18 ; LV # Lo HANGUL SYLLABLE GWAE
AD34 ; LV # Lo HANGUL SYLLABLE GOE
AD50 ; LV # Lo HANGUL SYLLABLE GYO
AD6C ; LV # Lo HANGUL SYLLABLE GU
AD88 ; LV # Lo HANGUL SYLLABLE GWEO
ADA4 ; LV # Lo HANGUL SYLLABLE GWE
ADC0 ; LV # Lo HANGUL SYLLABLE GWI
ADDC ; LV # Lo HANGUL SYLLABLE GYU
ADF8 ; LV # Lo HANGUL SYLLABLE GEU
AE14 ; LV # Lo HANGUL SYLLABLE GYI
AE30 ; LV # Lo HANGUL SYLLABLE GI
AE4C ; LV # Lo HANGUL SYLLABLE GGA
AE68 ; LV # Lo HANGUL SYLLABLE GGAE
AE84 ; LV # Lo HANGUL SYLLABLE GGYA
AEA0 ; LV # Lo HANGUL SYLLABLE GGYAE
AEBC ; LV # Lo HANGUL SYLLABLE GGEO
AED8 ; LV # Lo HANGUL SYLLABLE GGE
AEF4 ; LV # Lo HANGUL SYLLABLE GGYEO
AF10 ; LV # Lo HANGUL SYLLABLE GGYE
AF2C ; LV # Lo HANGUL SYLLABLE GGO
AF48 ; LV # Lo HANGUL SYLLABLE GGWA
AF64 ; LV # Lo HANGUL SYLLABLE GGWAE
AF80 ; LV # Lo HANGUL SYLLABLE GGOE
AF9C ; LV # Lo HANGUL SYLLABLE GGYO
AFB8 ; LV # Lo HANGUL SYLLABLE GGU
AFD4 ; LV # Lo HANGUL SYLLABLE GGWEO
AFF0 ; LV # Lo HANGUL SYLLABLE GGWE
B00C ; LV # Lo HANGUL SYLLABLE GGWI
B028 ; LV # Lo HANGUL SYLLABLE GGYU
B044 ; LV # Lo HANGUL SYLLABLE GGEU
B060 ; LV # Lo HANGUL SYLLABLE GGYI
B07C ; LV # Lo HANGUL SYLLABLE GGI
B098 ; LV # Lo HANGUL SYLLABLE NA
B0B4 ; LV # Lo HANGUL SYLLABLE NAE
B0D0 ; LV # Lo HANGUL SYLLABLE NYA
B0EC ; LV # Lo HANGUL SYLLABLE NYAE
B108 ; LV # Lo HANGUL SYLLABLE NEO
B124 ; LV # Lo HANGUL SYLLABLE NE
B140 ; LV # Lo HANGUL SYLLABLE NYEO
B15C ; LV # Lo HANGUL SYLLABLE NYE
B178 ; LV # Lo HANGUL SYLLABLE NO
B194 ; LV # Lo HANGUL SYLLABLE NWA
B1B0 ; LV # Lo HANGUL SYLLABLE NWAE
B1CC ; LV # Lo HANGUL SYLLABLE NOE
B1E8 ; LV # Lo HANGUL SYLLABLE NYO
B204 ; LV # Lo HANGUL SYLLABLE NU
B220 ; LV # Lo HANGUL SYLLABLE NWEO
B23C ; LV # Lo HANGUL SYLLABLE NWE
B258 ; LV # Lo HANGUL SYLLABLE NWI
B274 ; LV # Lo HANGUL SYLLABLE NYU
B290 ; LV # Lo HANGUL SYLLABLE NEU
B2AC ; LV # Lo HANGUL SYLLABLE NYI
B2C8 ; LV # Lo HANGUL SYLLABLE NI
B2E4 ; LV # Lo HANGUL SYLLABLE DA
B300 ; LV # Lo HANGUL SYLLABLE DAE
B31C ; LV # Lo HANGUL SYLLABLE DYA
B338 ; LV # Lo HANGUL SYLLABLE DYAE
B354 ; LV # Lo HANGUL SYLLABLE DEO
B370 ; LV # Lo HANGUL SYLLABLE DE
B38C ; LV # Lo HANGUL SYLLABLE DYEO
B3A8 ; LV # Lo HANGUL SYLLABLE DYE
B3C4 ; LV # Lo HANGUL SYLLABLE DO
B3E0 ; LV # Lo HANGUL SYLLABLE DWA
B3FC ; LV # Lo HANGUL SYLLABLE DWAE
B418 ; LV # Lo HANGUL SYLLABLE DOE
B434 ; LV # Lo HANGUL SYLLABLE DYO
B450 ; LV # Lo HANGUL SYLLABLE DU
B46C ; LV # Lo HANGUL SYLLABLE DWEO
B488 ; LV # Lo HANGUL SYLLABLE DWE
B4A4 ; LV # Lo HANGUL SYLLABLE DWI
B4C0 ; LV # Lo HANGUL SYLLABLE DYU
B4DC ; LV # Lo HANGUL SYLLABLE DEU
B4F8 ; LV # Lo HANGUL SYLLABLE DYI
B514 ; LV # Lo HANGUL SYLLABLE DI
B530 ; LV # Lo HANGUL SYLLABLE DDA
B54C ; LV # Lo HANGUL SYLLABLE DDAE
B568 ; LV # Lo HANGUL SYLLABLE DDYA
B584 ; LV # Lo HANGUL SYLLABLE DDYAE
B5A0 ; LV # Lo HANGUL SYLLABLE DDEO
B5BC ; LV # Lo HANGUL SYLLABLE DDE
B5D8 ; LV # Lo HANGUL SYLLABLE DDYEO
B5F4 ; LV # Lo HANGUL SYLLABLE DDYE
B610 ; LV # Lo HANGUL SYLLABLE DDO
B62C ; LV # Lo HANGUL SYLLABLE DDWA
B648 ; LV # Lo HANGUL SYLLABLE DDWAE
B664 ; LV # Lo HANGUL SYLLABLE DDOE
B680 ; LV # Lo HANGUL SYLLABLE DDYO
B69C ; LV # Lo HANGUL SYLLABLE DDU
B6B8 ; LV # Lo HANGUL SYLLABLE DDWEO
B6D4 ; LV # Lo HANGUL SYLLABLE DDWE
B6F0 ; LV # Lo HANGUL SYLLABLE DDWI
B70C ; LV # Lo HANGUL SYLLABLE DDYU
B728 ; LV # Lo HANGUL SYLLABLE DDEU
B744 ; LV # Lo HANGUL SYLLABLE DDYI
B760 ; LV # Lo HANGUL SYLLABLE DDI
B77C ; LV # Lo HANGUL SYLLABLE RA
B798 ; LV # Lo HANGUL SYLLABLE RAE
B7B4 ; LV # Lo HANGUL SYLLABLE RYA
B7D0 ; LV # Lo HANGUL SYLLABLE RYAE
B7EC ; LV # Lo HANGUL SYLLABLE REO
B808 ; LV # Lo HANGUL SYLLABLE RE
B824 ; LV # Lo HANGUL SYLLABLE RYEO
B840 ; LV # Lo HANGUL SYLLABLE RYE
B85C ; LV # Lo HANGUL SYLLABLE RO
B878 ; LV # Lo HANGUL SYLLABLE RWA
B894 ; LV # Lo HANGUL SYLLABLE RWAE
B8B0 ; LV # Lo HANGUL SYLLABLE ROE
B8CC ; LV # Lo HANGUL SYLLABLE RYO
B8E8 ; LV # Lo HANGUL SYLLABLE RU
B904 ; LV # Lo HANGUL SYLLABLE RWEO
B920 ; LV # Lo HANGUL SYLLABLE RWE
B93C ; LV # Lo HANGUL SYLLABLE RWI
B958 ; LV # Lo HANGUL SYLLABLE RYU
B974 ; LV # Lo HANGUL SYLLABLE REU
B990 ; LV # Lo HANGUL SYLLABLE RYI
B9AC ; LV # Lo HANGUL SYLLABLE RI
B9C8 ; LV # Lo HANGUL SYLLABLE MA
B9E4 ; LV # Lo HANGUL SYLLABLE MAE
BA00 ; LV # Lo HANGUL SYLLABLE MYA
BA1C ; LV # Lo HANGUL SYLLABLE MYAE
BA38 ; LV # Lo HANGUL SYLLABLE MEO
BA54 ; LV # Lo HANGUL SYLLABLE ME
BA70 ; LV # Lo HANGUL SYLLABLE MYEO
BA8C ; LV # Lo HANGUL SYLLABLE MYE
BAA8 ; LV # Lo HANGUL SYLLABLE MO
BAC4 ; LV # Lo HANGUL SYLLABLE MWA
BAE0 ; LV # Lo HANGUL SYLLABLE MWAE
BAFC ; LV # Lo HANGUL SYLLABLE MOE
BB18 ; LV # Lo HANGUL SYLLABLE MYO
BB34 ; LV # Lo HANGUL SYLLABLE MU
BB50 ; LV # Lo HANGUL SYLLABLE MWEO
BB6C ; LV # Lo HANGUL SYLLABLE MWE
BB88 ; LV # Lo HANGUL SYLLABLE MWI
BBA4 ; LV # Lo HANGUL SYLLABLE MYU
BBC0 ; LV # Lo HANGUL SYLLABLE MEU
BBDC ; LV # Lo HANGUL SYLLABLE MYI
BBF8 ; LV # Lo HANGUL SYLLABLE MI
BC14 ; LV # Lo HANGUL SYLLABLE BA
BC30 ; LV # Lo HANGUL SYLLABLE BAE
BC4C ; LV # Lo HANGUL SYLLABLE BYA
BC68 ; LV # Lo HANGUL SYLLABLE BYAE
BC84 ; LV # Lo HANGUL SYLLABLE BEO
BCA0 ; LV # Lo HANGUL SYLLABLE BE
BCBC ; LV # Lo HANGUL SYLLABLE BYEO
BCD8 ; LV # Lo HANGUL SYLLABLE BYE
BCF4 ; LV # Lo HANGUL SYLLABLE BO
BD10 ; LV # Lo HANGUL SYLLABLE BWA
BD2C ; LV # Lo HANGUL SYLLABLE BWAE
BD48 ; LV # Lo HANGUL SYLLABLE BOE
BD64 ; LV # Lo HANGUL SYLLABLE BYO
BD80 ; LV # Lo HANGUL SYLLABLE BU
BD9C ; LV # Lo HANGUL SYLLABLE BWEO
BDB8 ; LV # Lo HANGUL SYLLABLE BWE
BDD4 ; LV # Lo HANGUL SYLLABLE BWI
BDF0 ; LV # Lo HANGUL SYLLABLE BYU
BE0C ; LV # Lo HANGUL SYLLABLE BEU
BE28 ; LV # Lo HANGUL SYLLABLE BYI
BE44 ; LV # Lo HANGUL SYLLABLE BI
BE60 ; LV # Lo HANGUL SYLLABLE BBA
BE7C ; LV # Lo HANGUL SYLLABLE BBAE
BE98 ; LV # Lo HANGUL SYLLABLE BBYA
BEB4 ; LV # Lo HANGUL SYLLABLE BBYAE
BED0 ; LV # Lo HANGUL SYLLABLE BBEO
BEEC ; LV # Lo HANGUL SYLLABLE BBE
BF08 ; LV # Lo HANGUL SYLLABLE BBYEO
BF24 ; LV # Lo HANGUL SYLLABLE BBYE
BF40 ; LV # Lo HANGUL SYLLABLE BBO
BF5C ; LV # Lo HANGUL SYLLABLE BBWA
BF78 ; LV # Lo HANGUL SYLLABLE BBWAE
BF94 ; LV # Lo HANGUL SYLLABLE BBOE
BFB0 ; LV # Lo HANGUL SYLLABLE BBYO
BFCC ; LV # Lo HANGUL SYLLABLE BBU
BFE8 ; LV # Lo HANGUL SYLLABLE BBWEO
C004 ; LV # Lo HANGUL SYLLABLE BBWE
C020 ; LV # Lo HANGUL SYLLABLE BBWI
C03C ; LV # Lo HANGUL SYLLABLE BBYU
C058 ; LV # Lo HANGUL SYLLABLE BBEU
C074 ; LV # Lo HANGUL SYLLABLE BBYI
C090 ; LV # Lo HANGUL SYLLABLE BBI
C0AC ; LV # Lo HANGUL SYLLABLE SA
C0C8 ; LV # Lo HANGUL SYLLABLE SAE
C0E4 ; LV # Lo HANGUL SYLLABLE SYA
C100 ; LV # Lo HANGUL SYLLABLE SYAE
C11C ; LV # Lo HANGUL SYLLABLE SEO
C138 ; LV # Lo HANGUL SYLLABLE SE
C154 ; LV # Lo HANGUL SYLLABLE SYEO
C170 ; LV # Lo HANGUL SYLLABLE SYE
C18C ; LV # Lo HANGUL SYLLABLE SO
C1A8 ; LV # Lo HANGUL SYLLABLE SWA
C1C4 ; LV # Lo HANGUL SYLLABLE SWAE
C1E0 ; LV # Lo HANGUL SYLLABLE SOE
C1FC ; LV # Lo HANGUL SYLLABLE SYO
C218 ; LV # Lo HANGUL SYLLABLE SU
C234 ; LV # Lo HANGUL SYLLABLE SWEO
C250 ; LV # Lo HANGUL SYLLABLE SWE
C26C ; LV # Lo HANGUL SYLLABLE SWI
C288 ; LV # Lo HANGUL SYLLABLE SYU
C2A4 ; LV # Lo HANGUL SYLLABLE SEU
C2C0 ; LV # Lo HANGUL SYLLABLE SYI
C2DC ; LV # Lo HANGUL SYLLABLE SI
C2F8 ; LV # Lo HANGUL SYLLABLE SSA
C314 ; LV # Lo HANGUL SYLLABLE SSAE
C330 ; LV # Lo HANGUL SYLLABLE SSYA
C34C ; LV # Lo HANGUL SYLLABLE SSYAE
C368 ; LV # Lo HANGUL SYLLABLE SSEO
C384 ; LV # Lo HANGUL SYLLABLE SSE
C3A0 ; LV # Lo HANGUL SYLLABLE SSYEO
C3BC ; LV # Lo HANGUL SYLLABLE SSYE
C3D8 ; LV # Lo HANGUL SYLLABLE SSO
C3F4 ; LV # Lo HANGUL SYLLABLE SSWA
C410 ; LV # Lo HANGUL SYLLABLE SSWAE
C42C ; LV # Lo HANGUL SYLLABLE SSOE
C448 ; LV # Lo HANGUL SYLLABLE SSYO
C464 ; LV # Lo HANGUL SYLLABLE SSU
C480 ; LV # Lo HANGUL SYLLABLE SSWEO
C49C ; LV # Lo HANGUL SYLLABLE SSWE
C4B8 ; LV # Lo HANGUL SYLLABLE SSWI
C4D4 ; LV # Lo HANGUL SYLLABLE SSYU
C4F0 ; LV # Lo HANGUL SYLLABLE SSEU
C50C ; LV # Lo HANGUL SYLLABLE SSYI
C528 ; LV # Lo HANGUL SYLLABLE SSI
C544 ; LV # Lo HANGUL SYLLABLE A
C560 ; LV # Lo HANGUL SYLLABLE AE
C57C ; LV # Lo HANGUL SYLLABLE YA
C598 ; LV # Lo HANGUL SYLLABLE YAE
C5B4 ; LV # Lo HANGUL SYLLABLE EO
C5D0 ; LV # Lo HANGUL SYLLABLE E
C5EC ; LV # Lo HANGUL SYLLABLE YEO
C608 ; LV # Lo HANGUL SYLLABLE YE
C624 ; LV # Lo HANGUL SYLLABLE O
C640 ; LV # Lo HANGUL SYLLABLE WA
C65C ; LV # Lo HANGUL SYLLABLE WAE
C678 ; LV # Lo HANGUL SYLLABLE OE
C694 ; LV # Lo HANGUL SYLLABLE YO
C6B0 ; LV # Lo HANGUL SYLLABLE U
C6CC ; LV # Lo HANGUL SYLLABLE WEO
C6E8 ; LV # Lo HANGUL SYLLABLE WE
C704 ; LV # Lo HANGUL SYLLABLE WI
C720 ; LV # Lo HANGUL SYLLABLE YU
C73C ; LV # Lo HANGUL SYLLABLE EU
C758 ; LV # Lo HANGUL SYLLABLE YI
C774 ; LV # Lo HANGUL SYLLABLE I
C790 ; LV # Lo HANGUL SYLLABLE JA
C7AC ; LV # Lo HANGUL SYLLABLE JAE
C7C8 ; LV # Lo HANGUL SYLLABLE JYA
C7E4 ; LV # Lo HANGUL SYLLABLE JYAE
C800 ; LV # Lo HANGUL SYLLABLE JEO
C81C ; LV # Lo HANGUL SYLLABLE JE
C838 ; LV # Lo HANGUL SYLLABLE JYEO
C854 ; LV # Lo HANGUL SYLLABLE JYE
C870 ; LV # Lo HANGUL SYLLABLE JO
C88C ; LV # Lo HANGUL SYLLABLE JWA
C8A8 ; LV # Lo HANGUL SYLLABLE JWAE
C8C4 ; LV # Lo HANGUL SYLLABLE JOE
C8E0 ; LV # Lo HANGUL SYLLABLE JYO
C8FC ; LV # Lo HANGUL SYLLABLE JU
C918 ; LV # Lo HANGUL SYLLABLE JWEO
C934 ; LV # Lo HANGUL SYLLABLE JWE
C950 ; LV # Lo HANGUL SYLLABLE JWI
C96C ; LV # Lo HANGUL SYLLABLE JYU
C988 ; LV # Lo HANGUL SYLLABLE JEU
C9A4 ; LV # Lo HANGUL SYLLABLE JYI
C9C0 ; LV # Lo HANGUL SYLLABLE JI
C9DC ; LV # Lo HANGUL SYLLABLE JJA
C9F8 ; LV # Lo HANGUL SYLLABLE JJAE
CA14 ; LV # Lo HANGUL SYLLABLE JJYA
CA30 ; LV # Lo HANGUL SYLLABLE JJYAE
CA4C ; LV # Lo HANGUL SYLLABLE JJEO
CA68 ; LV # Lo HANGUL SYLLABLE JJE
CA84 ; LV # Lo HANGUL SYLLABLE JJYEO
CAA0 ; LV # Lo HANGUL SYLLABLE JJYE
CABC ; LV # Lo HANGUL SYLLABLE JJO
CAD8 ; LV # Lo HANGUL SYLLABLE JJWA
CAF4 ; LV # Lo HANGUL SYLLABLE JJWAE
CB10 ; LV # Lo HANGUL SYLLABLE JJOE
CB2C ; LV # Lo HANGUL SYLLABLE JJYO
CB48 ; LV # Lo HANGUL SYLLABLE JJU
CB64 ; LV # Lo HANGUL SYLLABLE JJWEO
CB80 ; LV # Lo HANGUL SYLLABLE JJWE
CB9C ; LV # Lo HANGUL SYLLABLE JJWI
CBB8 ; LV # Lo HANGUL SYLLABLE JJYU
CBD4 ; LV # Lo HANGUL SYLLABLE JJEU
CBF0 ; LV # Lo HANGUL SYLLABLE JJYI
CC0C ; LV # Lo HANGUL SYLLABLE JJI
CC28 ; LV # Lo HANGUL SYLLABLE CA
CC44 ; LV # Lo HANGUL SYLLABLE CAE
CC60 ; LV # Lo HANGUL SYLLABLE CYA
CC7C ; LV # Lo HANGUL SYLLABLE CYAE
CC98 ; LV # Lo HANGUL SYLLABLE CEO
CCB4 ; LV # Lo HANGUL SYLLABLE CE
CCD0 ; LV # Lo HANGUL SYLLABLE CYEO
CCEC ; LV # Lo HANGUL SYLLABLE CYE
CD08 ; LV # Lo HANGUL SYLLABLE CO
CD24 ; LV # Lo HANGUL SYLLABLE CWA
CD40 ; LV # Lo HANGUL SYLLABLE CWAE
CD5C ; LV # Lo HANGUL SYLLABLE COE
CD78 ; LV # Lo HANGUL SYLLABLE CYO
CD94 ; LV # Lo HANGUL SYLLABLE CU
CDB0 ; LV # Lo HANGUL SYLLABLE CWEO
CDCC ; LV # Lo HANGUL SYLLABLE CWE
CDE8 ; LV # Lo HANGUL SYLLABLE CWI
CE04 ; LV # Lo HANGUL SYLLABLE CYU
CE20 ; LV # Lo HANGUL SYLLABLE CEU
CE3C ; LV # Lo HANGUL SYLLABLE CYI
CE58 ; LV # Lo HANGUL SYLLABLE CI
CE74 ; LV # Lo HANGUL SYLLABLE KA
CE90 ; LV # Lo HANGUL SYLLABLE KAE
CEAC ; LV # Lo HANGUL SYLLABLE KYA
CEC8 ; LV # Lo HANGUL SYLLABLE KYAE
CEE4 ; LV # Lo HANGUL SYLLABLE KEO
CF00 ; LV # Lo HANGUL SYLLABLE KE
CF1C ; LV # Lo HANGUL SYLLABLE KYEO
CF38 ; LV # Lo HANGUL SYLLABLE KYE
CF54 ; LV # Lo HANGUL SYLLABLE KO
CF70 ; LV # Lo HANGUL SYLLABLE KWA
CF8C ; LV # Lo HANGUL SYLLABLE KWAE
CFA8 ; LV # Lo HANGUL SYLLABLE KOE
CFC4 ; LV # Lo HANGUL SYLLABLE KYO
CFE0 ; LV # Lo HANGUL SYLLABLE KU
CFFC ; LV # Lo HANGUL SYLLABLE KWEO
D018 ; LV # Lo HANGUL SYLLABLE KWE
D034 ; LV # Lo HANGUL SYLLABLE KWI
D050 ; LV # Lo HANGUL SYLLABLE KYU
D06C ; LV # Lo HANGUL SYLLABLE KEU
D088 ; LV # Lo HANGUL SYLLABLE KYI
D0A4 ; LV # Lo HANGUL SYLLABLE KI
D0C0 ; LV # Lo HANGUL SYLLABLE TA
D0DC ; LV # Lo HANGUL SYLLABLE TAE
D0F8 ; LV # Lo HANGUL SYLLABLE TYA
D114 ; LV # Lo HANGUL SYLLABLE TYAE
D130 ; LV # Lo HANGUL SYLLABLE TEO
D14C ; LV # Lo HANGUL SYLLABLE TE
D168 ; LV # Lo HANGUL SYLLABLE TYEO
D184 ; LV # Lo HANGUL SYLLABLE TYE
D1A0 ; LV # Lo HANGUL SYLLABLE TO
D1BC ; LV # Lo HANGUL SYLLABLE TWA
D1D8 ; LV # Lo HANGUL SYLLABLE TWAE
D1F4 ; LV # Lo HANGUL SYLLABLE TOE
D210 ; LV # Lo HANGUL SYLLABLE TYO
D22C ; LV # Lo HANGUL SYLLABLE TU
D248 ; LV # Lo HANGUL SYLLABLE TWEO
D264 ; LV # Lo HANGUL SYLLABLE TWE
D280 ; LV # Lo HANGUL SYLLABLE TWI
D29C ; LV # Lo HANGUL SYLLABLE TYU
D2B8 ; LV # Lo HANGUL SYLLABLE TEU
D2D4 ; LV # Lo HANGUL SYLLABLE TYI
D2F0 ; LV # Lo HANGUL SYLLABLE TI
D30C ; LV # Lo HANGUL SYLLABLE PA
D328 ; LV # Lo HANGUL SYLLABLE PAE
D344 ; LV # Lo HANGUL SYLLABLE PYA
D360 ; LV # Lo HANGUL SYLLABLE PYAE
D37C ; LV # Lo HANGUL SYLLABLE PEO
D398 ; LV # Lo HANGUL SYLLABLE PE
D3B4 ; LV # Lo HANGUL SYLLABLE PYEO
D3D0 ; LV # Lo HANGUL SYLLABLE PYE
D3EC ; LV # Lo HANGUL SYLLABLE PO
D408 ; LV # Lo HANGUL SYLLABLE PWA
D424 ; LV # Lo HANGUL SYLLABLE PWAE
D440 ; LV # Lo HANGUL SYLLABLE POE
D45C ; LV # Lo HANGUL SYLLABLE PYO
D478 ; LV # Lo HANGUL SYLLABLE PU
D494 ; LV # Lo HANGUL SYLLABLE PWEO
D4B0 ; LV # Lo HANGUL SYLLABLE PWE
D4CC ; LV # Lo HANGUL SYLLABLE PWI
D4E8 ; LV # Lo HANGUL SYLLABLE PYU
D504 ; LV # Lo HANGUL SYLLABLE PEU
D520 ; LV # Lo HANGUL SYLLABLE PYI
D53C ; LV # Lo HANGUL SYLLABLE PI
D558 ; LV # Lo HANGUL SYLLABLE HA
D574 ; LV # Lo HANGUL SYLLABLE HAE
D590 ; LV # Lo HANGUL SYLLABLE HYA
D5AC ; LV # Lo HANGUL SYLLABLE HYAE
D5C8 ; LV # Lo HANGUL SYLLABLE HEO
D5E4 ; LV # Lo HANGUL SYLLABLE HE
D600 ; LV # Lo HANGUL SYLLABLE HYEO
D61C ; LV # Lo HANGUL SYLLABLE HYE
D638 ; LV # Lo HANGUL SYLLABLE HO
D654 ; LV # Lo HANGUL SYLLABLE HWA
D670 ; LV # Lo HANGUL SYLLABLE HWAE
D68C ; LV # Lo HANGUL SYLLABLE HOE
D6A8 ; LV # Lo HANGUL SYLLABLE HYO
D6C4 ; LV # Lo HANGUL SYLLABLE HU
D6E0 ; LV # Lo HANGUL SYLLABLE HWEO
D6FC ; LV # Lo HANGUL SYLLABLE HWE
D718 ; LV # Lo HANGUL SYLLABLE HWI
D734 ; LV # Lo HANGUL SYLLABLE HYU
D750 ; LV # Lo HANGUL SYLLABLE HEU
D76C ; LV # Lo HANGUL SYLLABLE HYI
D788 ; LV # Lo HANGUL SYLLABLE HI
# Total code points: 399
# ================================================
# Hangul_Syllable_Type=LVT_Syllable
AC01..AC1B ; LVT # Lo [27] HANGUL SYLLABLE GAG..HANGUL SYLLABLE GAH
AC1D..AC37 ; LVT # Lo [27] HANGUL SYLLABLE GAEG..HANGUL SYLLABLE GAEH
AC39..AC53 ; LVT # Lo [27] HANGUL SYLLABLE GYAG..HANGUL SYLLABLE GYAH
AC55..AC6F ; LVT # Lo [27] HANGUL SYLLABLE GYAEG..HANGUL SYLLABLE GYAEH
AC71..AC8B ; LVT # Lo [27] HANGUL SYLLABLE GEOG..HANGUL SYLLABLE GEOH
AC8D..ACA7 ; LVT # Lo [27] HANGUL SYLLABLE GEG..HANGUL SYLLABLE GEH
ACA9..ACC3 ; LVT # Lo [27] HANGUL SYLLABLE GYEOG..HANGUL SYLLABLE GYEOH
ACC5..ACDF ; LVT # Lo [27] HANGUL SYLLABLE GYEG..HANGUL SYLLABLE GYEH
ACE1..ACFB ; LVT # Lo [27] HANGUL SYLLABLE GOG..HANGUL SYLLABLE GOH
ACFD..AD17 ; LVT # Lo [27] HANGUL SYLLABLE GWAG..HANGUL SYLLABLE GWAH
AD19..AD33 ; LVT # Lo [27] HANGUL SYLLABLE GWAEG..HANGUL SYLLABLE GWAEH
AD35..AD4F ; LVT # Lo [27] HANGUL SYLLABLE GOEG..HANGUL SYLLABLE GOEH
AD51..AD6B ; LVT # Lo [27] HANGUL SYLLABLE GYOG..HANGUL SYLLABLE GYOH
AD6D..AD87 ; LVT # Lo [27] HANGUL SYLLABLE GUG..HANGUL SYLLABLE GUH
AD89..ADA3 ; LVT # Lo [27] HANGUL SYLLABLE GWEOG..HANGUL SYLLABLE GWEOH
ADA5..ADBF ; LVT # Lo [27] HANGUL SYLLABLE GWEG..HANGUL SYLLABLE GWEH
ADC1..ADDB ; LVT # Lo [27] HANGUL SYLLABLE GWIG..HANGUL SYLLABLE GWIH
ADDD..ADF7 ; LVT # Lo [27] HANGUL SYLLABLE GYUG..HANGUL SYLLABLE GYUH
ADF9..AE13 ; LVT # Lo [27] HANGUL SYLLABLE GEUG..HANGUL SYLLABLE GEUH
AE15..AE2F ; LVT # Lo [27] HANGUL SYLLABLE GYIG..HANGUL SYLLABLE GYIH
AE31..AE4B ; LVT # Lo [27] HANGUL SYLLABLE GIG..HANGUL SYLLABLE GIH
AE4D..AE67 ; LVT # Lo [27] HANGUL SYLLABLE GGAG..HANGUL SYLLABLE GGAH
AE69..AE83 ; LVT # Lo [27] HANGUL SYLLABLE GGAEG..HANGUL SYLLABLE GGAEH
AE85..AE9F ; LVT # Lo [27] HANGUL SYLLABLE GGYAG..HANGUL SYLLABLE GGYAH
AEA1..AEBB ; LVT # Lo [27] HANGUL SYLLABLE GGYAEG..HANGUL SYLLABLE GGYAEH
AEBD..AED7 ; LVT # Lo [27] HANGUL SYLLABLE GGEOG..HANGUL SYLLABLE GGEOH
AED9..AEF3 ; LVT # Lo [27] HANGUL SYLLABLE GGEG..HANGUL SYLLABLE GGEH
AEF5..AF0F ; LVT # Lo [27] HANGUL SYLLABLE GGYEOG..HANGUL SYLLABLE GGYEOH
AF11..AF2B ; LVT # Lo [27] HANGUL SYLLABLE GGYEG..HANGUL SYLLABLE GGYEH
AF2D..AF47 ; LVT # Lo [27] HANGUL SYLLABLE GGOG..HANGUL SYLLABLE GGOH
AF49..AF63 ; LVT # Lo [27] HANGUL SYLLABLE GGWAG..HANGUL SYLLABLE GGWAH
AF65..AF7F ; LVT # Lo [27] HANGUL SYLLABLE GGWAEG..HANGUL SYLLABLE GGWAEH
AF81..AF9B ; LVT # Lo [27] HANGUL SYLLABLE GGOEG..HANGUL SYLLABLE GGOEH
AF9D..AFB7 ; LVT # Lo [27] HANGUL SYLLABLE GGYOG..HANGUL SYLLABLE GGYOH
AFB9..AFD3 ; LVT # Lo [27] HANGUL SYLLABLE GGUG..HANGUL SYLLABLE GGUH
AFD5..AFEF ; LVT # Lo [27] HANGUL SYLLABLE GGWEOG..HANGUL SYLLABLE GGWEOH
AFF1..B00B ; LVT # Lo [27] HANGUL SYLLABLE GGWEG..HANGUL SYLLABLE GGWEH
B00D..B027 ; LVT # Lo [27] HANGUL SYLLABLE GGWIG..HANGUL SYLLABLE GGWIH
B029..B043 ; LVT # Lo [27] HANGUL SYLLABLE GGYUG..HANGUL SYLLABLE GGYUH
B045..B05F ; LVT # Lo [27] HANGUL SYLLABLE GGEUG..HANGUL SYLLABLE GGEUH
B061..B07B ; LVT # Lo [27] HANGUL SYLLABLE GGYIG..HANGUL SYLLABLE GGYIH
B07D..B097 ; LVT # Lo [27] HANGUL SYLLABLE GGIG..HANGUL SYLLABLE GGIH
B099..B0B3 ; LVT # Lo [27] HANGUL SYLLABLE NAG..HANGUL SYLLABLE NAH
B0B5..B0CF ; LVT # Lo [27] HANGUL SYLLABLE NAEG..HANGUL SYLLABLE NAEH
B0D1..B0EB ; LVT # Lo [27] HANGUL SYLLABLE NYAG..HANGUL SYLLABLE NYAH
B0ED..B107 ; LVT # Lo [27] HANGUL SYLLABLE NYAEG..HANGUL SYLLABLE NYAEH
B109..B123 ; LVT # Lo [27] HANGUL SYLLABLE NEOG..HANGUL SYLLABLE NEOH
B125..B13F ; LVT # Lo [27] HANGUL SYLLABLE NEG..HANGUL SYLLABLE NEH
B141..B15B ; LVT # Lo [27] HANGUL SYLLABLE NYEOG..HANGUL SYLLABLE NYEOH
B15D..B177 ; LVT # Lo [27] HANGUL SYLLABLE NYEG..HANGUL SYLLABLE NYEH
B179..B193 ; LVT # Lo [27] HANGUL SYLLABLE NOG..HANGUL SYLLABLE NOH
B195..B1AF ; LVT # Lo [27] HANGUL SYLLABLE NWAG..HANGUL SYLLABLE NWAH
B1B1..B1CB ; LVT # Lo [27] HANGUL SYLLABLE NWAEG..HANGUL SYLLABLE NWAEH
B1CD..B1E7 ; LVT # Lo [27] HANGUL SYLLABLE NOEG..HANGUL SYLLABLE NOEH
B1E9..B203 ; LVT # Lo [27] HANGUL SYLLABLE NYOG..HANGUL SYLLABLE NYOH
B205..B21F ; LVT # Lo [27] HANGUL SYLLABLE NUG..HANGUL SYLLABLE NUH
B221..B23B ; LVT # Lo [27] HANGUL SYLLABLE NWEOG..HANGUL SYLLABLE NWEOH
B23D..B257 ; LVT # Lo [27] HANGUL SYLLABLE NWEG..HANGUL SYLLABLE NWEH
B259..B273 ; LVT # Lo [27] HANGUL SYLLABLE NWIG..HANGUL SYLLABLE NWIH
B275..B28F ; LVT # Lo [27] HANGUL SYLLABLE NYUG..HANGUL SYLLABLE NYUH
B291..B2AB ; LVT # Lo [27] HANGUL SYLLABLE NEUG..HANGUL SYLLABLE NEUH
B2AD..B2C7 ; LVT # Lo [27] HANGUL SYLLABLE NYIG..HANGUL SYLLABLE NYIH
B2C9..B2E3 ; LVT # Lo [27] HANGUL SYLLABLE NIG..HANGUL SYLLABLE NIH
B2E5..B2FF ; LVT # Lo [27] HANGUL SYLLABLE DAG..HANGUL SYLLABLE DAH
B301..B31B ; LVT # Lo [27] HANGUL SYLLABLE DAEG..HANGUL SYLLABLE DAEH
B31D..B337 ; LVT # Lo [27] HANGUL SYLLABLE DYAG..HANGUL SYLLABLE DYAH
B339..B353 ; LVT # Lo [27] HANGUL SYLLABLE DYAEG..HANGUL SYLLABLE DYAEH
B355..B36F ; LVT # Lo [27] HANGUL SYLLABLE DEOG..HANGUL SYLLABLE DEOH
B371..B38B ; LVT # Lo [27] HANGUL SYLLABLE DEG..HANGUL SYLLABLE DEH
B38D..B3A7 ; LVT # Lo [27] HANGUL SYLLABLE DYEOG..HANGUL SYLLABLE DYEOH
B3A9..B3C3 ; LVT # Lo [27] HANGUL SYLLABLE DYEG..HANGUL SYLLABLE DYEH
B3C5..B3DF ; LVT # Lo [27] HANGUL SYLLABLE DOG..HANGUL SYLLABLE DOH
B3E1..B3FB ; LVT # Lo [27] HANGUL SYLLABLE DWAG..HANGUL SYLLABLE DWAH
B3FD..B417 ; LVT # Lo [27] HANGUL SYLLABLE DWAEG..HANGUL SYLLABLE DWAEH
B419..B433 ; LVT # Lo [27] HANGUL SYLLABLE DOEG..HANGUL SYLLABLE DOEH
B435..B44F ; LVT # Lo [27] HANGUL SYLLABLE DYOG..HANGUL SYLLABLE DYOH
B451..B46B ; LVT # Lo [27] HANGUL SYLLABLE DUG..HANGUL SYLLABLE DUH
B46D..B487 ; LVT # Lo [27] HANGUL SYLLABLE DWEOG..HANGUL SYLLABLE DWEOH
B489..B4A3 ; LVT # Lo [27] HANGUL SYLLABLE DWEG..HANGUL SYLLABLE DWEH
B4A5..B4BF ; LVT # Lo [27] HANGUL SYLLABLE DWIG..HANGUL SYLLABLE DWIH
B4C1..B4DB ; LVT # Lo [27] HANGUL SYLLABLE DYUG..HANGUL SYLLABLE DYUH
B4DD..B4F7 ; LVT # Lo [27] HANGUL SYLLABLE DEUG..HANGUL SYLLABLE DEUH
B4F9..B513 ; LVT # Lo [27] HANGUL SYLLABLE DYIG..HANGUL SYLLABLE DYIH
B515..B52F ; LVT # Lo [27] HANGUL SYLLABLE DIG..HANGUL SYLLABLE DIH
B531..B54B ; LVT # Lo [27] HANGUL SYLLABLE DDAG..HANGUL SYLLABLE DDAH
B54D..B567 ; LVT # Lo [27] HANGUL SYLLABLE DDAEG..HANGUL SYLLABLE DDAEH
B569..B583 ; LVT # Lo [27] HANGUL SYLLABLE DDYAG..HANGUL SYLLABLE DDYAH
B585..B59F ; LVT # Lo [27] HANGUL SYLLABLE DDYAEG..HANGUL SYLLABLE DDYAEH
B5A1..B5BB ; LVT # Lo [27] HANGUL SYLLABLE DDEOG..HANGUL SYLLABLE DDEOH
B5BD..B5D7 ; LVT # Lo [27] HANGUL SYLLABLE DDEG..HANGUL SYLLABLE DDEH
B5D9..B5F3 ; LVT # Lo [27] HANGUL SYLLABLE DDYEOG..HANGUL SYLLABLE DDYEOH
B5F5..B60F ; LVT # Lo [27] HANGUL SYLLABLE DDYEG..HANGUL SYLLABLE DDYEH
B611..B62B ; LVT # Lo [27] HANGUL SYLLABLE DDOG..HANGUL SYLLABLE DDOH
B62D..B647 ; LVT # Lo [27] HANGUL SYLLABLE DDWAG..HANGUL SYLLABLE DDWAH
B649..B663 ; LVT # Lo [27] HANGUL SYLLABLE DDWAEG..HANGUL SYLLABLE DDWAEH
B665..B67F ; LVT # Lo [27] HANGUL SYLLABLE DDOEG..HANGUL SYLLABLE DDOEH
B681..B69B ; LVT # Lo [27] HANGUL SYLLABLE DDYOG..HANGUL SYLLABLE DDYOH
B69D..B6B7 ; LVT # Lo [27] HANGUL SYLLABLE DDUG..HANGUL SYLLABLE DDUH
B6B9..B6D3 ; LVT # Lo [27] HANGUL SYLLABLE DDWEOG..HANGUL SYLLABLE DDWEOH
B6D5..B6EF ; LVT # Lo [27] HANGUL SYLLABLE DDWEG..HANGUL SYLLABLE DDWEH
B6F1..B70B ; LVT # Lo [27] HANGUL SYLLABLE DDWIG..HANGUL SYLLABLE DDWIH
B70D..B727 ; LVT # Lo [27] HANGUL SYLLABLE DDYUG..HANGUL SYLLABLE DDYUH
B729..B743 ; LVT # Lo [27] HANGUL SYLLABLE DDEUG..HANGUL SYLLABLE DDEUH
B745..B75F ; LVT # Lo [27] HANGUL SYLLABLE DDYIG..HANGUL SYLLABLE DDYIH
B761..B77B ; LVT # Lo [27] HANGUL SYLLABLE DDIG..HANGUL SYLLABLE DDIH
B77D..B797 ; LVT # Lo [27] HANGUL SYLLABLE RAG..HANGUL SYLLABLE RAH
B799..B7B3 ; LVT # Lo [27] HANGUL SYLLABLE RAEG..HANGUL SYLLABLE RAEH
B7B5..B7CF ; LVT # Lo [27] HANGUL SYLLABLE RYAG..HANGUL SYLLABLE RYAH
B7D1..B7EB ; LVT # Lo [27] HANGUL SYLLABLE RYAEG..HANGUL SYLLABLE RYAEH
B7ED..B807 ; LVT # Lo [27] HANGUL SYLLABLE REOG..HANGUL SYLLABLE REOH
B809..B823 ; LVT # Lo [27] HANGUL SYLLABLE REG..HANGUL SYLLABLE REH
B825..B83F ; LVT # Lo [27] HANGUL SYLLABLE RYEOG..HANGUL SYLLABLE RYEOH
B841..B85B ; LVT # Lo [27] HANGUL SYLLABLE RYEG..HANGUL SYLLABLE RYEH
B85D..B877 ; LVT # Lo [27] HANGUL SYLLABLE ROG..HANGUL SYLLABLE ROH
B879..B893 ; LVT # Lo [27] HANGUL SYLLABLE RWAG..HANGUL SYLLABLE RWAH
B895..B8AF ; LVT # Lo [27] HANGUL SYLLABLE RWAEG..HANGUL SYLLABLE RWAEH
B8B1..B8CB ; LVT # Lo [27] HANGUL SYLLABLE ROEG..HANGUL SYLLABLE ROEH
B8CD..B8E7 ; LVT # Lo [27] HANGUL SYLLABLE RYOG..HANGUL SYLLABLE RYOH
B8E9..B903 ; LVT # Lo [27] HANGUL SYLLABLE RUG..HANGUL SYLLABLE RUH
B905..B91F ; LVT # Lo [27] HANGUL SYLLABLE RWEOG..HANGUL SYLLABLE RWEOH
B921..B93B ; LVT # Lo [27] HANGUL SYLLABLE RWEG..HANGUL SYLLABLE RWEH
B93D..B957 ; LVT # Lo [27] HANGUL SYLLABLE RWIG..HANGUL SYLLABLE RWIH
B959..B973 ; LVT # Lo [27] HANGUL SYLLABLE RYUG..HANGUL SYLLABLE RYUH
B975..B98F ; LVT # Lo [27] HANGUL SYLLABLE REUG..HANGUL SYLLABLE REUH
B991..B9AB ; LVT # Lo [27] HANGUL SYLLABLE RYIG..HANGUL SYLLABLE RYIH
B9AD..B9C7 ; LVT # Lo [27] HANGUL SYLLABLE RIG..HANGUL SYLLABLE RIH
B9C9..B9E3 ; LVT # Lo [27] HANGUL SYLLABLE MAG..HANGUL SYLLABLE MAH
B9E5..B9FF ; LVT # Lo [27] HANGUL SYLLABLE MAEG..HANGUL SYLLABLE MAEH
BA01..BA1B ; LVT # Lo [27] HANGUL SYLLABLE MYAG..HANGUL SYLLABLE MYAH
BA1D..BA37 ; LVT # Lo [27] HANGUL SYLLABLE MYAEG..HANGUL SYLLABLE MYAEH
BA39..BA53 ; LVT # Lo [27] HANGUL SYLLABLE MEOG..HANGUL SYLLABLE MEOH
BA55..BA6F ; LVT # Lo [27] HANGUL SYLLABLE MEG..HANGUL SYLLABLE MEH
BA71..BA8B ; LVT # Lo [27] HANGUL SYLLABLE MYEOG..HANGUL SYLLABLE MYEOH
BA8D..BAA7 ; LVT # Lo [27] HANGUL SYLLABLE MYEG..HANGUL SYLLABLE MYEH
BAA9..BAC3 ; LVT # Lo [27] HANGUL SYLLABLE MOG..HANGUL SYLLABLE MOH
BAC5..BADF ; LVT # Lo [27] HANGUL SYLLABLE MWAG..HANGUL SYLLABLE MWAH
BAE1..BAFB ; LVT # Lo [27] HANGUL SYLLABLE MWAEG..HANGUL SYLLABLE MWAEH
BAFD..BB17 ; LVT # Lo [27] HANGUL SYLLABLE MOEG..HANGUL SYLLABLE MOEH
BB19..BB33 ; LVT # Lo [27] HANGUL SYLLABLE MYOG..HANGUL SYLLABLE MYOH
BB35..BB4F ; LVT # Lo [27] HANGUL SYLLABLE MUG..HANGUL SYLLABLE MUH
BB51..BB6B ; LVT # Lo [27] HANGUL SYLLABLE MWEOG..HANGUL SYLLABLE MWEOH
BB6D..BB87 ; LVT # Lo [27] HANGUL SYLLABLE MWEG..HANGUL SYLLABLE MWEH
BB89..BBA3 ; LVT # Lo [27] HANGUL SYLLABLE MWIG..HANGUL SYLLABLE MWIH
BBA5..BBBF ; LVT # Lo [27] HANGUL SYLLABLE MYUG..HANGUL SYLLABLE MYUH
BBC1..BBDB ; LVT # Lo [27] HANGUL SYLLABLE MEUG..HANGUL SYLLABLE MEUH
BBDD..BBF7 ; LVT # Lo [27] HANGUL SYLLABLE MYIG..HANGUL SYLLABLE MYIH
BBF9..BC13 ; LVT # Lo [27] HANGUL SYLLABLE MIG..HANGUL SYLLABLE MIH
BC15..BC2F ; LVT # Lo [27] HANGUL SYLLABLE BAG..HANGUL SYLLABLE BAH
BC31..BC4B ; LVT # Lo [27] HANGUL SYLLABLE BAEG..HANGUL SYLLABLE BAEH
BC4D..BC67 ; LVT # Lo [27] HANGUL SYLLABLE BYAG..HANGUL SYLLABLE BYAH
BC69..BC83 ; LVT # Lo [27] HANGUL SYLLABLE BYAEG..HANGUL SYLLABLE BYAEH
BC85..BC9F ; LVT # Lo [27] HANGUL SYLLABLE BEOG..HANGUL SYLLABLE BEOH
BCA1..BCBB ; LVT # Lo [27] HANGUL SYLLABLE BEG..HANGUL SYLLABLE BEH
BCBD..BCD7 ; LVT # Lo [27] HANGUL SYLLABLE BYEOG..HANGUL SYLLABLE BYEOH
BCD9..BCF3 ; LVT # Lo [27] HANGUL SYLLABLE BYEG..HANGUL SYLLABLE BYEH
BCF5..BD0F ; LVT # Lo [27] HANGUL SYLLABLE BOG..HANGUL SYLLABLE BOH
BD11..BD2B ; LVT # Lo [27] HANGUL SYLLABLE BWAG..HANGUL SYLLABLE BWAH
BD2D..BD47 ; LVT # Lo [27] HANGUL SYLLABLE BWAEG..HANGUL SYLLABLE BWAEH
BD49..BD63 ; LVT # Lo [27] HANGUL SYLLABLE BOEG..HANGUL SYLLABLE BOEH
BD65..BD7F ; LVT # Lo [27] HANGUL SYLLABLE BYOG..HANGUL SYLLABLE BYOH
BD81..BD9B ; LVT # Lo [27] HANGUL SYLLABLE BUG..HANGUL SYLLABLE BUH
BD9D..BDB7 ; LVT # Lo [27] HANGUL SYLLABLE BWEOG..HANGUL SYLLABLE BWEOH
BDB9..BDD3 ; LVT # Lo [27] HANGUL SYLLABLE BWEG..HANGUL SYLLABLE BWEH
BDD5..BDEF ; LVT # Lo [27] HANGUL SYLLABLE BWIG..HANGUL SYLLABLE BWIH
BDF1..BE0B ; LVT # Lo [27] HANGUL SYLLABLE BYUG..HANGUL SYLLABLE BYUH
BE0D..BE27 ; LVT # Lo [27] HANGUL SYLLABLE BEUG..HANGUL SYLLABLE BEUH
BE29..BE43 ; LVT # Lo [27] HANGUL SYLLABLE BYIG..HANGUL SYLLABLE BYIH
BE45..BE5F ; LVT # Lo [27] HANGUL SYLLABLE BIG..HANGUL SYLLABLE BIH
BE61..BE7B ; LVT # Lo [27] HANGUL SYLLABLE BBAG..HANGUL SYLLABLE BBAH
BE7D..BE97 ; LVT # Lo [27] HANGUL SYLLABLE BBAEG..HANGUL SYLLABLE BBAEH
BE99..BEB3 ; LVT # Lo [27] HANGUL SYLLABLE BBYAG..HANGUL SYLLABLE BBYAH
BEB5..BECF ; LVT # Lo [27] HANGUL SYLLABLE BBYAEG..HANGUL SYLLABLE BBYAEH
BED1..BEEB ; LVT # Lo [27] HANGUL SYLLABLE BBEOG..HANGUL SYLLABLE BBEOH
BEED..BF07 ; LVT # Lo [27] HANGUL SYLLABLE BBEG..HANGUL SYLLABLE BBEH
BF09..BF23 ; LVT # Lo [27] HANGUL SYLLABLE BBYEOG..HANGUL SYLLABLE BBYEOH
BF25..BF3F ; LVT # Lo [27] HANGUL SYLLABLE BBYEG..HANGUL SYLLABLE BBYEH
BF41..BF5B ; LVT # Lo [27] HANGUL SYLLABLE BBOG..HANGUL SYLLABLE BBOH
BF5D..BF77 ; LVT # Lo [27] HANGUL SYLLABLE BBWAG..HANGUL SYLLABLE BBWAH
BF79..BF93 ; LVT # Lo [27] HANGUL SYLLABLE BBWAEG..HANGUL SYLLABLE BBWAEH
BF95..BFAF ; LVT # Lo [27] HANGUL SYLLABLE BBOEG..HANGUL SYLLABLE BBOEH
BFB1..BFCB ; LVT # Lo [27] HANGUL SYLLABLE BBYOG..HANGUL SYLLABLE BBYOH
BFCD..BFE7 ; LVT # Lo [27] HANGUL SYLLABLE BBUG..HANGUL SYLLABLE BBUH
BFE9..C003 ; LVT # Lo [27] HANGUL SYLLABLE BBWEOG..HANGUL SYLLABLE BBWEOH
C005..C01F ; LVT # Lo [27] HANGUL SYLLABLE BBWEG..HANGUL SYLLABLE BBWEH
C021..C03B ; LVT # Lo [27] HANGUL SYLLABLE BBWIG..HANGUL SYLLABLE BBWIH
C03D..C057 ; LVT # Lo [27] HANGUL SYLLABLE BBYUG..HANGUL SYLLABLE BBYUH
C059..C073 ; LVT # Lo [27] HANGUL SYLLABLE BBEUG..HANGUL SYLLABLE BBEUH
C075..C08F ; LVT # Lo [27] HANGUL SYLLABLE BBYIG..HANGUL SYLLABLE BBYIH
C091..C0AB ; LVT # Lo [27] HANGUL SYLLABLE BBIG..HANGUL SYLLABLE BBIH
C0AD..C0C7 ; LVT # Lo [27] HANGUL SYLLABLE SAG..HANGUL SYLLABLE SAH
C0C9..C0E3 ; LVT # Lo [27] HANGUL SYLLABLE SAEG..HANGUL SYLLABLE SAEH
C0E5..C0FF ; LVT # Lo [27] HANGUL SYLLABLE SYAG..HANGUL SYLLABLE SYAH
C101..C11B ; LVT # Lo [27] HANGUL SYLLABLE SYAEG..HANGUL SYLLABLE SYAEH
C11D..C137 ; LVT # Lo [27] HANGUL SYLLABLE SEOG..HANGUL SYLLABLE SEOH
C139..C153 ; LVT # Lo [27] HANGUL SYLLABLE SEG..HANGUL SYLLABLE SEH
C155..C16F ; LVT # Lo [27] HANGUL SYLLABLE SYEOG..HANGUL SYLLABLE SYEOH
C171..C18B ; LVT # Lo [27] HANGUL SYLLABLE SYEG..HANGUL SYLLABLE SYEH
C18D..C1A7 ; LVT # Lo [27] HANGUL SYLLABLE SOG..HANGUL SYLLABLE SOH
C1A9..C1C3 ; LVT # Lo [27] HANGUL SYLLABLE SWAG..HANGUL SYLLABLE SWAH
C1C5..C1DF ; LVT # Lo [27] HANGUL SYLLABLE SWAEG..HANGUL SYLLABLE SWAEH
C1E1..C1FB ; LVT # Lo [27] HANGUL SYLLABLE SOEG..HANGUL SYLLABLE SOEH
C1FD..C217 ; LVT # Lo [27] HANGUL SYLLABLE SYOG..HANGUL SYLLABLE SYOH
C219..C233 ; LVT # Lo [27] HANGUL SYLLABLE SUG..HANGUL SYLLABLE SUH
C235..C24F ; LVT # Lo [27] HANGUL SYLLABLE SWEOG..HANGUL SYLLABLE SWEOH
C251..C26B ; LVT # Lo [27] HANGUL SYLLABLE SWEG..HANGUL SYLLABLE SWEH
C26D..C287 ; LVT # Lo [27] HANGUL SYLLABLE SWIG..HANGUL SYLLABLE SWIH
C289..C2A3 ; LVT # Lo [27] HANGUL SYLLABLE SYUG..HANGUL SYLLABLE SYUH
C2A5..C2BF ; LVT # Lo [27] HANGUL SYLLABLE SEUG..HANGUL SYLLABLE SEUH
C2C1..C2DB ; LVT # Lo [27] HANGUL SYLLABLE SYIG..HANGUL SYLLABLE SYIH
C2DD..C2F7 ; LVT # Lo [27] HANGUL SYLLABLE SIG..HANGUL SYLLABLE SIH
C2F9..C313 ; LVT # Lo [27] HANGUL SYLLABLE SSAG..HANGUL SYLLABLE SSAH
C315..C32F ; LVT # Lo [27] HANGUL SYLLABLE SSAEG..HANGUL SYLLABLE SSAEH
C331..C34B ; LVT # Lo [27] HANGUL SYLLABLE SSYAG..HANGUL SYLLABLE SSYAH
C34D..C367 ; LVT # Lo [27] HANGUL SYLLABLE SSYAEG..HANGUL SYLLABLE SSYAEH
C369..C383 ; LVT # Lo [27] HANGUL SYLLABLE SSEOG..HANGUL SYLLABLE SSEOH
C385..C39F ; LVT # Lo [27] HANGUL SYLLABLE SSEG..HANGUL SYLLABLE SSEH
C3A1..C3BB ; LVT # Lo [27] HANGUL SYLLABLE SSYEOG..HANGUL SYLLABLE SSYEOH
C3BD..C3D7 ; LVT # Lo [27] HANGUL SYLLABLE SSYEG..HANGUL SYLLABLE SSYEH
C3D9..C3F3 ; LVT # Lo [27] HANGUL SYLLABLE SSOG..HANGUL SYLLABLE SSOH
C3F5..C40F ; LVT # Lo [27] HANGUL SYLLABLE SSWAG..HANGUL SYLLABLE SSWAH
C411..C42B ; LVT # Lo [27] HANGUL SYLLABLE SSWAEG..HANGUL SYLLABLE SSWAEH
C42D..C447 ; LVT # Lo [27] HANGUL SYLLABLE SSOEG..HANGUL SYLLABLE SSOEH
C449..C463 ; LVT # Lo [27] HANGUL SYLLABLE SSYOG..HANGUL SYLLABLE SSYOH
C465..C47F ; LVT # Lo [27] HANGUL SYLLABLE SSUG..HANGUL SYLLABLE SSUH
C481..C49B ; LVT # Lo [27] HANGUL SYLLABLE SSWEOG..HANGUL SYLLABLE SSWEOH
C49D..C4B7 ; LVT # Lo [27] HANGUL SYLLABLE SSWEG..HANGUL SYLLABLE SSWEH
C4B9..C4D3 ; LVT # Lo [27] HANGUL SYLLABLE SSWIG..HANGUL SYLLABLE SSWIH
C4D5..C4EF ; LVT # Lo [27] HANGUL SYLLABLE SSYUG..HANGUL SYLLABLE SSYUH
C4F1..C50B ; LVT # Lo [27] HANGUL SYLLABLE SSEUG..HANGUL SYLLABLE SSEUH
C50D..C527 ; LVT # Lo [27] HANGUL SYLLABLE SSYIG..HANGUL SYLLABLE SSYIH
C529..C543 ; LVT # Lo [27] HANGUL SYLLABLE SSIG..HANGUL SYLLABLE SSIH
C545..C55F ; LVT # Lo [27] HANGUL SYLLABLE AG..HANGUL SYLLABLE AH
C561..C57B ; LVT # Lo [27] HANGUL SYLLABLE AEG..HANGUL SYLLABLE AEH
C57D..C597 ; LVT # Lo [27] HANGUL SYLLABLE YAG..HANGUL SYLLABLE YAH
C599..C5B3 ; LVT # Lo [27] HANGUL SYLLABLE YAEG..HANGUL SYLLABLE YAEH
C5B5..C5CF ; LVT # Lo [27] HANGUL SYLLABLE EOG..HANGUL SYLLABLE EOH
C5D1..C5EB ; LVT # Lo [27] HANGUL SYLLABLE EG..HANGUL SYLLABLE EH
C5ED..C607 ; LVT # Lo [27] HANGUL SYLLABLE YEOG..HANGUL SYLLABLE YEOH
C609..C623 ; LVT # Lo [27] HANGUL SYLLABLE YEG..HANGUL SYLLABLE YEH
C625..C63F ; LVT # Lo [27] HANGUL SYLLABLE OG..HANGUL SYLLABLE OH
C641..C65B ; LVT # Lo [27] HANGUL SYLLABLE WAG..HANGUL SYLLABLE WAH
C65D..C677 ; LVT # Lo [27] HANGUL SYLLABLE WAEG..HANGUL SYLLABLE WAEH
C679..C693 ; LVT # Lo [27] HANGUL SYLLABLE OEG..HANGUL SYLLABLE OEH
C695..C6AF ; LVT # Lo [27] HANGUL SYLLABLE YOG..HANGUL SYLLABLE YOH
C6B1..C6CB ; LVT # Lo [27] HANGUL SYLLABLE UG..HANGUL SYLLABLE UH
C6CD..C6E7 ; LVT # Lo [27] HANGUL SYLLABLE WEOG..HANGUL SYLLABLE WEOH
C6E9..C703 ; LVT # Lo [27] HANGUL SYLLABLE WEG..HANGUL SYLLABLE WEH
C705..C71F ; LVT # Lo [27] HANGUL SYLLABLE WIG..HANGUL SYLLABLE WIH
C721..C73B ; LVT # Lo [27] HANGUL SYLLABLE YUG..HANGUL SYLLABLE YUH
C73D..C757 ; LVT # Lo [27] HANGUL SYLLABLE EUG..HANGUL SYLLABLE EUH
C759..C773 ; LVT # Lo [27] HANGUL SYLLABLE YIG..HANGUL SYLLABLE YIH
C775..C78F ; LVT # Lo [27] HANGUL SYLLABLE IG..HANGUL SYLLABLE IH
C791..C7AB ; LVT # Lo [27] HANGUL SYLLABLE JAG..HANGUL SYLLABLE JAH
C7AD..C7C7 ; LVT # Lo [27] HANGUL SYLLABLE JAEG..HANGUL SYLLABLE JAEH
C7C9..C7E3 ; LVT # Lo [27] HANGUL SYLLABLE JYAG..HANGUL SYLLABLE JYAH
C7E5..C7FF ; LVT # Lo [27] HANGUL SYLLABLE JYAEG..HANGUL SYLLABLE JYAEH
C801..C81B ; LVT # Lo [27] HANGUL SYLLABLE JEOG..HANGUL SYLLABLE JEOH
C81D..C837 ; LVT # Lo [27] HANGUL SYLLABLE JEG..HANGUL SYLLABLE JEH
C839..C853 ; LVT # Lo [27] HANGUL SYLLABLE JYEOG..HANGUL SYLLABLE JYEOH
C855..C86F ; LVT # Lo [27] HANGUL SYLLABLE JYEG..HANGUL SYLLABLE JYEH
C871..C88B ; LVT # Lo [27] HANGUL SYLLABLE JOG..HANGUL SYLLABLE JOH
C88D..C8A7 ; LVT # Lo [27] HANGUL SYLLABLE JWAG..HANGUL SYLLABLE JWAH
C8A9..C8C3 ; LVT # Lo [27] HANGUL SYLLABLE JWAEG..HANGUL SYLLABLE JWAEH
C8C5..C8DF ; LVT # Lo [27] HANGUL SYLLABLE JOEG..HANGUL SYLLABLE JOEH
C8E1..C8FB ; LVT # Lo [27] HANGUL SYLLABLE JYOG..HANGUL SYLLABLE JYOH
C8FD..C917 ; LVT # Lo [27] HANGUL SYLLABLE JUG..HANGUL SYLLABLE JUH
C919..C933 ; LVT # Lo [27] HANGUL SYLLABLE JWEOG..HANGUL SYLLABLE JWEOH
C935..C94F ; LVT # Lo [27] HANGUL SYLLABLE JWEG..HANGUL SYLLABLE JWEH
C951..C96B ; LVT # Lo [27] HANGUL SYLLABLE JWIG..HANGUL SYLLABLE JWIH
C96D..C987 ; LVT # Lo [27] HANGUL SYLLABLE JYUG..HANGUL SYLLABLE JYUH
C989..C9A3 ; LVT # Lo [27] HANGUL SYLLABLE JEUG..HANGUL SYLLABLE JEUH
C9A5..C9BF ; LVT # Lo [27] HANGUL SYLLABLE JYIG..HANGUL SYLLABLE JYIH
C9C1..C9DB ; LVT # Lo [27] HANGUL SYLLABLE JIG..HANGUL SYLLABLE JIH
C9DD..C9F7 ; LVT # Lo [27] HANGUL SYLLABLE JJAG..HANGUL SYLLABLE JJAH
C9F9..CA13 ; LVT # Lo [27] HANGUL SYLLABLE JJAEG..HANGUL SYLLABLE JJAEH
CA15..CA2F ; LVT # Lo [27] HANGUL SYLLABLE JJYAG..HANGUL SYLLABLE JJYAH
CA31..CA4B ; LVT # Lo [27] HANGUL SYLLABLE JJYAEG..HANGUL SYLLABLE JJYAEH
CA4D..CA67 ; LVT # Lo [27] HANGUL SYLLABLE JJEOG..HANGUL SYLLABLE JJEOH
CA69..CA83 ; LVT # Lo [27] HANGUL SYLLABLE JJEG..HANGUL SYLLABLE JJEH
CA85..CA9F ; LVT # Lo [27] HANGUL SYLLABLE JJYEOG..HANGUL SYLLABLE JJYEOH
CAA1..CABB ; LVT # Lo [27] HANGUL SYLLABLE JJYEG..HANGUL SYLLABLE JJYEH
CABD..CAD7 ; LVT # Lo [27] HANGUL SYLLABLE JJOG..HANGUL SYLLABLE JJOH
CAD9..CAF3 ; LVT # Lo [27] HANGUL SYLLABLE JJWAG..HANGUL SYLLABLE JJWAH
CAF5..CB0F ; LVT # Lo [27] HANGUL SYLLABLE JJWAEG..HANGUL SYLLABLE JJWAEH
CB11..CB2B ; LVT # Lo [27] HANGUL SYLLABLE JJOEG..HANGUL SYLLABLE JJOEH
CB2D..CB47 ; LVT # Lo [27] HANGUL SYLLABLE JJYOG..HANGUL SYLLABLE JJYOH
CB49..CB63 ; LVT # Lo [27] HANGUL SYLLABLE JJUG..HANGUL SYLLABLE JJUH
CB65..CB7F ; LVT # Lo [27] HANGUL SYLLABLE JJWEOG..HANGUL SYLLABLE JJWEOH
CB81..CB9B ; LVT # Lo [27] HANGUL SYLLABLE JJWEG..HANGUL SYLLABLE JJWEH
CB9D..CBB7 ; LVT # Lo [27] HANGUL SYLLABLE JJWIG..HANGUL SYLLABLE JJWIH
CBB9..CBD3 ; LVT # Lo [27] HANGUL SYLLABLE JJYUG..HANGUL SYLLABLE JJYUH
CBD5..CBEF ; LVT # Lo [27] HANGUL SYLLABLE JJEUG..HANGUL SYLLABLE JJEUH
CBF1..CC0B ; LVT # Lo [27] HANGUL SYLLABLE JJYIG..HANGUL SYLLABLE JJYIH
CC0D..CC27 ; LVT # Lo [27] HANGUL SYLLABLE JJIG..HANGUL SYLLABLE JJIH
CC29..CC43 ; LVT # Lo [27] HANGUL SYLLABLE CAG..HANGUL SYLLABLE CAH
CC45..CC5F ; LVT # Lo [27] HANGUL SYLLABLE CAEG..HANGUL SYLLABLE CAEH
CC61..CC7B ; LVT # Lo [27] HANGUL SYLLABLE CYAG..HANGUL SYLLABLE CYAH
CC7D..CC97 ; LVT # Lo [27] HANGUL SYLLABLE CYAEG..HANGUL SYLLABLE CYAEH
CC99..CCB3 ; LVT # Lo [27] HANGUL SYLLABLE CEOG..HANGUL SYLLABLE CEOH
CCB5..CCCF ; LVT # Lo [27] HANGUL SYLLABLE CEG..HANGUL SYLLABLE CEH
CCD1..CCEB ; LVT # Lo [27] HANGUL SYLLABLE CYEOG..HANGUL SYLLABLE CYEOH
CCED..CD07 ; LVT # Lo [27] HANGUL SYLLABLE CYEG..HANGUL SYLLABLE CYEH
CD09..CD23 ; LVT # Lo [27] HANGUL SYLLABLE COG..HANGUL SYLLABLE COH
CD25..CD3F ; LVT # Lo [27] HANGUL SYLLABLE CWAG..HANGUL SYLLABLE CWAH
CD41..CD5B ; LVT # Lo [27] HANGUL SYLLABLE CWAEG..HANGUL SYLLABLE CWAEH
CD5D..CD77 ; LVT # Lo [27] HANGUL SYLLABLE COEG..HANGUL SYLLABLE COEH
CD79..CD93 ; LVT # Lo [27] HANGUL SYLLABLE CYOG..HANGUL SYLLABLE CYOH
CD95..CDAF ; LVT # Lo [27] HANGUL SYLLABLE CUG..HANGUL SYLLABLE CUH
CDB1..CDCB ; LVT # Lo [27] HANGUL SYLLABLE CWEOG..HANGUL SYLLABLE CWEOH
CDCD..CDE7 ; LVT # Lo [27] HANGUL SYLLABLE CWEG..HANGUL SYLLABLE CWEH
CDE9..CE03 ; LVT # Lo [27] HANGUL SYLLABLE CWIG..HANGUL SYLLABLE CWIH
CE05..CE1F ; LVT # Lo [27] HANGUL SYLLABLE CYUG..HANGUL SYLLABLE CYUH
CE21..CE3B ; LVT # Lo [27] HANGUL SYLLABLE CEUG..HANGUL SYLLABLE CEUH
CE3D..CE57 ; LVT # Lo [27] HANGUL SYLLABLE CYIG..HANGUL SYLLABLE CYIH
CE59..CE73 ; LVT # Lo [27] HANGUL SYLLABLE CIG..HANGUL SYLLABLE CIH
CE75..CE8F ; LVT # Lo [27] HANGUL SYLLABLE KAG..HANGUL SYLLABLE KAH
CE91..CEAB ; LVT # Lo [27] HANGUL SYLLABLE KAEG..HANGUL SYLLABLE KAEH
CEAD..CEC7 ; LVT # Lo [27] HANGUL SYLLABLE KYAG..HANGUL SYLLABLE KYAH
CEC9..CEE3 ; LVT # Lo [27] HANGUL SYLLABLE KYAEG..HANGUL SYLLABLE KYAEH
CEE5..CEFF ; LVT # Lo [27] HANGUL SYLLABLE KEOG..HANGUL SYLLABLE KEOH
CF01..CF1B ; LVT # Lo [27] HANGUL SYLLABLE KEG..HANGUL SYLLABLE KEH
CF1D..CF37 ; LVT # Lo [27] HANGUL SYLLABLE KYEOG..HANGUL SYLLABLE KYEOH
CF39..CF53 ; LVT # Lo [27] HANGUL SYLLABLE KYEG..HANGUL SYLLABLE KYEH
CF55..CF6F ; LVT # Lo [27] HANGUL SYLLABLE KOG..HANGUL SYLLABLE KOH
CF71..CF8B ; LVT # Lo [27] HANGUL SYLLABLE KWAG..HANGUL SYLLABLE KWAH
CF8D..CFA7 ; LVT # Lo [27] HANGUL SYLLABLE KWAEG..HANGUL SYLLABLE KWAEH
CFA9..CFC3 ; LVT # Lo [27] HANGUL SYLLABLE KOEG..HANGUL SYLLABLE KOEH
CFC5..CFDF ; LVT # Lo [27] HANGUL SYLLABLE KYOG..HANGUL SYLLABLE KYOH
CFE1..CFFB ; LVT # Lo [27] HANGUL SYLLABLE KUG..HANGUL SYLLABLE KUH
CFFD..D017 ; LVT # Lo [27] HANGUL SYLLABLE KWEOG..HANGUL SYLLABLE KWEOH
D019..D033 ; LVT # Lo [27] HANGUL SYLLABLE KWEG..HANGUL SYLLABLE KWEH
D035..D04F ; LVT # Lo [27] HANGUL SYLLABLE KWIG..HANGUL SYLLABLE KWIH
D051..D06B ; LVT # Lo [27] HANGUL SYLLABLE KYUG..HANGUL SYLLABLE KYUH
D06D..D087 ; LVT # Lo [27] HANGUL SYLLABLE KEUG..HANGUL SYLLABLE KEUH
D089..D0A3 ; LVT # Lo [27] HANGUL SYLLABLE KYIG..HANGUL SYLLABLE KYIH
D0A5..D0BF ; LVT # Lo [27] HANGUL SYLLABLE KIG..HANGUL SYLLABLE KIH
D0C1..D0DB ; LVT # Lo [27] HANGUL SYLLABLE TAG..HANGUL SYLLABLE TAH
D0DD..D0F7 ; LVT # Lo [27] HANGUL SYLLABLE TAEG..HANGUL SYLLABLE TAEH
D0F9..D113 ; LVT # Lo [27] HANGUL SYLLABLE TYAG..HANGUL SYLLABLE TYAH
D115..D12F ; LVT # Lo [27] HANGUL SYLLABLE TYAEG..HANGUL SYLLABLE TYAEH
D131..D14B ; LVT # Lo [27] HANGUL SYLLABLE TEOG..HANGUL SYLLABLE TEOH
D14D..D167 ; LVT # Lo [27] HANGUL SYLLABLE TEG..HANGUL SYLLABLE TEH
D169..D183 ; LVT # Lo [27] HANGUL SYLLABLE TYEOG..HANGUL SYLLABLE TYEOH
D185..D19F ; LVT # Lo [27] HANGUL SYLLABLE TYEG..HANGUL SYLLABLE TYEH
D1A1..D1BB ; LVT # Lo [27] HANGUL SYLLABLE TOG..HANGUL SYLLABLE TOH
D1BD..D1D7 ; LVT # Lo [27] HANGUL SYLLABLE TWAG..HANGUL SYLLABLE TWAH
D1D9..D1F3 ; LVT # Lo [27] HANGUL SYLLABLE TWAEG..HANGUL SYLLABLE TWAEH
D1F5..D20F ; LVT # Lo [27] HANGUL SYLLABLE TOEG..HANGUL SYLLABLE TOEH
D211..D22B ; LVT # Lo [27] HANGUL SYLLABLE TYOG..HANGUL SYLLABLE TYOH
D22D..D247 ; LVT # Lo [27] HANGUL SYLLABLE TUG..HANGUL SYLLABLE TUH
D249..D263 ; LVT # Lo [27] HANGUL SYLLABLE TWEOG..HANGUL SYLLABLE TWEOH
D265..D27F ; LVT # Lo [27] HANGUL SYLLABLE TWEG..HANGUL SYLLABLE TWEH
D281..D29B ; LVT # Lo [27] HANGUL SYLLABLE TWIG..HANGUL SYLLABLE TWIH
D29D..D2B7 ; LVT # Lo [27] HANGUL SYLLABLE TYUG..HANGUL SYLLABLE TYUH
D2B9..D2D3 ; LVT # Lo [27] HANGUL SYLLABLE TEUG..HANGUL SYLLABLE TEUH
D2D5..D2EF ; LVT # Lo [27] HANGUL SYLLABLE TYIG..HANGUL SYLLABLE TYIH
D2F1..D30B ; LVT # Lo [27] HANGUL SYLLABLE TIG..HANGUL SYLLABLE TIH
D30D..D327 ; LVT # Lo [27] HANGUL SYLLABLE PAG..HANGUL SYLLABLE PAH
D329..D343 ; LVT # Lo [27] HANGUL SYLLABLE PAEG..HANGUL SYLLABLE PAEH
D345..D35F ; LVT # Lo [27] HANGUL SYLLABLE PYAG..HANGUL SYLLABLE PYAH
D361..D37B ; LVT # Lo [27] HANGUL SYLLABLE PYAEG..HANGUL SYLLABLE PYAEH
D37D..D397 ; LVT # Lo [27] HANGUL SYLLABLE PEOG..HANGUL SYLLABLE PEOH
D399..D3B3 ; LVT # Lo [27] HANGUL SYLLABLE PEG..HANGUL SYLLABLE PEH
D3B5..D3CF ; LVT # Lo [27] HANGUL SYLLABLE PYEOG..HANGUL SYLLABLE PYEOH
D3D1..D3EB ; LVT # Lo [27] HANGUL SYLLABLE PYEG..HANGUL SYLLABLE PYEH
D3ED..D407 ; LVT # Lo [27] HANGUL SYLLABLE POG..HANGUL SYLLABLE POH
D409..D423 ; LVT # Lo [27] HANGUL SYLLABLE PWAG..HANGUL SYLLABLE PWAH
D425..D43F ; LVT # Lo [27] HANGUL SYLLABLE PWAEG..HANGUL SYLLABLE PWAEH
D441..D45B ; LVT # Lo [27] HANGUL SYLLABLE POEG..HANGUL SYLLABLE POEH
D45D..D477 ; LVT # Lo [27] HANGUL SYLLABLE PYOG..HANGUL SYLLABLE PYOH
D479..D493 ; LVT # Lo [27] HANGUL SYLLABLE PUG..HANGUL SYLLABLE PUH
D495..D4AF ; LVT # Lo [27] HANGUL SYLLABLE PWEOG..HANGUL SYLLABLE PWEOH
D4B1..D4CB ; LVT # Lo [27] HANGUL SYLLABLE PWEG..HANGUL SYLLABLE PWEH
D4CD..D4E7 ; LVT # Lo [27] HANGUL SYLLABLE PWIG..HANGUL SYLLABLE PWIH
D4E9..D503 ; LVT # Lo [27] HANGUL SYLLABLE PYUG..HANGUL SYLLABLE PYUH
D505..D51F ; LVT # Lo [27] HANGUL SYLLABLE PEUG..HANGUL SYLLABLE PEUH
D521..D53B ; LVT # Lo [27] HANGUL SYLLABLE PYIG..HANGUL SYLLABLE PYIH
D53D..D557 ; LVT # Lo [27] HANGUL SYLLABLE PIG..HANGUL SYLLABLE PIH
D559..D573 ; LVT # Lo [27] HANGUL SYLLABLE HAG..HANGUL SYLLABLE HAH
D575..D58F ; LVT # Lo [27] HANGUL SYLLABLE HAEG..HANGUL SYLLABLE HAEH
D591..D5AB ; LVT # Lo [27] HANGUL SYLLABLE HYAG..HANGUL SYLLABLE HYAH
D5AD..D5C7 ; LVT # Lo [27] HANGUL SYLLABLE HYAEG..HANGUL SYLLABLE HYAEH
D5C9..D5E3 ; LVT # Lo [27] HANGUL SYLLABLE HEOG..HANGUL SYLLABLE HEOH
D5E5..D5FF ; LVT # Lo [27] HANGUL SYLLABLE HEG..HANGUL SYLLABLE HEH
D601..D61B ; LVT # Lo [27] HANGUL SYLLABLE HYEOG..HANGUL SYLLABLE HYEOH
D61D..D637 ; LVT # Lo [27] HANGUL SYLLABLE HYEG..HANGUL SYLLABLE HYEH
D639..D653 ; LVT # Lo [27] HANGUL SYLLABLE HOG..HANGUL SYLLABLE HOH
D655..D66F ; LVT # Lo [27] HANGUL SYLLABLE HWAG..HANGUL SYLLABLE HWAH
D671..D68B ; LVT # Lo [27] HANGUL SYLLABLE HWAEG..HANGUL SYLLABLE HWAEH
D68D..D6A7 ; LVT # Lo [27] HANGUL SYLLABLE HOEG..HANGUL SYLLABLE HOEH
D6A9..D6C3 ; LVT # Lo [27] HANGUL SYLLABLE HYOG..HANGUL SYLLABLE HYOH
D6C5..D6DF ; LVT # Lo [27] HANGUL SYLLABLE HUG..HANGUL SYLLABLE HUH
D6E1..D6FB ; LVT # Lo [27] HANGUL SYLLABLE HWEOG..HANGUL SYLLABLE HWEOH
D6FD..D717 ; LVT # Lo [27] HANGUL SYLLABLE HWEG..HANGUL SYLLABLE HWEH
D719..D733 ; LVT # Lo [27] HANGUL SYLLABLE HWIG..HANGUL SYLLABLE HWIH
D735..D74F ; LVT # Lo [27] HANGUL SYLLABLE HYUG..HANGUL SYLLABLE HYUH
D751..D76B ; LVT # Lo [27] HANGUL SYLLABLE HEUG..HANGUL SYLLABLE HEUH
D76D..D787 ; LVT # Lo [27] HANGUL SYLLABLE HYIG..HANGUL SYLLABLE HYIH
D789..D7A3 ; LVT # Lo [27] HANGUL SYLLABLE HIG..HANGUL SYLLABLE HIH
# Total code points: 10773
# EOF

File diff suppressed because it is too large Load Diff

View File

@ -0,0 +1,92 @@
# Jamo-5.0.0.txt
# Date: 2006-07-14, 11:22 PST [KW]
#
# Unicode Character Database
# Copyright (c) 1991-2006 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
# For documentation, see UCD.html
#
# This file defines the Jamo Short Name property.
#
# See Section 3.12 of The Unicode Standard, Version 4.0
# for more information.
#
# Each line contains two fields, separated by a semicolon.
#
# The first field gives the code point, in 4-digit hexadecimal
# form, of a combining jamo character that participates in
# the algorithmic determination of Hangul syllable character names.
# The second field gives the Jamo Short Name as a one-, two-,
# or three-character ASCII string (or in one case, for U+110B,
# the null string).
#
# #############################################################
1100; G # HANGUL CHOSEONG KIYEOK
1101; GG # HANGUL CHOSEONG SSANGKIYEOK
1102; N # HANGUL CHOSEONG NIEUN
1103; D # HANGUL CHOSEONG TIKEUT
1104; DD # HANGUL CHOSEONG SSANGTIKEUT
1105; R # HANGUL CHOSEONG RIEUL
1106; M # HANGUL CHOSEONG MIEUM
1107; B # HANGUL CHOSEONG PIEUP
1108; BB # HANGUL CHOSEONG SSANGPIEUP
1109; S # HANGUL CHOSEONG SIOS
110A; SS # HANGUL CHOSEONG SSANGSIOS
110B; # HANGUL CHOSEONG IEUNG
110C; J # HANGUL CHOSEONG CIEUC
110D; JJ # HANGUL CHOSEONG SSANGCIEUC
110E; C # HANGUL CHOSEONG CHIEUCH
110F; K # HANGUL CHOSEONG KHIEUKH
1110; T # HANGUL CHOSEONG THIEUTH
1111; P # HANGUL CHOSEONG PHIEUPH
1112; H # HANGUL CHOSEONG HIEUH
1161; A # HANGUL JUNGSEONG A
1162; AE # HANGUL JUNGSEONG AE
1163; YA # HANGUL JUNGSEONG YA
1164; YAE # HANGUL JUNGSEONG YAE
1165; EO # HANGUL JUNGSEONG EO
1166; E # HANGUL JUNGSEONG E
1167; YEO # HANGUL JUNGSEONG YEO
1168; YE # HANGUL JUNGSEONG YE
1169; O # HANGUL JUNGSEONG O
116A; WA # HANGUL JUNGSEONG WA
116B; WAE # HANGUL JUNGSEONG WAE
116C; OE # HANGUL JUNGSEONG OE
116D; YO # HANGUL JUNGSEONG YO
116E; U # HANGUL JUNGSEONG U
116F; WEO # HANGUL JUNGSEONG WEO
1170; WE # HANGUL JUNGSEONG WE
1171; WI # HANGUL JUNGSEONG WI
1172; YU # HANGUL JUNGSEONG YU
1173; EU # HANGUL JUNGSEONG EU
1174; YI # HANGUL JUNGSEONG YI
1175; I # HANGUL JUNGSEONG I
11A8; G # HANGUL JONGSEONG KIYEOK
11A9; GG # HANGUL JONGSEONG SSANGKIYEOK
11AA; GS # HANGUL JONGSEONG KIYEOK-SIOS
11AB; N # HANGUL JONGSEONG NIEUN
11AC; NJ # HANGUL JONGSEONG NIEUN-CIEUC
11AD; NH # HANGUL JONGSEONG NIEUN-HIEUH
11AE; D # HANGUL JONGSEONG TIKEUT
11AF; L # HANGUL JONGSEONG RIEUL
11B0; LG # HANGUL JONGSEONG RIEUL-KIYEOK
11B1; LM # HANGUL JONGSEONG RIEUL-MIEUM
11B2; LB # HANGUL JONGSEONG RIEUL-PIEUP
11B3; LS # HANGUL JONGSEONG RIEUL-SIOS
11B4; LT # HANGUL JONGSEONG RIEUL-THIEUTH
11B5; LP # HANGUL JONGSEONG RIEUL-PHIEUPH
11B6; LH # HANGUL JONGSEONG RIEUL-HIEUH
11B7; M # HANGUL JONGSEONG MIEUM
11B8; B # HANGUL JONGSEONG PIEUP
11B9; BS # HANGUL JONGSEONG PIEUP-SIOS
11BA; S # HANGUL JONGSEONG SIOS
11BB; SS # HANGUL JONGSEONG SSANGSIOS
11BC; NG # HANGUL JONGSEONG IEUNG
11BD; J # HANGUL JONGSEONG CIEUC
11BE; C # HANGUL JONGSEONG CHIEUCH
11BF; K # HANGUL JONGSEONG KHIEUKH
11C0; T # HANGUL JONGSEONG THIEUTH
11C1; P # HANGUL JONGSEONG PHIEUPH
11C2; H # HANGUL JONGSEONG HIEUH

File diff suppressed because it is too large Load Diff

View File

@ -0,0 +1,40 @@
# NameAliases-5.0.0.txt
# Date: 2006-05-25, 11:10:00 PST [AF/KW]
#
# This file is a normative contributory data file in the
# Unicode Character Database.
#
# Copyright (c) 2005-2006 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
#
# This file defines the formal name aliases for Unicode characters.
#
# For informative aliases see NamesList.txt
#
# For documentation, see UCD.html and NamesList.html
#
# FORMAT
#
# Each line has two fields
# First field: Code point
# Second field: Alias
#
# In case multiple aliases are assigned, additional aliases
# would be provided on separate lines
#
#-----------------------------------------------------------------
01A2;LATIN CAPITAL LETTER GHA
01A3;LATIN SMALL LETTER GHA
0CDE;KANNADA LETTER LLLA
0E9D;LAO LETTER FO FON
0E9F;LAO LETTER FO FAY
0EA3;LAO LETTER RO
0EA5;LAO LETTER LO
0FD0;TIBETAN MARK BKA- SHOG GI MGO RGYAN
A015;YI SYLLABLE ITERATION MARK
FE18;PRESENTATION FORM FOR VERTICAL RIGHT WHITE LENTICULAR BRACKET
1D0C5;BYZANTINE MUSICAL SYMBOL FTHORA SKLIRON CHROMA VASIS
# Total code points: 11
# EOF

View File

@ -0,0 +1,88 @@
# NamedSequences-5.0.0.txt
# Date: 2006-05-23, 11:01 PST [KW]
#
# Unicode Character Database
# Copyright (c) 1991-2006 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
# For documentation, see UCD.html
#
# Format:
# Name of Sequence; Code Point Sequence for USI
#
# Note: The order of entries in this file is not significant.
# However, entries are generally in script order corresponding
# to block order in the Unicode Standard, to make it easier
# to find entries in the list.
# ================================================
LATIN CAPITAL LETTER A WITH MACRON AND GRAVE;0100 0300
LATIN SMALL LETTER A WITH MACRON AND GRAVE;0101 0300
LATIN CAPITAL LETTER E WITH VERTICAL LINE BELOW;0045 0329
LATIN SMALL LETTER E WITH VERTICAL LINE BELOW;0065 0329
LATIN CAPITAL LETTER E WITH VERTICAL LINE BELOW AND GRAVE;00C8 0329
LATIN SMALL LETTER E WITH VERTICAL LINE BELOW AND GRAVE;00E8 0329
LATIN CAPITAL LETTER E WITH VERTICAL LINE BELOW AND ACUTE;00C9 0329
LATIN SMALL LETTER E WITH VERTICAL LINE BELOW AND ACUTE;00E9 0329
LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND MACRON;00CA 0304
LATIN SMALL LETTER E WITH CIRCUMFLEX AND MACRON;00EA 0304
LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND CARON;00CA 030C
LATIN SMALL LETTER E WITH CIRCUMFLEX AND CARON;00EA 030C
LATIN CAPITAL LETTER I WITH MACRON AND GRAVE;012A 0300
LATIN SMALL LETTER I WITH MACRON AND GRAVE;012B 0300
LATIN SMALL LETTER I WITH DOT ABOVE AND ACUTE;0069 0307 0301
LATIN SMALL LETTER NG WITH TILDE ABOVE;006E 0360 0067
LATIN CAPITAL LETTER O WITH VERTICAL LINE BELOW;004F 0329
LATIN SMALL LETTER O WITH VERTICAL LINE BELOW;006F 0329
LATIN CAPITAL LETTER O WITH VERTICAL LINE BELOW AND GRAVE;00D2 0329
LATIN SMALL LETTER O WITH VERTICAL LINE BELOW AND GRAVE;00F2 0329
LATIN CAPITAL LETTER O WITH VERTICAL LINE BELOW AND ACUTE;00D3 0329
LATIN SMALL LETTER O WITH VERTICAL LINE BELOW AND ACUTE;00F3 0329
LATIN CAPITAL LETTER S WITH VERTICAL LINE BELOW;0053 0329
LATIN SMALL LETTER S WITH VERTICAL LINE BELOW;0073 0329
LATIN CAPITAL LETTER U WITH MACRON AND GRAVE;016A 0300
LATIN SMALL LETTER U WITH MACRON AND GRAVE;016B 0300
GEORGIAN LETTER U-BRJGU;10E3 0302
KHMER CONSONANT SIGN COENG KA;17D2 1780
KHMER CONSONANT SIGN COENG KHA;17D2 1781
KHMER CONSONANT SIGN COENG KO;17D2 1782
KHMER CONSONANT SIGN COENG KHO;17D2 1783
KHMER CONSONANT SIGN COENG NGO;17D2 1784
KHMER CONSONANT SIGN COENG CA;17D2 1785
KHMER CONSONANT SIGN COENG CHA;17D2 1786
KHMER CONSONANT SIGN COENG CO;17D2 1787
KHMER CONSONANT SIGN COENG CHO;17D2 1788
KHMER CONSONANT SIGN COENG NYO;17D2 1789
KHMER CONSONANT SIGN COENG DA;17D2 178A
KHMER CONSONANT SIGN COENG TTHA;17D2 178B
KHMER CONSONANT SIGN COENG DO;17D2 178C
KHMER CONSONANT SIGN COENG TTHO;17D2 178D
KHMER CONSONANT SIGN COENG NA;17D2 178E
KHMER CONSONANT SIGN COENG TA;17D2 178F
KHMER CONSONANT SIGN COENG THA;17D2 1790
KHMER CONSONANT SIGN COENG TO;17D2 1791
KHMER CONSONANT SIGN COENG THO;17D2 1792
KHMER CONSONANT SIGN COENG NO;17D2 1793
KHMER CONSONANT SIGN COENG BA;17D2 1794
KHMER CONSONANT SIGN COENG PHA;17D2 1795
KHMER CONSONANT SIGN COENG PO;17D2 1796
KHMER CONSONANT SIGN COENG PHO;17D2 1797
KHMER CONSONANT SIGN COENG MO;17D2 1798
KHMER CONSONANT SIGN COENG YO;17D2 1799
KHMER CONSONANT SIGN COENG RO;17D2 179A
KHMER CONSONANT SIGN COENG LO;17D2 179B
KHMER CONSONANT SIGN COENG VO;17D2 179C
KHMER CONSONANT SIGN COENG SHA;17D2 179D
KHMER CONSONANT SIGN COENG SSA;17D2 179E
KHMER CONSONANT SIGN COENG SA;17D2 179F
KHMER CONSONANT SIGN COENG HA;17D2 17A0
KHMER CONSONANT SIGN COENG LA;17D2 17A1
KHMER VOWEL SIGN COENG QA;17D2 17A2
KHMER INDEPENDENT VOWEL SIGN COENG QU;17D2 17A7
KHMER INDEPENDENT VOWEL SIGN COENG RY;17D2 17AB
KHMER INDEPENDENT VOWEL SIGN COENG RYY;17D2 17AC
KHMER INDEPENDENT VOWEL SIGN COENG QE;17D2 17AF
KHMER VOWEL SIGN OM;17BB 17C6
KHMER VOWEL SIGN AAM;17B6 17C6
KATAKANA LETTER AINU P;31F7 309A
MODIFIER LETTER EXTRA-HIGH EXTRA-LOW CONTOUR TONE BAR;02E5 02E9

View File

@ -0,0 +1,84 @@
# NamedSequencesProv-5.0.0.txt
# Date: 2006-05-23, 11:33 PST [KW]
#
# Unicode Character Database
# Copyright (c) 1991-2006 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
# For documentation, see UCD.html
#
# Provisional Named Sequences
# Note: This data file contains those named
# sequences which have been designated to be provisional,
# rather than fully approved.
#
# Format:
# Name of Sequence; Code Point Sequence for USI
#
# Note: The order of entries in this file is not significant.
# However, entries are generally in script order corresponding
# to block order in the Unicode Standard, to make it easier
# to find entries in the list.
# ================================================
# Entries from Unicode 4.1.0 version of NamedSequences.txt,
# subsequently disapproved because of potential errors in
# representation.
# GURMUKHI HALF YA;0A2F 0A4D
# GURMUKHI PARI YA;0A4D 0A2F
# Entry removed 2006-05-18:
#
# LATIN SMALL LETTER A WITH ACUTE AND OGONEK;00E1 0328
#
# This entry was removed because the sequence was not in NFC,
# as required. It will be replaced with the NFC version of
# the sequence, based on the Lithuanian additions proposed
# here for a future version of the standard.
# ================================================
# Provisional entries for NamedSequences.txt.
# Proposed additions for Lithuanian. 2006-05-18
LATIN CAPITAL LETTER A WITH OGONEK AND ACUTE;0104 0301
LATIN SMALL LETTER A WITH OGONEK AND ACUTE;0105 0301
LATIN CAPITAL LETTER A WITH OGONEK AND TILDE;0104 0303
LATIN SMALL LETTER A WITH OGONEK AND TILDE;0105 0303
LATIN CAPITAL LETTER E WITH OGONEK AND ACUTE;0118 0301
LATIN SMALL LETTER E WITH OGONEK AND ACUTE;0119 0301
LATIN CAPITAL LETTER E WITH OGONEK AND TILDE;0118 0303
LATIN SMALL LETTER E WITH OGONEK AND TILDE;0119 0303
LATIN CAPITAL LETTER E WITH DOT ABOVE AND ACUTE;0116 0301
LATIN SMALL LETTER E WITH DOT ABOVE AND ACUTE;0117 0301
LATIN CAPITAL LETTER E WITH DOT ABOVE AND TILDE;0116 0303
LATIN SMALL LETTER E WITH DOT ABOVE AND TILDE;0117 0303
LATIN SMALL LETTER I WITH DOT ABOVE AND GRAVE;0069 0307 0300
LATIN SMALL LETTER I WITH DOT ABOVE AND TILDE;0069 0307 0303
LATIN CAPITAL LETTER I WITH OGONEK AND ACUTE;012E 0301
LATIN SMALL LETTER I WITH OGONEK AND DOT ABOVE AND ACUTE;012F 0307 0301
LATIN CAPITAL LETTER I WITH OGONEK AND TILDE;012E 0303
LATIN SMALL LETTER I WITH OGONEK AND DOT ABOVE AND TILDE;012F 0307 0303
LATIN CAPITAL LETTER J WITH TILDE;004A 0303
LATIN SMALL LETTER J WITH DOT ABOVE AND TILDE;006A 0307 0303
LATIN CAPITAL LETTER L WITH TILDE;004C 0303
LATIN SMALL LETTER L WITH TILDE;006C 0303
LATIN CAPITAL LETTER M WITH TILDE;004D 0303
LATIN SMALL LETTER M WITH TILDE;006D 0303
LATIN CAPITAL LETTER R WITH TILDE;0052 0303
LATIN SMALL LETTER R WITH TILDE;0072 0303
LATIN CAPITAL LETTER U WITH OGONEK AND ACUTE;0172 0301
LATIN SMALL LETTER U WITH OGONEK AND ACUTE;0173 0301
LATIN CAPITAL LETTER U WITH OGONEK AND TILDE;0172 0303
LATIN SMALL LETTER U WITH OGONEK AND TILDE;0173 0303
LATIN CAPITAL LETTER U WITH MACRON AND ACUTE;016A 0301
LATIN SMALL LETTER U WITH MACRON AND ACUTE;016B 0301
LATIN CAPITAL LETTER U WITH MACRON AND TILDE;016A 0303
LATIN SMALL LETTER U WITH MACRON AND TILDE;016B 0303
# Proposed additions for Tamil.
TAMIL LETTER KSSA;0B95 0BCD 0BB7
TAMIL LETTER SHRII;0BB6 0BCD 0BB0 0BC0

File diff suppressed because it is too large Load Diff

View File

@ -0,0 +1,48 @@
# NormalizationCorrections-5.0.0.txt
# Date: 2006-07-14, 11:23:00 PDT [KW]
#
# This file is a normative contributory data file in the
# Unicode Character Database.
#
# Copyright (c) 1991-2006 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
#
# The normalization stabilization policy of the Unicode
# Consortium ordinarily precludes any change to the decomposition
# for any character, once established in a relevant version
# of the UnicodeData.txt data file. However, under certain
# exceptional (and rare) conditions, an error in a decomposition
# mapping may be discovered that is truly just an unintended
# typo in the data, and not a matter of dubious interpretation.
#
# Whenever such an error may be found, and if it meets the
# requirements for possible exceptions to normalization
# stability, the correction is entered in this data file,
# so that any implementation depending on absolute stability
# of normalization, *including* any errors in the data, can
# safely reconstruct the exact state of the data tables at
# any given version of Unicode.
#
# Currently this list has exactly six entries in it, one for the
# typo found and corrected in Corrigendum #3, and five for
# the typos and misidentifications found and corrected in
# Corrigendum #4. All efforts
# will be made to keep the entries limited to just those fixes.
#
# Interpretation of the fields:
# Field 0: Unicode code point
# Field 1: Original (erroneous) decomposition
# Field 2: Corrected decomposition
# Field 3: Version of Unicode for which the correction was
# entered into UnicodeData.txt, in n.n.n format.
# Comment: Indicates the Unicode Corrigendum which documents
# the correction
#
# For more information, see UAX #15, Unicode Normalization Forms.
#
F951;96FB;964B;3.2.0 # Corrigendum 3
2F868;2136A;36FC;4.0.0 # Corrigendum 4
2F874;5F33;5F53;4.0.0 # Corrigendum 4
2F91F;43AB;243AB;4.0.0 # Corrigendum 4
2F95F;7AAE;7AEE;4.0.0 # Corrigendum 4
2F9BF;4D57;45D7;4.0.0 # Corrigendum 4

File diff suppressed because it is too large Load Diff

File diff suppressed because it is too large Load Diff

View File

@ -0,0 +1,165 @@
# PropertyAliases-5.0.0.txt
# Date: 2006-03-03, 08:23:34 GMT [MD]
#
# Unicode Character Database
# Copyright (c) 1991-2006 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
# For documentation, see UCD.html
#
# This file contains aliases for properties used in the UCD.
# These names can be used for XML formats of UCD data, for regular-expression
# property tests, and other programmatic textual descriptions of Unicode data.
# For information on which properties are normative, see UCD.html.
#
# The names may be translated in appropriate environments, and additional
# aliases may be useful.
#
# FORMAT
#
# Each line has two or more fields, separated by semicolons.
#
# First Field: The first field is an abbreviated name for the property.
#
# Second Field: The second field is a long name.
#
# The above are the preferred aliases. Other aliases may be listed in additional fields.
#
# Loose matching should be applied to all property names and property values, with
# the exception of String Property values. With loose matching of property names and
# values, the case distinctions, whitespace, and '_' are ignored. For Numeric Property
# values, numeric equivalencies are applied: thus "01.00" is equivalent to "1".
#
# NOTE: Property value names are NOT unique across properties. For example:
#
# AL means Arabic Letter for the Bidi_Class property, and
# AL means Alpha_Left for the Combining_Class property, and
# AL means Alphabetic for the Line_Break property.
#
# In addition, some property names may be the same as some property value names.
# For example:
#
# sc means the Script property, and
# Sc means the General_Category property value Currency_Symbol (Sc)
#
# The combination of property value and property name is, however, unique.
#
# For more information, see UTS #18: Regular Expression Guidelines
# ================================================
# ================================================
# Numeric Properties
# ================================================
nv ; Numeric_Value
# ================================================
# String Properties
# ================================================
bmg ; Bidi_Mirroring_Glyph
cf ; Case_Folding
dm ; Decomposition_Mapping
FC_NFKC ; FC_NFKC_Closure
lc ; Lowercase_Mapping
scc ; Special_Case_Condition
sfc ; Simple_Case_Folding
slc ; Simple_Lowercase_Mapping
stc ; Simple_Titlecase_Mapping
suc ; Simple_Uppercase_Mapping
tc ; Titlecase_Mapping
uc ; Uppercase_Mapping
# ================================================
# Miscellaneous Properties
# ================================================
isc ; ISO_Comment
na ; Name
na1 ; Unicode_1_Name
URS ; Unicode_Radical_Stroke
# ================================================
# Catalog Properties
# ================================================
age ; Age
blk ; Block
sc ; Script
# ================================================
# Enumerated Properties
# ================================================
bc ; Bidi_Class
ccc ; Canonical_Combining_Class
dt ; Decomposition_Type
ea ; East_Asian_Width
gc ; General_Category
GCB ; Grapheme_Cluster_Break
hst ; Hangul_Syllable_Type
jg ; Joining_Group
jt ; Joining_Type
lb ; Line_Break
NFC_QC ; NFC_Quick_Check
NFD_QC ; NFD_Quick_Check
NFKC_QC ; NFKC_Quick_Check
NFKD_QC ; NFKD_Quick_Check
nt ; Numeric_Type
SB ; Sentence_Break
WB ; Word_Break
# ================================================
# Binary Properties
# ================================================
AHex ; ASCII_Hex_Digit
Alpha ; Alphabetic
Bidi_C ; Bidi_Control
Bidi_M ; Bidi_Mirrored
CE ; Composition_Exclusion
Comp_Ex ; Full_Composition_Exclusion
Dash ; Dash
Dep ; Deprecated
DI ; Default_Ignorable_Code_Point
Dia ; Diacritic
Ext ; Extender
Gr_Base ; Grapheme_Base
Gr_Ext ; Grapheme_Extend
Gr_Link ; Grapheme_Link
Hex ; Hex_Digit
Hyphen ; Hyphen
IDC ; ID_Continue
Ideo ; Ideographic
IDS ; ID_Start
IDSB ; IDS_Binary_Operator
IDST ; IDS_Trinary_Operator
Join_C ; Join_Control
LOE ; Logical_Order_Exception
Lower ; Lowercase
Math ; Math
NChar ; Noncharacter_Code_Point
OAlpha ; Other_Alphabetic
ODI ; Other_Default_Ignorable_Code_Point
OGr_Ext ; Other_Grapheme_Extend
OIDC ; Other_ID_Continue
OIDS ; Other_ID_Start
OLower ; Other_Lowercase
OMath ; Other_Math
OUpper ; Other_Uppercase
Pat_Syn ; Pattern_Syntax
Pat_WS ; Pattern_White_Space
QMark ; Quotation_Mark
Radical ; Radical
SD ; Soft_Dotted
STerm ; STerm
Term ; Terminal_Punctuation
UIdeo ; Unified_Ideograph
Upper ; Uppercase
VS ; Variation_Selector
WSpace ; White_Space ; space
XIDC ; XID_Continue
XIDS ; XID_Start
XO_NFC ; Expands_On_NFC
XO_NFD ; Expands_On_NFD
XO_NFKC ; Expands_On_NFKC
XO_NFKD ; Expands_On_NFKD
# ================================================
# Total: 88
# EOF

View File

@ -0,0 +1,596 @@
# PropertyValueAliases-5.0.0.txt
# Date: 2006-03-03, 08:23:34 GMT [MD]
#
# Unicode Character Database
# Copyright (c) 1991-2006 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
# For documentation, see UCD.html
#
# This file contains aliases for property values used in the UCD.
# These names can be used for XML formats of UCD data, for regular-expression
# property tests, and other programmatic textual descriptions of Unicode data.
# For information on which properties are normative, see UCD.html.
#
# The names may be translated in appropriate environments, and additional
# aliases may be useful.
#
# FORMAT
#
# Each line describes a property value name.
# This consists of three or more fields, separated by semicolons.
#
# First Field: The first field describes the property for which that
# property value name is used.
#
# Second Field: The second field is an abbreviated name.
# If there is no abbreviated name available, the field is marked with "n/a".
#
# Third Field: The third field is a long name.
#
# In the case of ccc, there are 4 fields. The second field is numeric, third
# is abbreviated, and fourth is long.
#
# The above are the preferred aliases. Other aliases may be listed in additional fields.
#
# Loose matching should be applied to all property names and property values, with
# the exception of String Property values. With loose matching of property names and
# values, the case distinctions, whitespace, and '_' are ignored. For Numeric Property
# values, numeric equivalencies are applied: thus "01.00" is equivalent to "1".
#
# NOTE: Property value names are NOT unique across properties. For example:
#
# AL means Arabic Letter for the Bidi_Class property, and
# AL means Alpha_Left for the Combining_Class property, and
# AL means Alphabetic for the Line_Break property.
#
# In addition, some property names may be the same as some property value names.
# For example:
#
# sc means the Script property, and
# Sc means the General_Category property value Currency_Symbol (Sc)
#
# The combination of property value and property name is, however, unique.
#
# For more information, see UTS #18: Regular Expression Guidelines
# ================================================
# Age (age)
age; n/a ; 1.1
age; n/a ; 2.0
age; n/a ; 2.1
age; n/a ; 3.0
age; n/a ; 3.1
age; n/a ; 3.2
age; n/a ; 4.0
age; n/a ; 4.1
age; n/a ; 5.0
age; n/a ; unassigned
# Bidi_Class (bc)
bc ; AL ; Arabic_Letter
bc ; AN ; Arabic_Number
bc ; B ; Paragraph_Separator
bc ; BN ; Boundary_Neutral
bc ; CS ; Common_Separator
bc ; EN ; European_Number
bc ; ES ; European_Separator
bc ; ET ; European_Terminator
bc ; L ; Left_To_Right
bc ; LRE ; Left_To_Right_Embedding
bc ; LRO ; Left_To_Right_Override
bc ; NSM ; Nonspacing_Mark
bc ; ON ; Other_Neutral
bc ; PDF ; Pop_Directional_Format
bc ; R ; Right_To_Left
bc ; RLE ; Right_To_Left_Embedding
bc ; RLO ; Right_To_Left_Override
bc ; S ; Segment_Separator
bc ; WS ; White_Space
# Block (blk)
blk; n/a ; Aegean_Numbers
blk; n/a ; Alphabetic_Presentation_Forms
blk; n/a ; Ancient_Greek_Musical_Notation
blk; n/a ; Ancient_Greek_Numbers
blk; n/a ; Arabic
blk; n/a ; Arabic_Presentation_Forms-A
blk; n/a ; Arabic_Presentation_Forms-B
blk; n/a ; Arabic_Supplement
blk; n/a ; Armenian
blk; n/a ; Arrows
blk; n/a ; Balinese
blk; n/a ; Basic_Latin
blk; n/a ; Bengali
blk; n/a ; Block_Elements
blk; n/a ; Bopomofo
blk; n/a ; Bopomofo_Extended
blk; n/a ; Box_Drawing
blk; n/a ; Braille_Patterns
blk; n/a ; Buginese
blk; n/a ; Buhid
blk; n/a ; Byzantine_Musical_Symbols
blk; n/a ; Cherokee
blk; n/a ; CJK_Compatibility
blk; n/a ; CJK_Compatibility_Forms
blk; n/a ; CJK_Compatibility_Ideographs
blk; n/a ; CJK_Compatibility_Ideographs_Supplement
blk; n/a ; CJK_Radicals_Supplement
blk; n/a ; CJK_Strokes
blk; n/a ; CJK_Symbols_and_Punctuation
blk; n/a ; CJK_Unified_Ideographs
blk; n/a ; CJK_Unified_Ideographs_Extension_A
blk; n/a ; CJK_Unified_Ideographs_Extension_B
blk; n/a ; Combining_Diacritical_Marks
blk; n/a ; Combining_Diacritical_Marks_for_Symbols
blk; n/a ; Combining_Diacritical_Marks_Supplement
blk; n/a ; Combining_Half_Marks
blk; n/a ; Control_Pictures
blk; n/a ; Coptic
blk; n/a ; Counting_Rod_Numerals
blk; n/a ; Cuneiform
blk; n/a ; Cuneiform_Numbers_and_Punctuation
blk; n/a ; Currency_Symbols
blk; n/a ; Cypriot_Syllabary
blk; n/a ; Cyrillic
blk; n/a ; Cyrillic_Supplement ; Cyrillic_Supplementary
blk; n/a ; Deseret
blk; n/a ; Devanagari
blk; n/a ; Dingbats
blk; n/a ; Enclosed_Alphanumerics
blk; n/a ; Enclosed_CJK_Letters_and_Months
blk; n/a ; Ethiopic
blk; n/a ; Ethiopic_Extended
blk; n/a ; Ethiopic_Supplement
blk; n/a ; General_Punctuation
blk; n/a ; Geometric_Shapes
blk; n/a ; Georgian
blk; n/a ; Georgian_Supplement
blk; n/a ; Glagolitic
blk; n/a ; Gothic
blk; n/a ; Greek_and_Coptic
blk; n/a ; Greek_Extended
blk; n/a ; Gujarati
blk; n/a ; Gurmukhi
blk; n/a ; Halfwidth_and_Fullwidth_Forms
blk; n/a ; Hangul_Compatibility_Jamo
blk; n/a ; Hangul_Jamo
blk; n/a ; Hangul_Syllables
blk; n/a ; Hanunoo
blk; n/a ; Hebrew
blk; n/a ; High_Private_Use_Surrogates
blk; n/a ; High_Surrogates
blk; n/a ; Hiragana
blk; n/a ; Ideographic_Description_Characters
blk; n/a ; IPA_Extensions
blk; n/a ; Kanbun
blk; n/a ; Kangxi_Radicals
blk; n/a ; Kannada
blk; n/a ; Katakana
blk; n/a ; Katakana_Phonetic_Extensions
blk; n/a ; Kharoshthi
blk; n/a ; Khmer
blk; n/a ; Khmer_Symbols
blk; n/a ; Lao
blk; n/a ; Latin-1_Supplement
blk; n/a ; Latin_Extended-A
blk; n/a ; Latin_Extended-B
blk; n/a ; Latin_Extended-C
blk; n/a ; Latin_Extended-D
blk; n/a ; Latin_Extended_Additional
blk; n/a ; Letterlike_Symbols
blk; n/a ; Limbu
blk; n/a ; Linear_B_Ideograms
blk; n/a ; Linear_B_Syllabary
blk; n/a ; Low_Surrogates
blk; n/a ; Malayalam
blk; n/a ; Mathematical_Alphanumeric_Symbols
blk; n/a ; Mathematical_Operators
blk; n/a ; Miscellaneous_Mathematical_Symbols-A
blk; n/a ; Miscellaneous_Mathematical_Symbols-B
blk; n/a ; Miscellaneous_Symbols
blk; n/a ; Miscellaneous_Symbols_and_Arrows
blk; n/a ; Miscellaneous_Technical
blk; n/a ; Modifier_Tone_Letters
blk; n/a ; Mongolian
blk; n/a ; Musical_Symbols
blk; n/a ; Myanmar
blk; n/a ; New_Tai_Lue
blk; n/a ; NKo
blk; n/a ; No_Block
blk; n/a ; Number_Forms
blk; n/a ; Ogham
blk; n/a ; Old_Italic
blk; n/a ; Old_Persian
blk; n/a ; Optical_Character_Recognition
blk; n/a ; Oriya
blk; n/a ; Osmanya
blk; n/a ; Phags-pa
blk; n/a ; Phoenician
blk; n/a ; Phonetic_Extensions
blk; n/a ; Phonetic_Extensions_Supplement
blk; n/a ; Private_Use_Area
blk; n/a ; Runic
blk; n/a ; Shavian
blk; n/a ; Sinhala
blk; n/a ; Small_Form_Variants
blk; n/a ; Spacing_Modifier_Letters
blk; n/a ; Specials
blk; n/a ; Superscripts_and_Subscripts
blk; n/a ; Supplemental_Arrows-A
blk; n/a ; Supplemental_Arrows-B
blk; n/a ; Supplemental_Mathematical_Operators
blk; n/a ; Supplemental_Punctuation
blk; n/a ; Supplementary_Private_Use_Area-A
blk; n/a ; Supplementary_Private_Use_Area-B
blk; n/a ; Syloti_Nagri
blk; n/a ; Syriac
blk; n/a ; Tagalog
blk; n/a ; Tagbanwa
blk; n/a ; Tags
blk; n/a ; Tai_Le
blk; n/a ; Tai_Xuan_Jing_Symbols
blk; n/a ; Tamil
blk; n/a ; Telugu
blk; n/a ; Thaana
blk; n/a ; Thai
blk; n/a ; Tibetan
blk; n/a ; Tifinagh
blk; n/a ; Ugaritic
blk; n/a ; Unified_Canadian_Aboriginal_Syllabics
blk; n/a ; Variation_Selectors
blk; n/a ; Variation_Selectors_Supplement
blk; n/a ; Vertical_Forms
blk; n/a ; Yi_Radicals
blk; n/a ; Yi_Syllables
blk; n/a ; Yijing_Hexagram_Symbols
# Canonical_Combining_Class (ccc)
ccc; 0; NR ; Not_Reordered
ccc; 1; OV ; Overlay
ccc; 7; NK ; Nukta
ccc; 8; KV ; Kana_Voicing
ccc; 9; VR ; Virama
ccc; 200; ATBL ; Attached_Below_Left
ccc; 202; ATB ; Attached_Below
ccc; 216; ATAR ; Attached_Above_Right
ccc; 218; BL ; Below_Left
ccc; 220; B ; Below
ccc; 222; BR ; Below_Right
ccc; 224; L ; Left
ccc; 226; R ; Right
ccc; 228; AL ; Above_Left
ccc; 230; A ; Above
ccc; 232; AR ; Above_Right
ccc; 233; DB ; Double_Below
ccc; 234; DA ; Double_Above
ccc; 240; IS ; Iota_Subscript
# Decomposition_Type (dt)
dt ; can ; Canonical
dt ; com ; Compat
dt ; enc ; Circle
dt ; fin ; Final
dt ; font ; Font
dt ; fra ; Fraction
dt ; init ; Initial
dt ; iso ; Isolated
dt ; med ; Medial
dt ; nar ; Narrow
dt ; nb ; Nobreak
dt ; none ; None
dt ; sml ; Small
dt ; sqr ; Square
dt ; sub ; Sub
dt ; sup ; Super
dt ; vert ; Vertical
dt ; wide ; Wide
# East_Asian_Width (ea)
ea ; A ; Ambiguous
ea ; F ; Fullwidth
ea ; H ; Halfwidth
ea ; N ; Neutral
ea ; Na ; Narrow
ea ; W ; Wide
# General_Category (gc)
gc ; C ; Other # Cc | Cf | Cn | Co | Cs
gc ; Cc ; Control ; cntrl
gc ; Cf ; Format
gc ; Cn ; Unassigned
gc ; Co ; Private_Use
gc ; Cs ; Surrogate
gc ; L ; Letter # Ll | Lm | Lo | Lt | Lu
gc ; LC ; Cased_Letter # Ll | Lt | Lu
gc ; Ll ; Lowercase_Letter
gc ; Lm ; Modifier_Letter
gc ; Lo ; Other_Letter
gc ; Lt ; Titlecase_Letter
gc ; Lu ; Uppercase_Letter
gc ; M ; Mark # Mc | Me | Mn
gc ; Mc ; Spacing_Mark
gc ; Me ; Enclosing_Mark
gc ; Mn ; Nonspacing_Mark
gc ; N ; Number # Nd | Nl | No
gc ; Nd ; Decimal_Number ; digit
gc ; Nl ; Letter_Number
gc ; No ; Other_Number
gc ; P ; Punctuation ; punct # Pc | Pd | Pe | Pf | Pi | Po | Ps
gc ; Pc ; Connector_Punctuation
gc ; Pd ; Dash_Punctuation
gc ; Pe ; Close_Punctuation
gc ; Pf ; Final_Punctuation
gc ; Pi ; Initial_Punctuation
gc ; Po ; Other_Punctuation
gc ; Ps ; Open_Punctuation
gc ; S ; Symbol # Sc | Sk | Sm | So
gc ; Sc ; Currency_Symbol
gc ; Sk ; Modifier_Symbol
gc ; Sm ; Math_Symbol
gc ; So ; Other_Symbol
gc ; Z ; Separator # Zl | Zp | Zs
gc ; Zl ; Line_Separator
gc ; Zp ; Paragraph_Separator
gc ; Zs ; Space_Separator
# Grapheme_Cluster_Break (GCB)
GCB; CN ; Control
GCB; CR ; CR
GCB; EX ; Extend
GCB; L ; L
GCB; LF ; LF
GCB; LV ; LV
GCB; LVT ; LVT
GCB; T ; T
GCB; V ; V
GCB; XX ; Other
# Hangul_Syllable_Type (hst)
hst; L ; Leading_Jamo
hst; LV ; LV_Syllable
hst; LVT ; LVT_Syllable
hst; NA ; Not_Applicable
hst; T ; Trailing_Jamo
hst; V ; Vowel_Jamo
# Joining_Group (jg)
jg ; n/a ; Ain
jg ; n/a ; Alaph
jg ; n/a ; Alef
jg ; n/a ; Beh
jg ; n/a ; Beth
jg ; n/a ; Dal
jg ; n/a ; Dalath_Rish
jg ; n/a ; E
jg ; n/a ; Fe
jg ; n/a ; Feh
jg ; n/a ; Final_Semkath
jg ; n/a ; Gaf
jg ; n/a ; Gamal
jg ; n/a ; Hah
jg ; n/a ; Hamza_On_Heh_Goal
jg ; n/a ; He
jg ; n/a ; Heh
jg ; n/a ; Heh_Goal
jg ; n/a ; Heth
jg ; n/a ; Kaf
jg ; n/a ; Kaph
jg ; n/a ; Khaph
jg ; n/a ; Knotted_Heh
jg ; n/a ; Lam
jg ; n/a ; Lamadh
jg ; n/a ; Meem
jg ; n/a ; Mim
jg ; n/a ; No_Joining_Group
jg ; n/a ; Noon
jg ; n/a ; Nun
jg ; n/a ; Pe
jg ; n/a ; Qaf
jg ; n/a ; Qaph
jg ; n/a ; Reh
jg ; n/a ; Reversed_Pe
jg ; n/a ; Sad
jg ; n/a ; Sadhe
jg ; n/a ; Seen
jg ; n/a ; Semkath
jg ; n/a ; Shin
jg ; n/a ; Swash_Kaf
jg ; n/a ; Syriac_Waw
jg ; n/a ; Tah
jg ; n/a ; Taw
jg ; n/a ; Teh_Marbuta
jg ; n/a ; Teth
jg ; n/a ; Waw
jg ; n/a ; Yeh
jg ; n/a ; Yeh_Barree
jg ; n/a ; Yeh_With_Tail
jg ; n/a ; Yudh
jg ; n/a ; Yudh_He
jg ; n/a ; Zain
jg ; n/a ; Zhain
# Joining_Type (jt)
jt ; C ; Join_Causing
jt ; D ; Dual_Joining
jt ; L ; Left_Joining
jt ; R ; Right_Joining
jt ; T ; Transparent
jt ; U ; Non_Joining
# Line_Break (lb)
lb ; AI ; Ambiguous
lb ; AL ; Alphabetic
lb ; B2 ; Break_Both
lb ; BA ; Break_After
lb ; BB ; Break_Before
lb ; BK ; Mandatory_Break
lb ; CB ; Contingent_Break
lb ; CL ; Close_Punctuation
lb ; CM ; Combining_Mark
lb ; CR ; Carriage_Return
lb ; EX ; Exclamation
lb ; GL ; Glue
lb ; H2 ; H2
lb ; H3 ; H3
lb ; HY ; Hyphen
lb ; ID ; Ideographic
lb ; IN ; Inseparable ; Inseperable
lb ; IS ; Infix_Numeric
lb ; JL ; JL
lb ; JT ; JT
lb ; JV ; JV
lb ; LF ; Line_Feed
lb ; NL ; Next_Line
lb ; NS ; Nonstarter
lb ; NU ; Numeric
lb ; OP ; Open_Punctuation
lb ; PO ; Postfix_Numeric
lb ; PR ; Prefix_Numeric
lb ; QU ; Quotation
lb ; SA ; Complex_Context
lb ; SG ; Surrogate
lb ; SP ; Space
lb ; SY ; Break_Symbols
lb ; WJ ; Word_Joiner
lb ; XX ; Unknown
lb ; ZW ; ZWSpace
# NFC_Quick_Check (NFC_QC)
NFC_QC; M ; Maybe
NFC_QC; N ; No
NFC_QC; Y ; Yes
# NFD_Quick_Check (NFD_QC)
NFD_QC; N ; No
NFD_QC; Y ; Yes
# NFKC_Quick_Check (NFKC_QC)
NFKC_QC; M ; Maybe
NFKC_QC; N ; No
NFKC_QC; Y ; Yes
# NFKD_Quick_Check (NFKD_QC)
NFKD_QC; N ; No
NFKD_QC; Y ; Yes
# Numeric_Type (nt)
nt ; De ; Decimal
nt ; Di ; Digit
nt ; None ; None
nt ; Nu ; Numeric
# Script (sc)
sc ; Arab ; Arabic
sc ; Armn ; Armenian
sc ; Bali ; Balinese
sc ; Beng ; Bengali
sc ; Bopo ; Bopomofo
sc ; Brai ; Braille
sc ; Bugi ; Buginese
sc ; Buhd ; Buhid
sc ; Cans ; Canadian_Aboriginal
sc ; Cher ; Cherokee
sc ; Copt ; Coptic ; Qaac
sc ; Cprt ; Cypriot
sc ; Cyrl ; Cyrillic
sc ; Deva ; Devanagari
sc ; Dsrt ; Deseret
sc ; Ethi ; Ethiopic
sc ; Geor ; Georgian
sc ; Glag ; Glagolitic
sc ; Goth ; Gothic
sc ; Grek ; Greek
sc ; Gujr ; Gujarati
sc ; Guru ; Gurmukhi
sc ; Hang ; Hangul
sc ; Hani ; Han
sc ; Hano ; Hanunoo
sc ; Hebr ; Hebrew
sc ; Hira ; Hiragana
sc ; Hrkt ; Katakana_Or_Hiragana
sc ; Ital ; Old_Italic
sc ; Kana ; Katakana
sc ; Khar ; Kharoshthi
sc ; Khmr ; Khmer
sc ; Knda ; Kannada
sc ; Laoo ; Lao
sc ; Latn ; Latin
sc ; Limb ; Limbu
sc ; Linb ; Linear_B
sc ; Mlym ; Malayalam
sc ; Mong ; Mongolian
sc ; Mymr ; Myanmar
sc ; Nkoo ; Nko
sc ; Ogam ; Ogham
sc ; Orya ; Oriya
sc ; Osma ; Osmanya
sc ; Phag ; Phags_Pa
sc ; Phnx ; Phoenician
sc ; Qaai ; Inherited
sc ; Runr ; Runic
sc ; Shaw ; Shavian
sc ; Sinh ; Sinhala
sc ; Sylo ; Syloti_Nagri
sc ; Syrc ; Syriac
sc ; Tagb ; Tagbanwa
sc ; Tale ; Tai_Le
sc ; Talu ; New_Tai_Lue
sc ; Taml ; Tamil
sc ; Telu ; Telugu
sc ; Tfng ; Tifinagh
sc ; Tglg ; Tagalog
sc ; Thaa ; Thaana
sc ; Thai ; Thai
sc ; Tibt ; Tibetan
sc ; Ugar ; Ugaritic
sc ; Xpeo ; Old_Persian
sc ; Xsux ; Cuneiform
sc ; Yiii ; Yi
sc ; Zyyy ; Common
sc ; Zzzz ; Unknown
# Sentence_Break (SB)
SB ; AT ; ATerm
SB ; CL ; Close
SB ; FO ; Format
SB ; LE ; OLetter
SB ; LO ; Lower
SB ; NU ; Numeric
SB ; SE ; Sep
SB ; SP ; Sp
SB ; ST ; STerm
SB ; UP ; Upper
SB ; XX ; Other
# Word_Break (WB)
WB ; EX ; ExtendNumLet
WB ; FO ; Format
WB ; KA ; Katakana
WB ; LE ; ALetter
WB ; ML ; MidLetter
WB ; MN ; MidNum
WB ; NU ; Numeric
WB ; XX ; Other
# EOF

View File

@ -0,0 +1,13 @@
# Date: 2006-07-14, 15:34:00 PST [KW]
#
# Unicode Character Database
# Copyright (c) 1991-2006 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
#
# For documentation, see UCD.html, Unihan.html, and NamesList.html
#
This directory contains final contributory data files
for the Unicode Character Database (UCD) for Unicode 5.0.0.

File diff suppressed because it is too large Load Diff

View File

@ -0,0 +1,264 @@
# SpecialCasing-5.0.0.txt
# Date: 2006-03-03, 08:23:36 GMT [MD]
#
# Unicode Character Database
# Copyright (c) 1991-2006 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
# For documentation, see UCD.html
#
# Special Casing Properties
#
# This file is a supplement to the UnicodeData file.
# It contains additional information about the casing of Unicode characters.
# (For compatibility, the UnicodeData.txt file only contains case mappings for
# characters where they are 1-1, and does not have locale-specific mappings.)
# For more information, see the discussion of Case Mappings in the Unicode Standard.
#
# All code points not listed in this file that do not have simple case mappings
# in UnicodeData.txt map to themselves.
# ================================================================================
# Format
# ================================================================================
# The entries in this file are in the following machine-readable format:
#
# <code>; <lower> ; <title> ; <upper> ; (<condition_list> ;)? # <comment>
#
# <code>, <lower>, <title>, and <upper> provide character values in hex. If there is more
# than one character, they are separated by spaces. Other than as used to separate
# elements, spaces are to be ignored.
#
# The <condition_list> is optional. Where present, it consists of one or more locale IDs
# or contexts, separated by spaces. In these conditions:
# - A condition list overrides the normal behavior if all of the listed conditions are true.
# - The context is always the context of the characters in the original string,
# NOT in the resulting string.
# - Case distinctions in the condition list are not significant.
# - Conditions preceded by "Not_" represent the negation of the condition.
#
# A locale ID is defined by taking any language tag as defined by
# RFC 3066 (or its successor), and replacing '-' by '_'.
#
# A context for a character C is defined by Section 3.13 Default Case
# Operations, of The Unicode Standard, Version 5.0.
# (This is identical to the context defined by Unicode 4.1.0,
# as specified in http://www.unicode.org/versions/Unicode4.1.0/)
#
# Parsers of this file must be prepared to deal with future additions to this format:
# * Additional contexts
# * Additional fields
# ================================================================================
# ================================================================================
# Unconditional mappings
# ================================================================================
# The German es-zed is special--the normal mapping is to SS.
# Note: the titlecase should never occur in practice. It is equal to titlecase(uppercase(<es-zed>))
00DF; 00DF; 0053 0073; 0053 0053; # LATIN SMALL LETTER SHARP S
# Preserve canonical equivalence for I with dot. Turkic is handled below.
0130; 0069 0307; 0130; 0130; # LATIN CAPITAL LETTER I WITH DOT ABOVE
# Ligatures
FB00; FB00; 0046 0066; 0046 0046; # LATIN SMALL LIGATURE FF
FB01; FB01; 0046 0069; 0046 0049; # LATIN SMALL LIGATURE FI
FB02; FB02; 0046 006C; 0046 004C; # LATIN SMALL LIGATURE FL
FB03; FB03; 0046 0066 0069; 0046 0046 0049; # LATIN SMALL LIGATURE FFI
FB04; FB04; 0046 0066 006C; 0046 0046 004C; # LATIN SMALL LIGATURE FFL
FB05; FB05; 0053 0074; 0053 0054; # LATIN SMALL LIGATURE LONG S T
FB06; FB06; 0053 0074; 0053 0054; # LATIN SMALL LIGATURE ST
0587; 0587; 0535 0582; 0535 0552; # ARMENIAN SMALL LIGATURE ECH YIWN
FB13; FB13; 0544 0576; 0544 0546; # ARMENIAN SMALL LIGATURE MEN NOW
FB14; FB14; 0544 0565; 0544 0535; # ARMENIAN SMALL LIGATURE MEN ECH
FB15; FB15; 0544 056B; 0544 053B; # ARMENIAN SMALL LIGATURE MEN INI
FB16; FB16; 054E 0576; 054E 0546; # ARMENIAN SMALL LIGATURE VEW NOW
FB17; FB17; 0544 056D; 0544 053D; # ARMENIAN SMALL LIGATURE MEN XEH
# No corresponding uppercase precomposed character
0149; 0149; 02BC 004E; 02BC 004E; # LATIN SMALL LETTER N PRECEDED BY APOSTROPHE
0390; 0390; 0399 0308 0301; 0399 0308 0301; # GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS
03B0; 03B0; 03A5 0308 0301; 03A5 0308 0301; # GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS
01F0; 01F0; 004A 030C; 004A 030C; # LATIN SMALL LETTER J WITH CARON
1E96; 1E96; 0048 0331; 0048 0331; # LATIN SMALL LETTER H WITH LINE BELOW
1E97; 1E97; 0054 0308; 0054 0308; # LATIN SMALL LETTER T WITH DIAERESIS
1E98; 1E98; 0057 030A; 0057 030A; # LATIN SMALL LETTER W WITH RING ABOVE
1E99; 1E99; 0059 030A; 0059 030A; # LATIN SMALL LETTER Y WITH RING ABOVE
1E9A; 1E9A; 0041 02BE; 0041 02BE; # LATIN SMALL LETTER A WITH RIGHT HALF RING
1F50; 1F50; 03A5 0313; 03A5 0313; # GREEK SMALL LETTER UPSILON WITH PSILI
1F52; 1F52; 03A5 0313 0300; 03A5 0313 0300; # GREEK SMALL LETTER UPSILON WITH PSILI AND VARIA
1F54; 1F54; 03A5 0313 0301; 03A5 0313 0301; # GREEK SMALL LETTER UPSILON WITH PSILI AND OXIA
1F56; 1F56; 03A5 0313 0342; 03A5 0313 0342; # GREEK SMALL LETTER UPSILON WITH PSILI AND PERISPOMENI
1FB6; 1FB6; 0391 0342; 0391 0342; # GREEK SMALL LETTER ALPHA WITH PERISPOMENI
1FC6; 1FC6; 0397 0342; 0397 0342; # GREEK SMALL LETTER ETA WITH PERISPOMENI
1FD2; 1FD2; 0399 0308 0300; 0399 0308 0300; # GREEK SMALL LETTER IOTA WITH DIALYTIKA AND VARIA
1FD3; 1FD3; 0399 0308 0301; 0399 0308 0301; # GREEK SMALL LETTER IOTA WITH DIALYTIKA AND OXIA
1FD6; 1FD6; 0399 0342; 0399 0342; # GREEK SMALL LETTER IOTA WITH PERISPOMENI
1FD7; 1FD7; 0399 0308 0342; 0399 0308 0342; # GREEK SMALL LETTER IOTA WITH DIALYTIKA AND PERISPOMENI
1FE2; 1FE2; 03A5 0308 0300; 03A5 0308 0300; # GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND VARIA
1FE3; 1FE3; 03A5 0308 0301; 03A5 0308 0301; # GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND OXIA
1FE4; 1FE4; 03A1 0313; 03A1 0313; # GREEK SMALL LETTER RHO WITH PSILI
1FE6; 1FE6; 03A5 0342; 03A5 0342; # GREEK SMALL LETTER UPSILON WITH PERISPOMENI
1FE7; 1FE7; 03A5 0308 0342; 03A5 0308 0342; # GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND PERISPOMENI
1FF6; 1FF6; 03A9 0342; 03A9 0342; # GREEK SMALL LETTER OMEGA WITH PERISPOMENI
# IMPORTANT-when capitalizing iota-subscript (0345)
# It MUST be in normalized form--moved to the end of any sequence of combining marks.
# This is because logically it represents a following base character!
# E.g. <iota_subscript> (<Mn> | <Mc> | <Me>)+ => (<Mn> | <Mc> | <Me>)+ <iota_subscript>
# It should never be the first character in a word, so in titlecasing it can be left as is.
# The following cases are already in the UnicodeData file, so are only commented here.
# 0345; 0345; 0345; 0399; # COMBINING GREEK YPOGEGRAMMENI
# All letters with YPOGEGRAMMENI (iota-subscript) or PROSGEGRAMMENI (iota adscript)
# have special uppercases.
# Note: characters with PROSGEGRAMMENI are actually titlecase, not uppercase!
1F80; 1F80; 1F88; 1F08 0399; # GREEK SMALL LETTER ALPHA WITH PSILI AND YPOGEGRAMMENI
1F81; 1F81; 1F89; 1F09 0399; # GREEK SMALL LETTER ALPHA WITH DASIA AND YPOGEGRAMMENI
1F82; 1F82; 1F8A; 1F0A 0399; # GREEK SMALL LETTER ALPHA WITH PSILI AND VARIA AND YPOGEGRAMMENI
1F83; 1F83; 1F8B; 1F0B 0399; # GREEK SMALL LETTER ALPHA WITH DASIA AND VARIA AND YPOGEGRAMMENI
1F84; 1F84; 1F8C; 1F0C 0399; # GREEK SMALL LETTER ALPHA WITH PSILI AND OXIA AND YPOGEGRAMMENI
1F85; 1F85; 1F8D; 1F0D 0399; # GREEK SMALL LETTER ALPHA WITH DASIA AND OXIA AND YPOGEGRAMMENI
1F86; 1F86; 1F8E; 1F0E 0399; # GREEK SMALL LETTER ALPHA WITH PSILI AND PERISPOMENI AND YPOGEGRAMMENI
1F87; 1F87; 1F8F; 1F0F 0399; # GREEK SMALL LETTER ALPHA WITH DASIA AND PERISPOMENI AND YPOGEGRAMMENI
1F88; 1F80; 1F88; 1F08 0399; # GREEK CAPITAL LETTER ALPHA WITH PSILI AND PROSGEGRAMMENI
1F89; 1F81; 1F89; 1F09 0399; # GREEK CAPITAL LETTER ALPHA WITH DASIA AND PROSGEGRAMMENI
1F8A; 1F82; 1F8A; 1F0A 0399; # GREEK CAPITAL LETTER ALPHA WITH PSILI AND VARIA AND PROSGEGRAMMENI
1F8B; 1F83; 1F8B; 1F0B 0399; # GREEK CAPITAL LETTER ALPHA WITH DASIA AND VARIA AND PROSGEGRAMMENI
1F8C; 1F84; 1F8C; 1F0C 0399; # GREEK CAPITAL LETTER ALPHA WITH PSILI AND OXIA AND PROSGEGRAMMENI
1F8D; 1F85; 1F8D; 1F0D 0399; # GREEK CAPITAL LETTER ALPHA WITH DASIA AND OXIA AND PROSGEGRAMMENI
1F8E; 1F86; 1F8E; 1F0E 0399; # GREEK CAPITAL LETTER ALPHA WITH PSILI AND PERISPOMENI AND PROSGEGRAMMENI
1F8F; 1F87; 1F8F; 1F0F 0399; # GREEK CAPITAL LETTER ALPHA WITH DASIA AND PERISPOMENI AND PROSGEGRAMMENI
1F90; 1F90; 1F98; 1F28 0399; # GREEK SMALL LETTER ETA WITH PSILI AND YPOGEGRAMMENI
1F91; 1F91; 1F99; 1F29 0399; # GREEK SMALL LETTER ETA WITH DASIA AND YPOGEGRAMMENI
1F92; 1F92; 1F9A; 1F2A 0399; # GREEK SMALL LETTER ETA WITH PSILI AND VARIA AND YPOGEGRAMMENI
1F93; 1F93; 1F9B; 1F2B 0399; # GREEK SMALL LETTER ETA WITH DASIA AND VARIA AND YPOGEGRAMMENI
1F94; 1F94; 1F9C; 1F2C 0399; # GREEK SMALL LETTER ETA WITH PSILI AND OXIA AND YPOGEGRAMMENI
1F95; 1F95; 1F9D; 1F2D 0399; # GREEK SMALL LETTER ETA WITH DASIA AND OXIA AND YPOGEGRAMMENI
1F96; 1F96; 1F9E; 1F2E 0399; # GREEK SMALL LETTER ETA WITH PSILI AND PERISPOMENI AND YPOGEGRAMMENI
1F97; 1F97; 1F9F; 1F2F 0399; # GREEK SMALL LETTER ETA WITH DASIA AND PERISPOMENI AND YPOGEGRAMMENI
1F98; 1F90; 1F98; 1F28 0399; # GREEK CAPITAL LETTER ETA WITH PSILI AND PROSGEGRAMMENI
1F99; 1F91; 1F99; 1F29 0399; # GREEK CAPITAL LETTER ETA WITH DASIA AND PROSGEGRAMMENI
1F9A; 1F92; 1F9A; 1F2A 0399; # GREEK CAPITAL LETTER ETA WITH PSILI AND VARIA AND PROSGEGRAMMENI
1F9B; 1F93; 1F9B; 1F2B 0399; # GREEK CAPITAL LETTER ETA WITH DASIA AND VARIA AND PROSGEGRAMMENI
1F9C; 1F94; 1F9C; 1F2C 0399; # GREEK CAPITAL LETTER ETA WITH PSILI AND OXIA AND PROSGEGRAMMENI
1F9D; 1F95; 1F9D; 1F2D 0399; # GREEK CAPITAL LETTER ETA WITH DASIA AND OXIA AND PROSGEGRAMMENI
1F9E; 1F96; 1F9E; 1F2E 0399; # GREEK CAPITAL LETTER ETA WITH PSILI AND PERISPOMENI AND PROSGEGRAMMENI
1F9F; 1F97; 1F9F; 1F2F 0399; # GREEK CAPITAL LETTER ETA WITH DASIA AND PERISPOMENI AND PROSGEGRAMMENI
1FA0; 1FA0; 1FA8; 1F68 0399; # GREEK SMALL LETTER OMEGA WITH PSILI AND YPOGEGRAMMENI
1FA1; 1FA1; 1FA9; 1F69 0399; # GREEK SMALL LETTER OMEGA WITH DASIA AND YPOGEGRAMMENI
1FA2; 1FA2; 1FAA; 1F6A 0399; # GREEK SMALL LETTER OMEGA WITH PSILI AND VARIA AND YPOGEGRAMMENI
1FA3; 1FA3; 1FAB; 1F6B 0399; # GREEK SMALL LETTER OMEGA WITH DASIA AND VARIA AND YPOGEGRAMMENI
1FA4; 1FA4; 1FAC; 1F6C 0399; # GREEK SMALL LETTER OMEGA WITH PSILI AND OXIA AND YPOGEGRAMMENI
1FA5; 1FA5; 1FAD; 1F6D 0399; # GREEK SMALL LETTER OMEGA WITH DASIA AND OXIA AND YPOGEGRAMMENI
1FA6; 1FA6; 1FAE; 1F6E 0399; # GREEK SMALL LETTER OMEGA WITH PSILI AND PERISPOMENI AND YPOGEGRAMMENI
1FA7; 1FA7; 1FAF; 1F6F 0399; # GREEK SMALL LETTER OMEGA WITH DASIA AND PERISPOMENI AND YPOGEGRAMMENI
1FA8; 1FA0; 1FA8; 1F68 0399; # GREEK CAPITAL LETTER OMEGA WITH PSILI AND PROSGEGRAMMENI
1FA9; 1FA1; 1FA9; 1F69 0399; # GREEK CAPITAL LETTER OMEGA WITH DASIA AND PROSGEGRAMMENI
1FAA; 1FA2; 1FAA; 1F6A 0399; # GREEK CAPITAL LETTER OMEGA WITH PSILI AND VARIA AND PROSGEGRAMMENI
1FAB; 1FA3; 1FAB; 1F6B 0399; # GREEK CAPITAL LETTER OMEGA WITH DASIA AND VARIA AND PROSGEGRAMMENI
1FAC; 1FA4; 1FAC; 1F6C 0399; # GREEK CAPITAL LETTER OMEGA WITH PSILI AND OXIA AND PROSGEGRAMMENI
1FAD; 1FA5; 1FAD; 1F6D 0399; # GREEK CAPITAL LETTER OMEGA WITH DASIA AND OXIA AND PROSGEGRAMMENI
1FAE; 1FA6; 1FAE; 1F6E 0399; # GREEK CAPITAL LETTER OMEGA WITH PSILI AND PERISPOMENI AND PROSGEGRAMMENI
1FAF; 1FA7; 1FAF; 1F6F 0399; # GREEK CAPITAL LETTER OMEGA WITH DASIA AND PERISPOMENI AND PROSGEGRAMMENI
1FB3; 1FB3; 1FBC; 0391 0399; # GREEK SMALL LETTER ALPHA WITH YPOGEGRAMMENI
1FBC; 1FB3; 1FBC; 0391 0399; # GREEK CAPITAL LETTER ALPHA WITH PROSGEGRAMMENI
1FC3; 1FC3; 1FCC; 0397 0399; # GREEK SMALL LETTER ETA WITH YPOGEGRAMMENI
1FCC; 1FC3; 1FCC; 0397 0399; # GREEK CAPITAL LETTER ETA WITH PROSGEGRAMMENI
1FF3; 1FF3; 1FFC; 03A9 0399; # GREEK SMALL LETTER OMEGA WITH YPOGEGRAMMENI
1FFC; 1FF3; 1FFC; 03A9 0399; # GREEK CAPITAL LETTER OMEGA WITH PROSGEGRAMMENI
# Some characters with YPOGEGRAMMENI also have no corresponding titlecases
1FB2; 1FB2; 1FBA 0345; 1FBA 0399; # GREEK SMALL LETTER ALPHA WITH VARIA AND YPOGEGRAMMENI
1FB4; 1FB4; 0386 0345; 0386 0399; # GREEK SMALL LETTER ALPHA WITH OXIA AND YPOGEGRAMMENI
1FC2; 1FC2; 1FCA 0345; 1FCA 0399; # GREEK SMALL LETTER ETA WITH VARIA AND YPOGEGRAMMENI
1FC4; 1FC4; 0389 0345; 0389 0399; # GREEK SMALL LETTER ETA WITH OXIA AND YPOGEGRAMMENI
1FF2; 1FF2; 1FFA 0345; 1FFA 0399; # GREEK SMALL LETTER OMEGA WITH VARIA AND YPOGEGRAMMENI
1FF4; 1FF4; 038F 0345; 038F 0399; # GREEK SMALL LETTER OMEGA WITH OXIA AND YPOGEGRAMMENI
1FB7; 1FB7; 0391 0342 0345; 0391 0342 0399; # GREEK SMALL LETTER ALPHA WITH PERISPOMENI AND YPOGEGRAMMENI
1FC7; 1FC7; 0397 0342 0345; 0397 0342 0399; # GREEK SMALL LETTER ETA WITH PERISPOMENI AND YPOGEGRAMMENI
1FF7; 1FF7; 03A9 0342 0345; 03A9 0342 0399; # GREEK SMALL LETTER OMEGA WITH PERISPOMENI AND YPOGEGRAMMENI
# ================================================================================
# Conditional mappings
# ================================================================================
# Special case for final form of sigma
03A3; 03C2; 03A3; 03A3; Final_Sigma; # GREEK CAPITAL LETTER SIGMA
# Note: the following cases for non-final are already in the UnicodeData file.
# 03A3; 03C3; 03A3; 03A3; # GREEK CAPITAL LETTER SIGMA
# 03C3; 03C3; 03A3; 03A3; # GREEK SMALL LETTER SIGMA
# 03C2; 03C2; 03A3; 03A3; # GREEK SMALL LETTER FINAL SIGMA
# Note: the following cases are not included, since they would case-fold in lowercasing
# 03C3; 03C2; 03A3; 03A3; Final_Sigma; # GREEK SMALL LETTER SIGMA
# 03C2; 03C3; 03A3; 03A3; Not_Final_Sigma; # GREEK SMALL LETTER FINAL SIGMA
# ================================================================================
# Locale-sensitive mappings
# ================================================================================
# Lithuanian
# Lithuanian retains the dot in a lowercase i when followed by accents.
# Remove DOT ABOVE after "i" with upper or titlecase
0307; 0307; ; ; lt After_Soft_Dotted; # COMBINING DOT ABOVE
# Introduce an explicit dot above when lowercasing capital I's and J's
# whenever there are more accents above.
# (of the accents used in Lithuanian: grave, acute, tilde above, and ogonek)
0049; 0069 0307; 0049; 0049; lt More_Above; # LATIN CAPITAL LETTER I
004A; 006A 0307; 004A; 004A; lt More_Above; # LATIN CAPITAL LETTER J
012E; 012F 0307; 012E; 012E; lt More_Above; # LATIN CAPITAL LETTER I WITH OGONEK
00CC; 0069 0307 0300; 00CC; 00CC; lt; # LATIN CAPITAL LETTER I WITH GRAVE
00CD; 0069 0307 0301; 00CD; 00CD; lt; # LATIN CAPITAL LETTER I WITH ACUTE
0128; 0069 0307 0303; 0128; 0128; lt; # LATIN CAPITAL LETTER I WITH TILDE
# ================================================================================
# Turkish and Azeri
# I and i-dotless; I-dot and i are case pairs in Turkish and Azeri
# The following rules handle those cases.
0130; 0069; 0130; 0130; tr; # LATIN CAPITAL LETTER I WITH DOT ABOVE
0130; 0069; 0130; 0130; az; # LATIN CAPITAL LETTER I WITH DOT ABOVE
# When lowercasing, remove dot_above in the sequence I + dot_above, which will turn into i.
# This matches the behavior of the canonically equivalent I-dot_above
0307; ; 0307; 0307; tr After_I; # COMBINING DOT ABOVE
0307; ; 0307; 0307; az After_I; # COMBINING DOT ABOVE
# When lowercasing, unless an I is before a dot_above, it turns into a dotless i.
0049; 0131; 0049; 0049; tr Not_Before_Dot; # LATIN CAPITAL LETTER I
0049; 0131; 0049; 0049; az Not_Before_Dot; # LATIN CAPITAL LETTER I
# When uppercasing, i turns into a dotted capital I
0069; 0069; 0130; 0130; tr; # LATIN SMALL LETTER I
0069; 0069; 0130; 0130; az; # LATIN SMALL LETTER I
# Note: the following case is already in the UnicodeData file.
# 0131; 0131; 0049; 0049; tr; # LATIN SMALL LETTER DOTLESS I
# EOF

View File

@ -0,0 +1,131 @@
# StandardizedVariants-4.1.0.txt
# Date: 2006-01-16, 13:03:00 PST [KW]
#
# Specification of the variant sequences that are defined in the
# Unicode Standard.
#
# This file is a normative contributory data file in the
# Unicode Character Database.
#
# Copyright (c) 1991-2006 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
#
# Warning: Only the variation sequences specifically defined in this file
# are sanctioned for standard use. In all other cases the variation selector
# cannot change the visual appearance of the preceding base character from
# what it would have had in the absence of the variation selector.
#
# For more information, see Section 16.4, Variation Selectors,
# in The Unicode Standard, Version 5.0.
#
# Format:
# Field 0: the variation sequence
# Field 1: the description of the desired appearance
# Field 2: where the appearance is only different in particular shaping environments
# this field lists them. The possible values are: isolate, initial, medial, final.
# If more than one is present, there are spaces between them.
# =============================
# Mathematical
2229 FE00; with serifs; # INTERSECTION
222A FE00; with serifs; # UNION
2268 FE00; with vertical stroke; # LESS-THAN BUT NOT EQUAL TO
2269 FE00; with vertical stroke; # GREATER-THAN BUT NOT EQUAL TO
2272 FE00; following the slant of the lower leg; # LESS-THAN OR EQUIVALENT TO
2273 FE00; following the slant of the lower leg; # GREATER-THAN OR EQUIVALENT TO
#2278 FE00; with vertical stroke; # NEITHER LESS-THAN NOR GREATER-THAN
#2279 FE00; with vertical stroke; # NEITHER GREATER-THAN NOR LESS-THAN
228A FE00; with stroke through bottom members; # SUBSET OF WITH NOT EQUAL TO
228B FE00; with stroke through bottom members; # SUPERSET OF WITH NOT EQUAL TO
2293 FE00; with serifs; # SQUARE CAP
2294 FE00; with serifs; # SQUARE CUP
2295 FE00; with white rim; # CIRCLED PLUS
2297 FE00; with white rim; # CIRCLED TIMES
229C FE00; with equal sign touching the circle; # CIRCLED EQUALS
22DA FE00; with slanted equal; # LESS-THAN EQUAL TO OR GREATER-THAN
22DB FE00; with slanted equal; # GREATER-THAN EQUAL TO OR LESS-THAN
2A3C FE00; tall variant with narrow foot; # INTERIOR PRODUCT
2A3D FE00; tall variant with narrow foot; # RIGHTHAND INTERIOR PRODUCT
2A9D FE00; with similar following the slant of the upper leg; # SIMILAR OR LESS-THAN
2A9E FE00; with similar following the slant of the upper leg; # SIMILAR OR GREATER-THAN
2AAC FE00; with slanted equal; # SMALLER THAN OR EQUAL TO
2AAD FE00; with slanted equal; # LARGER THAN OR EQUAL TO
2ACB FE00; with stroke through bottom members; # SUBSET OF ABOVE NOT EQUAL TO
2ACC FE00; with stroke through bottom members; # SUPERSET OF ABOVE NOT EQUAL TO
# Phags-pa
A856 FE00; phags-pa letter reversed shaping small a; # PHAGS-PA LETTER SMALL A
A85C FE00; phags-pa letter reversed shaping ha; # PHAGS-PA LETTER HA
A85E FE00; phags-pa letter reversed shaping i; # PHAGS-PA LETTER I
A85F FE00; phags-pa letter reversed shaping u; # PHAGS-PA LETTER U
A860 FE00; phags-pa letter reversed shaping e; # PHAGS-PA LETTER E
A868 FE00; phags-pa letter reversed shaping subjoined ya; # PHAGS-PA SUBJOINED LETTER YA
# Mongolian
1820 180B; second form; isolate medial final # MONGOLIAN LETTER A
1820 180C; third form; medial # MONGOLIAN LETTER A
1821 180B; second form; initial final # MONGOLIAN LETTER E
1822 180B; second form; medial # MONGOLIAN LETTER I
1823 180B; second form; medial final # MONGOLIAN LETTER O
1824 180B; second form; medial # MONGOLIAN LETTER U
1825 180B; second form; medial final # MONGOLIAN LETTER OE
1825 180C; third form; medial # MONGOLIAN LETTER OE
1826 180B; second form; isolate medial final # MONGOLIAN LETTER UE
1826 180C; third form; medial # MONGOLIAN LETTER UE
1828 180B; second form; initial medial # MONGOLIAN LETTER NA
1828 180C; third form; medial # MONGOLIAN LETTER NA
1828 180D; separate form; medial # MONGOLIAN LETTER NA
182A 180B; alternative form; final # MONGOLIAN LETTER BA
182C 180B; second form; initial medial # MONGOLIAN LETTER QA
182C 180B; feminine second form; isolate # MONGOLIAN LETTER QA
182C 180C; third form; medial # MONGOLIAN LETTER QA
182C 180D; fourth form; medial # MONGOLIAN LETTER QA
182D 180B; second form; initial medial # MONGOLIAN LETTER GA
182D 180B; feminine form; final # MONGOLIAN LETTER GA
182D 180C; third form; medial # MONGOLIAN LETTER GA
182D 180D; feminine form; medial # MONGOLIAN LETTER GA
1830 180B; second form; final # MONGOLIAN LETTER SA
1830 180C; third form; final # MONGOLIAN LETTER SA
1832 180B; second form; medial # MONGOLIAN LETTER TA
1833 180B; second form; initial medial final # MONGOLIAN LETTER DA
1835 180B; second form; medial # MONGOLIAN LETTER JA
1836 180B; second form; initial medial # MONGOLIAN LETTER YA
1836 180C; third form; medial # MONGOLIAN LETTER YA
1838 180B; second form; final # MONGOLIAN LETTER WA
1844 180B; second form; medial # MONGOLIAN LETTER TODO E
1845 180B; second form; medial # MONGOLIAN LETTER TODO I
1846 180B; second form; medial # MONGOLIAN LETTER TODO O
1847 180B; second form; isolate medial final # MONGOLIAN LETTER TODO U
1847 180C; third form; medial # MONGOLIAN LETTER TODO U
1848 180B; second form; medial # MONGOLIAN LETTER TODO OE
1849 180B; second form; isolate medial # MONGOLIAN LETTER TODO UE
184D 180B; feminine form; initial medial # MONGOLIAN LETTER TODO QA
184E 180B; second form; medial # MONGOLIAN LETTER TODO GA
185D 180B; second form; medial final # MONGOLIAN LETTER SIBE E
185E 180B; second form; medial final # MONGOLIAN LETTER SIBE I
185E 180C; third form; medial final # MONGOLIAN LETTER SIBE I
1860 180B; second form; medial final # MONGOLIAN LETTER SIBE UE
1863 180B; second form; medial # MONGOLIAN LETTER SIBE KA
1868 180B; second form; initial medial # MONGOLIAN LETTER SIBE TA
1868 180C; third form; medial # MONGOLIAN LETTER SIBE TA
1869 180B; second form; initial medial # MONGOLIAN LETTER SIBE DA
186F 180B; second form; initial medial # MONGOLIAN LETTER SIBE ZA
1873 180B; second form; medial final # MONGOLIAN LETTER MANCHU I
1873 180C; third form; medial final # MONGOLIAN LETTER MANCHU I
1873 180D; fourth form; medial # MONGOLIAN LETTER MANCHU I
1874 180B; second form; medial # MONGOLIAN LETTER MANCHU KA
1874 180B; feminine first final form; final # MONGOLIAN LETTER MANCHU KA
1874 180C; feminine first medial form; medial # MONGOLIAN LETTER MANCHU KA
1874 180C; feminine second final form; final # MONGOLIAN LETTER MANCHU KA
1874 180D; feminine second medial form; medial # MONGOLIAN LETTER MANCHU KA
1876 180B; second form; initial medial # MONGOLIAN LETTER MANCHU FA
1880 180B; second form; # MONGOLIAN LETTER ALI GALI ANUSVARA ONE
1881 180B; second form; # MONGOLIAN LETTER ALI GALI VISARGA ONE
1887 180B; second form; isolate final # MONGOLIAN LETTER ALI GALI A
1887 180C; third form; final # MONGOLIAN LETTER ALI GALI A
1887 180D; fourth form; final # MONGOLIAN LETTER ALI GALI A
1888 180B; second form; final # MONGOLIAN LETTER ALI GALI I
188A 180B; second form; initial medial # MONGOLIAN LETTER ALI GALI NGA

File diff suppressed because it is too large Load Diff

129
src/unicode/extract-categories.ss Executable file
View File

@ -0,0 +1,129 @@
#!/usr/bin/env ikarus --r6rs-script
(import (ikarus))
(define (read-line)
  ;;; Reads characters from the current input port up to the next
  ;;; newline and returns them as a string (newline not included).
  ;;; Empty lines are skipped.  Returns the eof object when the port
  ;;; is exhausted before any character of a line has been read; a
  ;;; final line without a trailing newline is still returned.
  (let f ([ac '()])   ; ac = characters of the current line, reversed
    (let ([x (read-char)])
      (cond
        [(eof-object? x)
         (if (null? ac)
             (eof-object)
             (list->string (reverse ac)))]
        [(char=? x #\newline)
         ;; An empty line restarts the loop with a fresh accumulator.
         ;; The loop takes exactly one argument, so it must be passed
         ;; explicitly (calling it with none is an arity error).
         (if (null? ac)
             (f '())
             (list->string (reverse ac)))]
        [else (f (cons x ac))]))))
(define (find-semi str i n)
  ;;; Returns the index of the first #\; in str at or after index i,
  ;;; or n if no semicolon is found before index n.
  (let scan ([pos i])
    (if (and (not (fx= pos n))
             (not (char=? (string-ref str pos) #\;)))
        (scan (+ pos 1))
        pos)))
(define (split str)
  ;;; Splits str at every #\; and returns the list of fields in order.
  ;;; An empty string yields the empty list, and a semicolon at the
  ;;; very end of str does not produce a trailing empty field
  ;;; ("a;" => ("a")), while interior and leading empty fields are
  ;;; kept (";a" => ("" "a")).
  (let ([len (string-length str)])
    (let loop ([start 0])
      (if (= start len)
          '()
          (let* ([semi (find-semi str start len)]
                 [field (substring str start semi)])
            (if (= semi len)
                (list field)
                (cons field (loop (+ semi 1)))))))))
(define (extract-uni-data)
  ;;; Reads UnicodeData-style lines from the current input port and
  ;;; returns a list of (code-point . category) pairs in file order.
  ;;; Field 0 of each line is the code point in hexadecimal, field 1
  ;;; is the character name and field 2 is the general category,
  ;;; which is returned as a symbol.
  ;;;
  ;;; Large blocks are listed in the data file as only two lines whose
  ;;; names look like "<..., First>" and "<..., Last>".  Every code
  ;;; point between such a pair is given the category of the pair, so
  ;;; the whole range is reported rather than just its two endpoints.
  (define (ends-with? str suffix)
    (let ([n (string-length str)]
          [k (string-length suffix)])
      (and (>= n k)
           (string=? (substring str (- n k) n) suffix))))
  (define (parse-hex digits)
    (read (open-input-string (format "#x~a" digits))))
  ;; ls          = pairs collected so far, most recent first
  ;; range-start = code point of a pending "First" line, or #f
  (let f ([ls '()] [range-start #f])
    (let ([line (read-line)])
      (cond
        [(eof-object? line)
         (reverse ls)]
        [else
         (let* ([fields (split line)]
                [code (parse-hex (car fields))]
                [name (cadr fields)]
                [cat (string->symbol (caddr fields))])
           (cond
             [(and range-start (ends-with? name ", Last>"))
              ;; The "First" code point is already in ls; add the
              ;; interior and the "Last" code point itself.
              (let fill ([i (+ range-start 1)] [ls ls])
                (if (> i code)
                    (f ls #f)
                    (fill (+ i 1) (cons (cons i cat) ls))))]
             [else
              (f (cons (cons code cat) ls)
                 (and (ends-with? name ", First>") code))]))]))))
(define (codes-in-cats ls cats)
  ;;; ls is a list of (code . category) pairs and cats a list of
  ;;; category symbols.  Returns, in their original order, the codes
  ;;; whose category is a member (by memq) of cats.
  (let loop ([pairs ls] [kept '()])
    (if (null? pairs)
        (reverse kept)
        (let ([entry (car pairs)])
          (loop (cdr pairs)
                (if (memq (cdr entry) cats)
                    (cons (car entry) kept)
                    kept))))))
(define (make-xonxoff ls)
  ;;; Turns ls, a list of "on" indices, into a list of the points
  ;;; where the on/off state changes.  The result always starts with
  ;;; 0 (state: off); each later element is an index at which the
  ;;; state flips, so elements at odd positions start an "on" run and
  ;;; elements at even positions start an "off" run.  To classify an
  ;;; index that is not in the list, look at the closest entry before
  ;;; it.  Index 0 itself cannot be "on": an error is raised if ls
  ;;; starts with 0.
  (let ([codes (if (= (car ls) 0)
                   (error 'make-xonxoff "first is on")
                   ls)])
    (cons 0
      ;; pos walks upward from 1; was-on? is the state of pos - 1.
      (let walk ([pos 1] [was-on? #f] [rest codes])
        (if (null? rest)
            ;; every "on" index is consumed: close the final run
            (list pos)
            (let* ([now-on? (= pos (car rest))]
                   [remaining (if now-on? (cdr rest) rest)])
              ;; record pos only when the state changes at pos
              (if (eq? now-on? was-on?)
                  (walk (+ pos 1) now-on? remaining)
                  (cons pos (walk (+ pos 1) now-on? remaining)))))))))
;;; True when the lowest bit of the fixnum n is set.
(define (odd? n)
  (not (= (fxlogand n 1) 0)))
(define (search-on? n v)
  ;;; Binary search over the vector v for the last position whose
  ;;; element is <= n; the result is #t when that position is odd.
  ;;; With a vector built from make-xonxoff, odd positions start an
  ;;; "on" run, so this answers whether n is "on".
  (let loop ([lo 0] [hi (- (vector-length v) 1)])
    (if (fx= lo hi)
        (odd? lo)
        ;; round the midpoint up so that (loop mid hi) always shrinks
        ;; the interval
        (let ([mid (fxsra (+ lo hi 1) 1)])
          (if (<= (vector-ref v mid) n)
              (loop mid hi)
              (loop lo (- mid 1)))))))
(define (verify vec ls)
  ;;; Cross-checks the transition vector vec against ls, the ascending
  ;;; list of indices it was built from: for every index from 0
  ;;; through #x10FFFF, search-on? must report #t exactly when the
  ;;; index appears in ls.  Raises an error naming the first index
  ;;; that disagrees.
  (let loop ([code 0] [pending ls])
    (when (<= code #x10FFFF)
      (let* ([expected (and (pair? pending) (= code (car pending)))]
             [pending (if expected (cdr pending) pending)])
        (unless (equal? expected (search-on? code vec))
          (error #f "did not pass on ~s" code))
        (loop (+ code 1) pending)))))
;;; Driver: read the character database, keep the code points whose
;;; general category is in the list below, build and verify the
;;; transition vector, then write it out as a Scheme definition.
(let* ([ls (with-input-from-file
             "UNIDATA/UnicodeData.txt"
             extract-uni-data)]
       [wanted
        (codes-in-cats ls
          '(Lu Ll Lt Lm Lo Mn Mc Me Nd Nl No Pd Pc Po Sc Sm Sk So Co))]
       [xonxoff (list->vector (make-xonxoff wanted))]
       [write-table
        (lambda ()
          (printf ";;; DO NOT EDIT\n")
          (printf ";;; automatically generated\n")
          (printf ";;; ~s elements in vector\n\n" (vector-length xonxoff))
          (pretty-print
            `(define unicode-constituents-vector ',xonxoff)))])
  ;; refuse to write a table that does not reproduce its input
  (verify xonxoff wanted)
  (with-output-to-file "unicode-constituents.ss" write-table 'replace))
(printf "Happy Happy Joy Joy\n")

View File

@ -0,0 +1,75 @@
;;; DO NOT EDIT
;;; automatically generated
;;; 947 elements in vector
(define unicode-constituents-vector
'#(0 33 40 42 91 92 93 94 123 124 125 126 127 161 171 172 173 174 187 188 880
884 886 890 895 900 907 908 909 910 930 931 975 976 1159 1160 1300 1329
1367 1369 1376 1377 1416 1417 1419 1425 1480 1488 1515 1520 1525 1547 1558
1563 1564 1566 1568 1569 1595 1600 1631 1632 1757 1758 1806 1808 1867 1869
1902 1920 1970 1984 2043 2305 2362 2364 2382 2384 2389 2392 2417 2427 2432
2433 2436 2437 2445 2447 2449 2451 2473 2474 2481 2482 2483 2486 2490 2492
2501 2503 2505 2507 2511 2519 2520 2524 2526 2527 2532 2534 2555 2561 2564
2565 2571 2575 2577 2579 2601 2602 2609 2610 2612 2613 2615 2616 2618 2620
2621 2622 2627 2631 2633 2635 2638 2649 2653 2654 2655 2662 2677 2689 2692
2693 2702 2703 2706 2707 2729 2730 2737 2738 2740 2741 2746 2748 2758 2759
2762 2763 2766 2768 2769 2784 2788 2790 2800 2801 2802 2817 2820 2821 2829
2831 2833 2835 2857 2858 2865 2866 2868 2869 2874 2876 2884 2887 2889 2891
2894 2902 2904 2908 2910 2911 2914 2918 2930 2946 2948 2949 2955 2958 2961
2962 2966 2969 2971 2972 2973 2974 2976 2979 2981 2984 2987 2990 3002 3006
3011 3014 3017 3018 3022 3031 3032 3046 3067 3073 3076 3077 3085 3086 3089
3090 3113 3114 3124 3125 3130 3134 3141 3142 3145 3146 3150 3157 3159 3168
3170 3174 3184 3202 3204 3205 3213 3214 3217 3218 3241 3242 3252 3253 3258
3260 3269 3270 3273 3274 3278 3285 3287 3294 3295 3296 3300 3302 3312 3313
3315 3330 3332 3333 3341 3342 3345 3346 3369 3370 3386 3390 3396 3398 3401
3402 3406 3415 3416 3424 3426 3430 3440 3458 3460 3461 3479 3482 3506 3507
3516 3517 3518 3520 3527 3530 3531 3535 3541 3542 3543 3544 3552 3570 3573
3585 3643 3647 3676 3713 3715 3716 3717 3719 3721 3722 3723 3725 3726 3732
3736 3737 3744 3745 3748 3749 3750 3751 3752 3754 3756 3757 3770 3771 3774
3776 3781 3782 3783 3784 3790 3792 3802 3804 3806 3840 3898 3902 3912 3913
3947 3953 3980 3984 3992 3993 4029 4030 4045 4047 4050 4096 4130 4131 4136
4137 4139 4140 4147 4150 4154 4160 4186 4256 4294 4304 4349 4352 4442 4447
4515 4520 4602 4608 4681 4682 4686 4688 4695 4696 4697 4698 4702 4704 4745
4746 4750 4752 4785 4786 4790 4792 4799 4800 4801 4802 4806 4808 4823 4824
4881 4882 4886 4888 4955 4959 4989 4992 5018 5024 5109 5121 5751 5761 5787
5792 5873 5888 5901 5902 5909 5920 5943 5952 5972 5984 5997 5998 6001 6002
6004 6016 6068 6070 6110 6112 6122 6128 6138 6144 6158 6160 6170 6176 6264
6272 6314 6400 6429 6432 6444 6448 6460 6464 6465 6468 6510 6512 6517 6528
6570 6576 6602 6608 6618 6622 6684 6686 6688 6912 6988 6992 7037 7424 7627
7678 7836 7840 7930 7936 7958 7960 7966 7968 8006 8008 8014 8016 8024 8025
8026 8027 8028 8029 8030 8031 8062 8064 8117 8118 8133 8134 8148 8150 8156
8157 8176 8178 8181 8182 8191 8208 8216 8224 8232 8240 8249 8251 8261 8263
8287 8304 8306 8308 8317 8319 8333 8336 8341 8352 8374 8400 8432 8448 8527
8531 8581 8592 9001 9003 9192 9216 9255 9280 9291 9312 9885 9888 9907 9985
9989 9990 9994 9996 10024 10025 10060 10061 10062 10063 10067 10070 10071
10072 10079 10081 10088 10102 10133 10136 10160 10161 10175 10176 10181
10183 10187 10192 10214 10224 10627 10649 10712 10716 10748 10750 11035
11040 11044 11264 11311 11312 11359 11360 11373 11380 11384 11392 11499
11513 11558 11568 11622 11631 11632 11648 11671 11680 11687 11688 11695
11696 11703 11704 11711 11712 11719 11720 11727 11728 11735 11736 11743
11776 11778 11782 11785 11787 11788 11790 11800 11904 11930 11931 12020
12032 12246 12272 12284 12289 12296 12306 12308 12316 12317 12320 12352
12353 12439 12441 12544 12549 12589 12593 12687 12688 12728 12736 12752
12784 12831 12832 12868 12880 13055 13056 13313 19893 19894 19904 19969
40891 40892 40960 42125 42128 42183 42752 42779 42784 42786 43008 43052
43072 43128 44032 44033 55203 55204 57344 57345 63743 64046 64048 64107
64112 64218 64256 64263 64275 64280 64285 64311 64312 64317 64318 64319
64320 64322 64323 64325 64326 64434 64467 64830 64848 64912 64914 64968
65008 65022 65024 65047 65049 65050 65056 65060 65072 65077 65093 65095
65097 65107 65108 65113 65119 65127 65128 65132 65136 65141 65142 65277
65281 65288 65290 65339 65340 65341 65342 65371 65372 65373 65374 65375
65377 65378 65380 65471 65474 65480 65482 65488 65490 65496 65498 65501
65504 65511 65512 65519 65532 65534 65536 65548 65549 65575 65576 65595
65596 65598 65599 65614 65616 65630 65664 65787 65792 65795 65799 65844
65847 65931 66304 66335 66336 66340 66352 66379 66432 66462 66463 66500
66504 66518 66560 66718 66720 66730 67584 67590 67592 67593 67594 67638
67639 67641 67644 67645 67647 67648 67840 67866 67871 67872 68096 68100
68101 68103 68108 68116 68117 68120 68121 68148 68152 68155 68159 68168
68176 68185 73728 74607 74752 74851 74864 74868 118784 119030 119040 119079
119082 119155 119163 119262 119296 119366 119552 119639 119648 119666
119808 119893 119894 119965 119966 119968 119970 119971 119973 119975
119977 119981 119982 119994 119995 119996 119997 120004 120005 120070
120071 120075 120077 120085 120086 120093 120094 120122 120123 120127
120128 120133 120134 120135 120138 120145 120146 120486 120488 120780
120782 120832 131072 131073 173782 173783 194560 195102 917760 918000
983040 983041 1048573 1048574 1048576 1048577 1114109 1114110))