You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@lucene.apache.org by ab...@apache.org on 2017/04/03 18:45:44 UTC
[38/52] [abbrv] lucene-solr:jira/solr-9959: SOLR-7383: Replace DIH
'rss' example with 'atom' rss example was broken for multiple reasons. atom
example showcases the same - and more - features and uses the smallest config
file needed to make it work.
http://git-wip-us.apache.org/repos/asf/lucene-solr/blob/580f6e98/solr/example/example-DIH/solr/rss/conf/mapping-FoldToASCII.txt
----------------------------------------------------------------------
diff --git a/solr/example/example-DIH/solr/rss/conf/mapping-FoldToASCII.txt b/solr/example/example-DIH/solr/rss/conf/mapping-FoldToASCII.txt
deleted file mode 100644
index 9a84b6e..0000000
--- a/solr/example/example-DIH/solr/rss/conf/mapping-FoldToASCII.txt
+++ /dev/null
@@ -1,3813 +0,0 @@
-# The ASF licenses this file to You under the Apache License, Version 2.0
-# (the "License"); you may not use this file except in compliance with
-# the License. You may obtain a copy of the License at
-#
-# http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-
-# This map converts alphabetic, numeric, and symbolic Unicode characters
-# which are not in the first 127 ASCII characters (the "Basic Latin" Unicode
-# block) into their ASCII equivalents, if one exists.
-#
-# Characters from the following Unicode blocks are converted; however, only
-# those characters with reasonable ASCII alternatives are converted:
-#
-# - C1 Controls and Latin-1 Supplement: http://www.unicode.org/charts/PDF/U0080.pdf
-# - Latin Extended-A: http://www.unicode.org/charts/PDF/U0100.pdf
-# - Latin Extended-B: http://www.unicode.org/charts/PDF/U0180.pdf
-# - Latin Extended Additional: http://www.unicode.org/charts/PDF/U1E00.pdf
-# - Latin Extended-C: http://www.unicode.org/charts/PDF/U2C60.pdf
-# - Latin Extended-D: http://www.unicode.org/charts/PDF/UA720.pdf
-# - IPA Extensions: http://www.unicode.org/charts/PDF/U0250.pdf
-# - Phonetic Extensions: http://www.unicode.org/charts/PDF/U1D00.pdf
-# - Phonetic Extensions Supplement: http://www.unicode.org/charts/PDF/U1D80.pdf
-# - General Punctuation: http://www.unicode.org/charts/PDF/U2000.pdf
-# - Superscripts and Subscripts: http://www.unicode.org/charts/PDF/U2070.pdf
-# - Enclosed Alphanumerics: http://www.unicode.org/charts/PDF/U2460.pdf
-# - Dingbats: http://www.unicode.org/charts/PDF/U2700.pdf
-# - Supplemental Punctuation: http://www.unicode.org/charts/PDF/U2E00.pdf
-# - Alphabetic Presentation Forms: http://www.unicode.org/charts/PDF/UFB00.pdf
-# - Halfwidth and Fullwidth Forms: http://www.unicode.org/charts/PDF/UFF00.pdf
-#
-# See: http://en.wikipedia.org/wiki/Latin_characters_in_Unicode
-#
-# The set of character conversions supported by this map is a superset of
-# those supported by the map represented by mapping-ISOLatin1Accent.txt.
-#
-# See the bottom of this file for the Perl script used to generate the contents
-# of this file (without this header) from ASCIIFoldingFilter.java.
-
-
-# Syntax:
-# "source" => "target"
-# "source".length() > 0 (source cannot be empty.)
-# "target".length() >= 0 (target can be empty.)
-
-
-# � [LATIN CAPITAL LETTER A WITH GRAVE]
-"\u00C0" => "A"
-
-# � [LATIN CAPITAL LETTER A WITH ACUTE]
-"\u00C1" => "A"
-
-# � [LATIN CAPITAL LETTER A WITH CIRCUMFLEX]
-"\u00C2" => "A"
-
-# � [LATIN CAPITAL LETTER A WITH TILDE]
-"\u00C3" => "A"
-
-# � [LATIN CAPITAL LETTER A WITH DIAERESIS]
-"\u00C4" => "A"
-
-# � [LATIN CAPITAL LETTER A WITH RING ABOVE]
-"\u00C5" => "A"
-
-# \u0100 [LATIN CAPITAL LETTER A WITH MACRON]
-"\u0100" => "A"
-
-# \u0102 [LATIN CAPITAL LETTER A WITH BREVE]
-"\u0102" => "A"
-
-# \u0104 [LATIN CAPITAL LETTER A WITH OGONEK]
-"\u0104" => "A"
-
-# \u018f http://en.wikipedia.org/wiki/Schwa [LATIN CAPITAL LETTER SCHWA]
-"\u018F" => "A"
-
-# \u01cd [LATIN CAPITAL LETTER A WITH CARON]
-"\u01CD" => "A"
-
-# \u01de [LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON]
-"\u01DE" => "A"
-
-# \u01e0 [LATIN CAPITAL LETTER A WITH DOT ABOVE AND MACRON]
-"\u01E0" => "A"
-
-# \u01fa [LATIN CAPITAL LETTER A WITH RING ABOVE AND ACUTE]
-"\u01FA" => "A"
-
-# \u0200 [LATIN CAPITAL LETTER A WITH DOUBLE GRAVE]
-"\u0200" => "A"
-
-# \u0202 [LATIN CAPITAL LETTER A WITH INVERTED BREVE]
-"\u0202" => "A"
-
-# \u0226 [LATIN CAPITAL LETTER A WITH DOT ABOVE]
-"\u0226" => "A"
-
-# \u023a [LATIN CAPITAL LETTER A WITH STROKE]
-"\u023A" => "A"
-
-# \u1d00 [LATIN LETTER SMALL CAPITAL A]
-"\u1D00" => "A"
-
-# \u1e00 [LATIN CAPITAL LETTER A WITH RING BELOW]
-"\u1E00" => "A"
-
-# \u1ea0 [LATIN CAPITAL LETTER A WITH DOT BELOW]
-"\u1EA0" => "A"
-
-# \u1ea2 [LATIN CAPITAL LETTER A WITH HOOK ABOVE]
-"\u1EA2" => "A"
-
-# \u1ea4 [LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND ACUTE]
-"\u1EA4" => "A"
-
-# \u1ea6 [LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND GRAVE]
-"\u1EA6" => "A"
-
-# \u1ea8 [LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND HOOK ABOVE]
-"\u1EA8" => "A"
-
-# \u1eaa [LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND TILDE]
-"\u1EAA" => "A"
-
-# \u1eac [LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND DOT BELOW]
-"\u1EAC" => "A"
-
-# \u1eae [LATIN CAPITAL LETTER A WITH BREVE AND ACUTE]
-"\u1EAE" => "A"
-
-# \u1eb0 [LATIN CAPITAL LETTER A WITH BREVE AND GRAVE]
-"\u1EB0" => "A"
-
-# \u1eb2 [LATIN CAPITAL LETTER A WITH BREVE AND HOOK ABOVE]
-"\u1EB2" => "A"
-
-# \u1eb4 [LATIN CAPITAL LETTER A WITH BREVE AND TILDE]
-"\u1EB4" => "A"
-
-# \u1eb6 [LATIN CAPITAL LETTER A WITH BREVE AND DOT BELOW]
-"\u1EB6" => "A"
-
-# \u24b6 [CIRCLED LATIN CAPITAL LETTER A]
-"\u24B6" => "A"
-
-# \uff21 [FULLWIDTH LATIN CAPITAL LETTER A]
-"\uFF21" => "A"
-
-# � [LATIN SMALL LETTER A WITH GRAVE]
-"\u00E0" => "a"
-
-# � [LATIN SMALL LETTER A WITH ACUTE]
-"\u00E1" => "a"
-
-# � [LATIN SMALL LETTER A WITH CIRCUMFLEX]
-"\u00E2" => "a"
-
-# � [LATIN SMALL LETTER A WITH TILDE]
-"\u00E3" => "a"
-
-# � [LATIN SMALL LETTER A WITH DIAERESIS]
-"\u00E4" => "a"
-
-# � [LATIN SMALL LETTER A WITH RING ABOVE]
-"\u00E5" => "a"
-
-# \u0101 [LATIN SMALL LETTER A WITH MACRON]
-"\u0101" => "a"
-
-# \u0103 [LATIN SMALL LETTER A WITH BREVE]
-"\u0103" => "a"
-
-# \u0105 [LATIN SMALL LETTER A WITH OGONEK]
-"\u0105" => "a"
-
-# \u01ce [LATIN SMALL LETTER A WITH CARON]
-"\u01CE" => "a"
-
-# \u01df [LATIN SMALL LETTER A WITH DIAERESIS AND MACRON]
-"\u01DF" => "a"
-
-# \u01e1 [LATIN SMALL LETTER A WITH DOT ABOVE AND MACRON]
-"\u01E1" => "a"
-
-# \u01fb [LATIN SMALL LETTER A WITH RING ABOVE AND ACUTE]
-"\u01FB" => "a"
-
-# \u0201 [LATIN SMALL LETTER A WITH DOUBLE GRAVE]
-"\u0201" => "a"
-
-# \u0203 [LATIN SMALL LETTER A WITH INVERTED BREVE]
-"\u0203" => "a"
-
-# \u0227 [LATIN SMALL LETTER A WITH DOT ABOVE]
-"\u0227" => "a"
-
-# \u0250 [LATIN SMALL LETTER TURNED A]
-"\u0250" => "a"
-
-# \u0259 [LATIN SMALL LETTER SCHWA]
-"\u0259" => "a"
-
-# \u025a [LATIN SMALL LETTER SCHWA WITH HOOK]
-"\u025A" => "a"
-
-# \u1d8f [LATIN SMALL LETTER A WITH RETROFLEX HOOK]
-"\u1D8F" => "a"
-
-# \u1d95 [LATIN SMALL LETTER SCHWA WITH RETROFLEX HOOK]
-"\u1D95" => "a"
-
-# \u1ea1 [LATIN SMALL LETTER A WITH RING BELOW]
-"\u1E01" => "a"
-
-# \u1ea3 [LATIN SMALL LETTER A WITH RIGHT HALF RING]
-"\u1E9A" => "a"
-
-# \u1ea1 [LATIN SMALL LETTER A WITH DOT BELOW]
-"\u1EA1" => "a"
-
-# \u1ea3 [LATIN SMALL LETTER A WITH HOOK ABOVE]
-"\u1EA3" => "a"
-
-# \u1ea5 [LATIN SMALL LETTER A WITH CIRCUMFLEX AND ACUTE]
-"\u1EA5" => "a"
-
-# \u1ea7 [LATIN SMALL LETTER A WITH CIRCUMFLEX AND GRAVE]
-"\u1EA7" => "a"
-
-# \u1ea9 [LATIN SMALL LETTER A WITH CIRCUMFLEX AND HOOK ABOVE]
-"\u1EA9" => "a"
-
-# \u1eab [LATIN SMALL LETTER A WITH CIRCUMFLEX AND TILDE]
-"\u1EAB" => "a"
-
-# \u1ead [LATIN SMALL LETTER A WITH CIRCUMFLEX AND DOT BELOW]
-"\u1EAD" => "a"
-
-# \u1eaf [LATIN SMALL LETTER A WITH BREVE AND ACUTE]
-"\u1EAF" => "a"
-
-# \u1eb1 [LATIN SMALL LETTER A WITH BREVE AND GRAVE]
-"\u1EB1" => "a"
-
-# \u1eb3 [LATIN SMALL LETTER A WITH BREVE AND HOOK ABOVE]
-"\u1EB3" => "a"
-
-# \u1eb5 [LATIN SMALL LETTER A WITH BREVE AND TILDE]
-"\u1EB5" => "a"
-
-# \u1eb7 [LATIN SMALL LETTER A WITH BREVE AND DOT BELOW]
-"\u1EB7" => "a"
-
-# \u2090 [LATIN SUBSCRIPT SMALL LETTER A]
-"\u2090" => "a"
-
-# \u2094 [LATIN SUBSCRIPT SMALL LETTER SCHWA]
-"\u2094" => "a"
-
-# \u24d0 [CIRCLED LATIN SMALL LETTER A]
-"\u24D0" => "a"
-
-# \u2c65 [LATIN SMALL LETTER A WITH STROKE]
-"\u2C65" => "a"
-
-# \u2c6f [LATIN CAPITAL LETTER TURNED A]
-"\u2C6F" => "a"
-
-# \uff41 [FULLWIDTH LATIN SMALL LETTER A]
-"\uFF41" => "a"
-
-# \ua732 [LATIN CAPITAL LETTER AA]
-"\uA732" => "AA"
-
-# � [LATIN CAPITAL LETTER AE]
-"\u00C6" => "AE"
-
-# \u01e2 [LATIN CAPITAL LETTER AE WITH MACRON]
-"\u01E2" => "AE"
-
-# \u01fc [LATIN CAPITAL LETTER AE WITH ACUTE]
-"\u01FC" => "AE"
-
-# \u1d01 [LATIN LETTER SMALL CAPITAL AE]
-"\u1D01" => "AE"
-
-# \ua734 [LATIN CAPITAL LETTER AO]
-"\uA734" => "AO"
-
-# \ua736 [LATIN CAPITAL LETTER AU]
-"\uA736" => "AU"
-
-# \ua738 [LATIN CAPITAL LETTER AV]
-"\uA738" => "AV"
-
-# \ua73a [LATIN CAPITAL LETTER AV WITH HORIZONTAL BAR]
-"\uA73A" => "AV"
-
-# \ua73c [LATIN CAPITAL LETTER AY]
-"\uA73C" => "AY"
-
-# \u249c [PARENTHESIZED LATIN SMALL LETTER A]
-"\u249C" => "(a)"
-
-# \ua733 [LATIN SMALL LETTER AA]
-"\uA733" => "aa"
-
-# � [LATIN SMALL LETTER AE]
-"\u00E6" => "ae"
-
-# \u01e3 [LATIN SMALL LETTER AE WITH MACRON]
-"\u01E3" => "ae"
-
-# \u01fd [LATIN SMALL LETTER AE WITH ACUTE]
-"\u01FD" => "ae"
-
-# \u1d02 [LATIN SMALL LETTER TURNED AE]
-"\u1D02" => "ae"
-
-# \ua735 [LATIN SMALL LETTER AO]
-"\uA735" => "ao"
-
-# \ua737 [LATIN SMALL LETTER AU]
-"\uA737" => "au"
-
-# \ua739 [LATIN SMALL LETTER AV]
-"\uA739" => "av"
-
-# \ua73b [LATIN SMALL LETTER AV WITH HORIZONTAL BAR]
-"\uA73B" => "av"
-
-# \ua73d [LATIN SMALL LETTER AY]
-"\uA73D" => "ay"
-
-# \u0181 [LATIN CAPITAL LETTER B WITH HOOK]
-"\u0181" => "B"
-
-# \u0182 [LATIN CAPITAL LETTER B WITH TOPBAR]
-"\u0182" => "B"
-
-# \u0243 [LATIN CAPITAL LETTER B WITH STROKE]
-"\u0243" => "B"
-
-# \u0299 [LATIN LETTER SMALL CAPITAL B]
-"\u0299" => "B"
-
-# \u1d03 [LATIN LETTER SMALL CAPITAL BARRED B]
-"\u1D03" => "B"
-
-# \u1e02 [LATIN CAPITAL LETTER B WITH DOT ABOVE]
-"\u1E02" => "B"
-
-# \u1e04 [LATIN CAPITAL LETTER B WITH DOT BELOW]
-"\u1E04" => "B"
-
-# \u1e06 [LATIN CAPITAL LETTER B WITH LINE BELOW]
-"\u1E06" => "B"
-
-# \u24b7 [CIRCLED LATIN CAPITAL LETTER B]
-"\u24B7" => "B"
-
-# \uff22 [FULLWIDTH LATIN CAPITAL LETTER B]
-"\uFF22" => "B"
-
-# \u0180 [LATIN SMALL LETTER B WITH STROKE]
-"\u0180" => "b"
-
-# \u0183 [LATIN SMALL LETTER B WITH TOPBAR]
-"\u0183" => "b"
-
-# \u0253 [LATIN SMALL LETTER B WITH HOOK]
-"\u0253" => "b"
-
-# \u1d6c [LATIN SMALL LETTER B WITH MIDDLE TILDE]
-"\u1D6C" => "b"
-
-# \u1d80 [LATIN SMALL LETTER B WITH PALATAL HOOK]
-"\u1D80" => "b"
-
-# \u1e03 [LATIN SMALL LETTER B WITH DOT ABOVE]
-"\u1E03" => "b"
-
-# \u1e05 [LATIN SMALL LETTER B WITH DOT BELOW]
-"\u1E05" => "b"
-
-# \u1e07 [LATIN SMALL LETTER B WITH LINE BELOW]
-"\u1E07" => "b"
-
-# \u24d1 [CIRCLED LATIN SMALL LETTER B]
-"\u24D1" => "b"
-
-# \uff42 [FULLWIDTH LATIN SMALL LETTER B]
-"\uFF42" => "b"
-
-# \u249d [PARENTHESIZED LATIN SMALL LETTER B]
-"\u249D" => "(b)"
-
-# � [LATIN CAPITAL LETTER C WITH CEDILLA]
-"\u00C7" => "C"
-
-# \u0106 [LATIN CAPITAL LETTER C WITH ACUTE]
-"\u0106" => "C"
-
-# \u0108 [LATIN CAPITAL LETTER C WITH CIRCUMFLEX]
-"\u0108" => "C"
-
-# \u010a [LATIN CAPITAL LETTER C WITH DOT ABOVE]
-"\u010A" => "C"
-
-# \u010c [LATIN CAPITAL LETTER C WITH CARON]
-"\u010C" => "C"
-
-# \u0187 [LATIN CAPITAL LETTER C WITH HOOK]
-"\u0187" => "C"
-
-# \u023b [LATIN CAPITAL LETTER C WITH STROKE]
-"\u023B" => "C"
-
-# \u0297 [LATIN LETTER STRETCHED C]
-"\u0297" => "C"
-
-# \u1d04 [LATIN LETTER SMALL CAPITAL C]
-"\u1D04" => "C"
-
-# \u1e08 [LATIN CAPITAL LETTER C WITH CEDILLA AND ACUTE]
-"\u1E08" => "C"
-
-# \u24b8 [CIRCLED LATIN CAPITAL LETTER C]
-"\u24B8" => "C"
-
-# \uff23 [FULLWIDTH LATIN CAPITAL LETTER C]
-"\uFF23" => "C"
-
-# � [LATIN SMALL LETTER C WITH CEDILLA]
-"\u00E7" => "c"
-
-# \u0107 [LATIN SMALL LETTER C WITH ACUTE]
-"\u0107" => "c"
-
-# \u0109 [LATIN SMALL LETTER C WITH CIRCUMFLEX]
-"\u0109" => "c"
-
-# \u010b [LATIN SMALL LETTER C WITH DOT ABOVE]
-"\u010B" => "c"
-
-# \u010d [LATIN SMALL LETTER C WITH CARON]
-"\u010D" => "c"
-
-# \u0188 [LATIN SMALL LETTER C WITH HOOK]
-"\u0188" => "c"
-
-# \u023c [LATIN SMALL LETTER C WITH STROKE]
-"\u023C" => "c"
-
-# \u0255 [LATIN SMALL LETTER C WITH CURL]
-"\u0255" => "c"
-
-# \u1e09 [LATIN SMALL LETTER C WITH CEDILLA AND ACUTE]
-"\u1E09" => "c"
-
-# \u2184 [LATIN SMALL LETTER REVERSED C]
-"\u2184" => "c"
-
-# \u24d2 [CIRCLED LATIN SMALL LETTER C]
-"\u24D2" => "c"
-
-# \ua73e [LATIN CAPITAL LETTER REVERSED C WITH DOT]
-"\uA73E" => "c"
-
-# \ua73f [LATIN SMALL LETTER REVERSED C WITH DOT]
-"\uA73F" => "c"
-
-# \uff43 [FULLWIDTH LATIN SMALL LETTER C]
-"\uFF43" => "c"
-
-# \u249e [PARENTHESIZED LATIN SMALL LETTER C]
-"\u249E" => "(c)"
-
-# � [LATIN CAPITAL LETTER ETH]
-"\u00D0" => "D"
-
-# \u010e [LATIN CAPITAL LETTER D WITH CARON]
-"\u010E" => "D"
-
-# \u0110 [LATIN CAPITAL LETTER D WITH STROKE]
-"\u0110" => "D"
-
-# \u0189 [LATIN CAPITAL LETTER AFRICAN D]
-"\u0189" => "D"
-
-# \u018a [LATIN CAPITAL LETTER D WITH HOOK]
-"\u018A" => "D"
-
-# \u018b [LATIN CAPITAL LETTER D WITH TOPBAR]
-"\u018B" => "D"
-
-# \u1d05 [LATIN LETTER SMALL CAPITAL D]
-"\u1D05" => "D"
-
-# \u1d06 [LATIN LETTER SMALL CAPITAL ETH]
-"\u1D06" => "D"
-
-# \u1e0a [LATIN CAPITAL LETTER D WITH DOT ABOVE]
-"\u1E0A" => "D"
-
-# \u1e0c [LATIN CAPITAL LETTER D WITH DOT BELOW]
-"\u1E0C" => "D"
-
-# \u1e0e [LATIN CAPITAL LETTER D WITH LINE BELOW]
-"\u1E0E" => "D"
-
-# \u1e10 [LATIN CAPITAL LETTER D WITH CEDILLA]
-"\u1E10" => "D"
-
-# \u1e12 [LATIN CAPITAL LETTER D WITH CIRCUMFLEX BELOW]
-"\u1E12" => "D"
-
-# \u24b9 [CIRCLED LATIN CAPITAL LETTER D]
-"\u24B9" => "D"
-
-# \ua779 [LATIN CAPITAL LETTER INSULAR D]
-"\uA779" => "D"
-
-# \uff24 [FULLWIDTH LATIN CAPITAL LETTER D]
-"\uFF24" => "D"
-
-# � [LATIN SMALL LETTER ETH]
-"\u00F0" => "d"
-
-# \u010f [LATIN SMALL LETTER D WITH CARON]
-"\u010F" => "d"
-
-# \u0111 [LATIN SMALL LETTER D WITH STROKE]
-"\u0111" => "d"
-
-# \u018c [LATIN SMALL LETTER D WITH TOPBAR]
-"\u018C" => "d"
-
-# \u0221 [LATIN SMALL LETTER D WITH CURL]
-"\u0221" => "d"
-
-# \u0256 [LATIN SMALL LETTER D WITH TAIL]
-"\u0256" => "d"
-
-# \u0257 [LATIN SMALL LETTER D WITH HOOK]
-"\u0257" => "d"
-
-# \u1d6d [LATIN SMALL LETTER D WITH MIDDLE TILDE]
-"\u1D6D" => "d"
-
-# \u1d81 [LATIN SMALL LETTER D WITH PALATAL HOOK]
-"\u1D81" => "d"
-
-# \u1d91 [LATIN SMALL LETTER D WITH HOOK AND TAIL]
-"\u1D91" => "d"
-
-# \u1e0b [LATIN SMALL LETTER D WITH DOT ABOVE]
-"\u1E0B" => "d"
-
-# \u1e0d [LATIN SMALL LETTER D WITH DOT BELOW]
-"\u1E0D" => "d"
-
-# \u1e0f [LATIN SMALL LETTER D WITH LINE BELOW]
-"\u1E0F" => "d"
-
-# \u1e11 [LATIN SMALL LETTER D WITH CEDILLA]
-"\u1E11" => "d"
-
-# \u1e13 [LATIN SMALL LETTER D WITH CIRCUMFLEX BELOW]
-"\u1E13" => "d"
-
-# \u24d3 [CIRCLED LATIN SMALL LETTER D]
-"\u24D3" => "d"
-
-# \ua77a [LATIN SMALL LETTER INSULAR D]
-"\uA77A" => "d"
-
-# \uff44 [FULLWIDTH LATIN SMALL LETTER D]
-"\uFF44" => "d"
-
-# \u01c4 [LATIN CAPITAL LETTER DZ WITH CARON]
-"\u01C4" => "DZ"
-
-# \u01f1 [LATIN CAPITAL LETTER DZ]
-"\u01F1" => "DZ"
-
-# \u01c5 [LATIN CAPITAL LETTER D WITH SMALL LETTER Z WITH CARON]
-"\u01C5" => "Dz"
-
-# \u01f2 [LATIN CAPITAL LETTER D WITH SMALL LETTER Z]
-"\u01F2" => "Dz"
-
-# \u249f [PARENTHESIZED LATIN SMALL LETTER D]
-"\u249F" => "(d)"
-
-# \u0238 [LATIN SMALL LETTER DB DIGRAPH]
-"\u0238" => "db"
-
-# \u01c6 [LATIN SMALL LETTER DZ WITH CARON]
-"\u01C6" => "dz"
-
-# \u01f3 [LATIN SMALL LETTER DZ]
-"\u01F3" => "dz"
-
-# \u02a3 [LATIN SMALL LETTER DZ DIGRAPH]
-"\u02A3" => "dz"
-
-# \u02a5 [LATIN SMALL LETTER DZ DIGRAPH WITH CURL]
-"\u02A5" => "dz"
-
-# � [LATIN CAPITAL LETTER E WITH GRAVE]
-"\u00C8" => "E"
-
-# � [LATIN CAPITAL LETTER E WITH ACUTE]
-"\u00C9" => "E"
-
-# � [LATIN CAPITAL LETTER E WITH CIRCUMFLEX]
-"\u00CA" => "E"
-
-# � [LATIN CAPITAL LETTER E WITH DIAERESIS]
-"\u00CB" => "E"
-
-# \u0112 [LATIN CAPITAL LETTER E WITH MACRON]
-"\u0112" => "E"
-
-# \u0114 [LATIN CAPITAL LETTER E WITH BREVE]
-"\u0114" => "E"
-
-# \u0116 [LATIN CAPITAL LETTER E WITH DOT ABOVE]
-"\u0116" => "E"
-
-# \u0118 [LATIN CAPITAL LETTER E WITH OGONEK]
-"\u0118" => "E"
-
-# \u011a [LATIN CAPITAL LETTER E WITH CARON]
-"\u011A" => "E"
-
-# \u018e [LATIN CAPITAL LETTER REVERSED E]
-"\u018E" => "E"
-
-# \u0190 [LATIN CAPITAL LETTER OPEN E]
-"\u0190" => "E"
-
-# \u0204 [LATIN CAPITAL LETTER E WITH DOUBLE GRAVE]
-"\u0204" => "E"
-
-# \u0206 [LATIN CAPITAL LETTER E WITH INVERTED BREVE]
-"\u0206" => "E"
-
-# \u0228 [LATIN CAPITAL LETTER E WITH CEDILLA]
-"\u0228" => "E"
-
-# \u0246 [LATIN CAPITAL LETTER E WITH STROKE]
-"\u0246" => "E"
-
-# \u1d07 [LATIN LETTER SMALL CAPITAL E]
-"\u1D07" => "E"
-
-# \u1e14 [LATIN CAPITAL LETTER E WITH MACRON AND GRAVE]
-"\u1E14" => "E"
-
-# \u1e16 [LATIN CAPITAL LETTER E WITH MACRON AND ACUTE]
-"\u1E16" => "E"
-
-# \u1e18 [LATIN CAPITAL LETTER E WITH CIRCUMFLEX BELOW]
-"\u1E18" => "E"
-
-# \u1e1a [LATIN CAPITAL LETTER E WITH TILDE BELOW]
-"\u1E1A" => "E"
-
-# \u1e1c [LATIN CAPITAL LETTER E WITH CEDILLA AND BREVE]
-"\u1E1C" => "E"
-
-# \u1eb8 [LATIN CAPITAL LETTER E WITH DOT BELOW]
-"\u1EB8" => "E"
-
-# \u1eba [LATIN CAPITAL LETTER E WITH HOOK ABOVE]
-"\u1EBA" => "E"
-
-# \u1ebc [LATIN CAPITAL LETTER E WITH TILDE]
-"\u1EBC" => "E"
-
-# \u1ebe [LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND ACUTE]
-"\u1EBE" => "E"
-
-# \u1ec0 [LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND GRAVE]
-"\u1EC0" => "E"
-
-# \u1ec2 [LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND HOOK ABOVE]
-"\u1EC2" => "E"
-
-# \u1ec4 [LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND TILDE]
-"\u1EC4" => "E"
-
-# \u1ec6 [LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND DOT BELOW]
-"\u1EC6" => "E"
-
-# \u24ba [CIRCLED LATIN CAPITAL LETTER E]
-"\u24BA" => "E"
-
-# \u2c7b [LATIN LETTER SMALL CAPITAL TURNED E]
-"\u2C7B" => "E"
-
-# \uff25 [FULLWIDTH LATIN CAPITAL LETTER E]
-"\uFF25" => "E"
-
-# � [LATIN SMALL LETTER E WITH GRAVE]
-"\u00E8" => "e"
-
-# � [LATIN SMALL LETTER E WITH ACUTE]
-"\u00E9" => "e"
-
-# � [LATIN SMALL LETTER E WITH CIRCUMFLEX]
-"\u00EA" => "e"
-
-# � [LATIN SMALL LETTER E WITH DIAERESIS]
-"\u00EB" => "e"
-
-# \u0113 [LATIN SMALL LETTER E WITH MACRON]
-"\u0113" => "e"
-
-# \u0115 [LATIN SMALL LETTER E WITH BREVE]
-"\u0115" => "e"
-
-# \u0117 [LATIN SMALL LETTER E WITH DOT ABOVE]
-"\u0117" => "e"
-
-# \u0119 [LATIN SMALL LETTER E WITH OGONEK]
-"\u0119" => "e"
-
-# \u011b [LATIN SMALL LETTER E WITH CARON]
-"\u011B" => "e"
-
-# \u01dd [LATIN SMALL LETTER TURNED E]
-"\u01DD" => "e"
-
-# \u0205 [LATIN SMALL LETTER E WITH DOUBLE GRAVE]
-"\u0205" => "e"
-
-# \u0207 [LATIN SMALL LETTER E WITH INVERTED BREVE]
-"\u0207" => "e"
-
-# \u0229 [LATIN SMALL LETTER E WITH CEDILLA]
-"\u0229" => "e"
-
-# \u0247 [LATIN SMALL LETTER E WITH STROKE]
-"\u0247" => "e"
-
-# \u0258 [LATIN SMALL LETTER REVERSED E]
-"\u0258" => "e"
-
-# \u025b [LATIN SMALL LETTER OPEN E]
-"\u025B" => "e"
-
-# \u025c [LATIN SMALL LETTER REVERSED OPEN E]
-"\u025C" => "e"
-
-# \u025d [LATIN SMALL LETTER REVERSED OPEN E WITH HOOK]
-"\u025D" => "e"
-
-# \u025e [LATIN SMALL LETTER CLOSED REVERSED OPEN E]
-"\u025E" => "e"
-
-# \u029a [LATIN SMALL LETTER CLOSED OPEN E]
-"\u029A" => "e"
-
-# \u1d08 [LATIN SMALL LETTER TURNED OPEN E]
-"\u1D08" => "e"
-
-# \u1d92 [LATIN SMALL LETTER E WITH RETROFLEX HOOK]
-"\u1D92" => "e"
-
-# \u1d93 [LATIN SMALL LETTER OPEN E WITH RETROFLEX HOOK]
-"\u1D93" => "e"
-
-# \u1d94 [LATIN SMALL LETTER REVERSED OPEN E WITH RETROFLEX HOOK]
-"\u1D94" => "e"
-
-# \u1e15 [LATIN SMALL LETTER E WITH MACRON AND GRAVE]
-"\u1E15" => "e"
-
-# \u1e17 [LATIN SMALL LETTER E WITH MACRON AND ACUTE]
-"\u1E17" => "e"
-
-# \u1e19 [LATIN SMALL LETTER E WITH CIRCUMFLEX BELOW]
-"\u1E19" => "e"
-
-# \u1e1b [LATIN SMALL LETTER E WITH TILDE BELOW]
-"\u1E1B" => "e"
-
-# \u1e1d [LATIN SMALL LETTER E WITH CEDILLA AND BREVE]
-"\u1E1D" => "e"
-
-# \u1eb9 [LATIN SMALL LETTER E WITH DOT BELOW]
-"\u1EB9" => "e"
-
-# \u1ebb [LATIN SMALL LETTER E WITH HOOK ABOVE]
-"\u1EBB" => "e"
-
-# \u1ebd [LATIN SMALL LETTER E WITH TILDE]
-"\u1EBD" => "e"
-
-# \u1ebf [LATIN SMALL LETTER E WITH CIRCUMFLEX AND ACUTE]
-"\u1EBF" => "e"
-
-# \u1ec1 [LATIN SMALL LETTER E WITH CIRCUMFLEX AND GRAVE]
-"\u1EC1" => "e"
-
-# \u1ec3 [LATIN SMALL LETTER E WITH CIRCUMFLEX AND HOOK ABOVE]
-"\u1EC3" => "e"
-
-# \u1ec5 [LATIN SMALL LETTER E WITH CIRCUMFLEX AND TILDE]
-"\u1EC5" => "e"
-
-# \u1ec7 [LATIN SMALL LETTER E WITH CIRCUMFLEX AND DOT BELOW]
-"\u1EC7" => "e"
-
-# \u2091 [LATIN SUBSCRIPT SMALL LETTER E]
-"\u2091" => "e"
-
-# \u24d4 [CIRCLED LATIN SMALL LETTER E]
-"\u24D4" => "e"
-
-# \u2c78 [LATIN SMALL LETTER E WITH NOTCH]
-"\u2C78" => "e"
-
-# \uff45 [FULLWIDTH LATIN SMALL LETTER E]
-"\uFF45" => "e"
-
-# \u24a0 [PARENTHESIZED LATIN SMALL LETTER E]
-"\u24A0" => "(e)"
-
-# \u0191 [LATIN CAPITAL LETTER F WITH HOOK]
-"\u0191" => "F"
-
-# \u1e1e [LATIN CAPITAL LETTER F WITH DOT ABOVE]
-"\u1E1E" => "F"
-
-# \u24bb [CIRCLED LATIN CAPITAL LETTER F]
-"\u24BB" => "F"
-
-# \ua730 [LATIN LETTER SMALL CAPITAL F]
-"\uA730" => "F"
-
-# \ua77b [LATIN CAPITAL LETTER INSULAR F]
-"\uA77B" => "F"
-
-# \ua7fb [LATIN EPIGRAPHIC LETTER REVERSED F]
-"\uA7FB" => "F"
-
-# \uff26 [FULLWIDTH LATIN CAPITAL LETTER F]
-"\uFF26" => "F"
-
-# \u0192 [LATIN SMALL LETTER F WITH HOOK]
-"\u0192" => "f"
-
-# \u1d6e [LATIN SMALL LETTER F WITH MIDDLE TILDE]
-"\u1D6E" => "f"
-
-# \u1d82 [LATIN SMALL LETTER F WITH PALATAL HOOK]
-"\u1D82" => "f"
-
-# \u1e1f [LATIN SMALL LETTER F WITH DOT ABOVE]
-"\u1E1F" => "f"
-
-# \u1e9b [LATIN SMALL LETTER LONG S WITH DOT ABOVE]
-"\u1E9B" => "f"
-
-# \u24d5 [CIRCLED LATIN SMALL LETTER F]
-"\u24D5" => "f"
-
-# \ua77c [LATIN SMALL LETTER INSULAR F]
-"\uA77C" => "f"
-
-# \uff46 [FULLWIDTH LATIN SMALL LETTER F]
-"\uFF46" => "f"
-
-# \u24a1 [PARENTHESIZED LATIN SMALL LETTER F]
-"\u24A1" => "(f)"
-
-# \ufb00 [LATIN SMALL LIGATURE FF]
-"\uFB00" => "ff"
-
-# \ufb03 [LATIN SMALL LIGATURE FFI]
-"\uFB03" => "ffi"
-
-# \ufb04 [LATIN SMALL LIGATURE FFL]
-"\uFB04" => "ffl"
-
-# \ufb01 [LATIN SMALL LIGATURE FI]
-"\uFB01" => "fi"
-
-# \ufb02 [LATIN SMALL LIGATURE FL]
-"\uFB02" => "fl"
-
-# \u011c [LATIN CAPITAL LETTER G WITH CIRCUMFLEX]
-"\u011C" => "G"
-
-# \u011e [LATIN CAPITAL LETTER G WITH BREVE]
-"\u011E" => "G"
-
-# \u0120 [LATIN CAPITAL LETTER G WITH DOT ABOVE]
-"\u0120" => "G"
-
-# \u0122 [LATIN CAPITAL LETTER G WITH CEDILLA]
-"\u0122" => "G"
-
-# \u0193 [LATIN CAPITAL LETTER G WITH HOOK]
-"\u0193" => "G"
-
-# \u01e4 [LATIN CAPITAL LETTER G WITH STROKE]
-"\u01E4" => "G"
-
-# \u01e5 [LATIN SMALL LETTER G WITH STROKE]
-"\u01E5" => "G"
-
-# \u01e6 [LATIN CAPITAL LETTER G WITH CARON]
-"\u01E6" => "G"
-
-# \u01e7 [LATIN SMALL LETTER G WITH CARON]
-"\u01E7" => "G"
-
-# \u01f4 [LATIN CAPITAL LETTER G WITH ACUTE]
-"\u01F4" => "G"
-
-# \u0262 [LATIN LETTER SMALL CAPITAL G]
-"\u0262" => "G"
-
-# \u029b [LATIN LETTER SMALL CAPITAL G WITH HOOK]
-"\u029B" => "G"
-
-# \u1e20 [LATIN CAPITAL LETTER G WITH MACRON]
-"\u1E20" => "G"
-
-# \u24bc [CIRCLED LATIN CAPITAL LETTER G]
-"\u24BC" => "G"
-
-# \ua77d [LATIN CAPITAL LETTER INSULAR G]
-"\uA77D" => "G"
-
-# \ua77e [LATIN CAPITAL LETTER TURNED INSULAR G]
-"\uA77E" => "G"
-
-# \uff27 [FULLWIDTH LATIN CAPITAL LETTER G]
-"\uFF27" => "G"
-
-# \u011d [LATIN SMALL LETTER G WITH CIRCUMFLEX]
-"\u011D" => "g"
-
-# \u011f [LATIN SMALL LETTER G WITH BREVE]
-"\u011F" => "g"
-
-# \u0121 [LATIN SMALL LETTER G WITH DOT ABOVE]
-"\u0121" => "g"
-
-# \u0123 [LATIN SMALL LETTER G WITH CEDILLA]
-"\u0123" => "g"
-
-# \u01f5 [LATIN SMALL LETTER G WITH ACUTE]
-"\u01F5" => "g"
-
-# \u0260 [LATIN SMALL LETTER G WITH HOOK]
-"\u0260" => "g"
-
-# \u0261 [LATIN SMALL LETTER SCRIPT G]
-"\u0261" => "g"
-
-# \u1d77 [LATIN SMALL LETTER TURNED G]
-"\u1D77" => "g"
-
-# \u1d79 [LATIN SMALL LETTER INSULAR G]
-"\u1D79" => "g"
-
-# \u1d83 [LATIN SMALL LETTER G WITH PALATAL HOOK]
-"\u1D83" => "g"
-
-# \u1e21 [LATIN SMALL LETTER G WITH MACRON]
-"\u1E21" => "g"
-
-# \u24d6 [CIRCLED LATIN SMALL LETTER G]
-"\u24D6" => "g"
-
-# \ua77f [LATIN SMALL LETTER TURNED INSULAR G]
-"\uA77F" => "g"
-
-# \uff47 [FULLWIDTH LATIN SMALL LETTER G]
-"\uFF47" => "g"
-
-# \u24a2 [PARENTHESIZED LATIN SMALL LETTER G]
-"\u24A2" => "(g)"
-
-# \u0124 [LATIN CAPITAL LETTER H WITH CIRCUMFLEX]
-"\u0124" => "H"
-
-# \u0126 [LATIN CAPITAL LETTER H WITH STROKE]
-"\u0126" => "H"
-
-# \u021e [LATIN CAPITAL LETTER H WITH CARON]
-"\u021E" => "H"
-
-# \u029c [LATIN LETTER SMALL CAPITAL H]
-"\u029C" => "H"
-
-# \u1e22 [LATIN CAPITAL LETTER H WITH DOT ABOVE]
-"\u1E22" => "H"
-
-# \u1e24 [LATIN CAPITAL LETTER H WITH DOT BELOW]
-"\u1E24" => "H"
-
-# \u1e26 [LATIN CAPITAL LETTER H WITH DIAERESIS]
-"\u1E26" => "H"
-
-# \u1e28 [LATIN CAPITAL LETTER H WITH CEDILLA]
-"\u1E28" => "H"
-
-# \u1e2a [LATIN CAPITAL LETTER H WITH BREVE BELOW]
-"\u1E2A" => "H"
-
-# \u24bd [CIRCLED LATIN CAPITAL LETTER H]
-"\u24BD" => "H"
-
-# \u2c67 [LATIN CAPITAL LETTER H WITH DESCENDER]
-"\u2C67" => "H"
-
-# \u2c75 [LATIN CAPITAL LETTER HALF H]
-"\u2C75" => "H"
-
-# \uff28 [FULLWIDTH LATIN CAPITAL LETTER H]
-"\uFF28" => "H"
-
-# \u0125 [LATIN SMALL LETTER H WITH CIRCUMFLEX]
-"\u0125" => "h"
-
-# \u0127 [LATIN SMALL LETTER H WITH STROKE]
-"\u0127" => "h"
-
-# \u021f [LATIN SMALL LETTER H WITH CARON]
-"\u021F" => "h"
-
-# \u0265 [LATIN SMALL LETTER TURNED H]
-"\u0265" => "h"
-
-# \u0266 [LATIN SMALL LETTER H WITH HOOK]
-"\u0266" => "h"
-
-# \u02ae [LATIN SMALL LETTER TURNED H WITH FISHHOOK]
-"\u02AE" => "h"
-
-# \u02af [LATIN SMALL LETTER TURNED H WITH FISHHOOK AND TAIL]
-"\u02AF" => "h"
-
-# \u1e23 [LATIN SMALL LETTER H WITH DOT ABOVE]
-"\u1E23" => "h"
-
-# \u1e25 [LATIN SMALL LETTER H WITH DOT BELOW]
-"\u1E25" => "h"
-
-# \u1e27 [LATIN SMALL LETTER H WITH DIAERESIS]
-"\u1E27" => "h"
-
-# \u1e29 [LATIN SMALL LETTER H WITH CEDILLA]
-"\u1E29" => "h"
-
-# \u1e2b [LATIN SMALL LETTER H WITH BREVE BELOW]
-"\u1E2B" => "h"
-
-# \u1e96 [LATIN SMALL LETTER H WITH LINE BELOW]
-"\u1E96" => "h"
-
-# \u24d7 [CIRCLED LATIN SMALL LETTER H]
-"\u24D7" => "h"
-
-# \u2c68 [LATIN SMALL LETTER H WITH DESCENDER]
-"\u2C68" => "h"
-
-# \u2c76 [LATIN SMALL LETTER HALF H]
-"\u2C76" => "h"
-
-# \uff48 [FULLWIDTH LATIN SMALL LETTER H]
-"\uFF48" => "h"
-
-# \u01f6 http://en.wikipedia.org/wiki/Hwair [LATIN CAPITAL LETTER HWAIR]
-"\u01F6" => "HV"
-
-# \u24a3 [PARENTHESIZED LATIN SMALL LETTER H]
-"\u24A3" => "(h)"
-
-# \u0195 [LATIN SMALL LETTER HV]
-"\u0195" => "hv"
-
-# � [LATIN CAPITAL LETTER I WITH GRAVE]
-"\u00CC" => "I"
-
-# � [LATIN CAPITAL LETTER I WITH ACUTE]
-"\u00CD" => "I"
-
-# � [LATIN CAPITAL LETTER I WITH CIRCUMFLEX]
-"\u00CE" => "I"
-
-# � [LATIN CAPITAL LETTER I WITH DIAERESIS]
-"\u00CF" => "I"
-
-# \u0128 [LATIN CAPITAL LETTER I WITH TILDE]
-"\u0128" => "I"
-
-# \u012a [LATIN CAPITAL LETTER I WITH MACRON]
-"\u012A" => "I"
-
-# \u012c [LATIN CAPITAL LETTER I WITH BREVE]
-"\u012C" => "I"
-
-# \u012e [LATIN CAPITAL LETTER I WITH OGONEK]
-"\u012E" => "I"
-
-# \u0130 [LATIN CAPITAL LETTER I WITH DOT ABOVE]
-"\u0130" => "I"
-
-# \u0196 [LATIN CAPITAL LETTER IOTA]
-"\u0196" => "I"
-
-# \u0197 [LATIN CAPITAL LETTER I WITH STROKE]
-"\u0197" => "I"
-
-# \u01cf [LATIN CAPITAL LETTER I WITH CARON]
-"\u01CF" => "I"
-
-# \u0208 [LATIN CAPITAL LETTER I WITH DOUBLE GRAVE]
-"\u0208" => "I"
-
-# \u020a [LATIN CAPITAL LETTER I WITH INVERTED BREVE]
-"\u020A" => "I"
-
-# \u026a [LATIN LETTER SMALL CAPITAL I]
-"\u026A" => "I"
-
-# \u1d7b [LATIN SMALL CAPITAL LETTER I WITH STROKE]
-"\u1D7B" => "I"
-
-# \u1e2c [LATIN CAPITAL LETTER I WITH TILDE BELOW]
-"\u1E2C" => "I"
-
-# \u1e2e [LATIN CAPITAL LETTER I WITH DIAERESIS AND ACUTE]
-"\u1E2E" => "I"
-
-# \u1ec8 [LATIN CAPITAL LETTER I WITH HOOK ABOVE]
-"\u1EC8" => "I"
-
-# \u1eca [LATIN CAPITAL LETTER I WITH DOT BELOW]
-"\u1ECA" => "I"
-
-# \u24be [CIRCLED LATIN CAPITAL LETTER I]
-"\u24BE" => "I"
-
-# \ua7fe [LATIN EPIGRAPHIC LETTER I LONGA]
-"\uA7FE" => "I"
-
-# \uff29 [FULLWIDTH LATIN CAPITAL LETTER I]
-"\uFF29" => "I"
-
-# � [LATIN SMALL LETTER I WITH GRAVE]
-"\u00EC" => "i"
-
-# � [LATIN SMALL LETTER I WITH ACUTE]
-"\u00ED" => "i"
-
-# � [LATIN SMALL LETTER I WITH CIRCUMFLEX]
-"\u00EE" => "i"
-
-# � [LATIN SMALL LETTER I WITH DIAERESIS]
-"\u00EF" => "i"
-
-# \u0129 [LATIN SMALL LETTER I WITH TILDE]
-"\u0129" => "i"
-
-# \u012b [LATIN SMALL LETTER I WITH MACRON]
-"\u012B" => "i"
-
-# \u012d [LATIN SMALL LETTER I WITH BREVE]
-"\u012D" => "i"
-
-# \u012f [LATIN SMALL LETTER I WITH OGONEK]
-"\u012F" => "i"
-
-# \u0131 [LATIN SMALL LETTER DOTLESS I]
-"\u0131" => "i"
-
-# \u01d0 [LATIN SMALL LETTER I WITH CARON]
-"\u01D0" => "i"
-
-# \u0209 [LATIN SMALL LETTER I WITH DOUBLE GRAVE]
-"\u0209" => "i"
-
-# \u020b [LATIN SMALL LETTER I WITH INVERTED BREVE]
-"\u020B" => "i"
-
-# \u0268 [LATIN SMALL LETTER I WITH STROKE]
-"\u0268" => "i"
-
-# \u1d09 [LATIN SMALL LETTER TURNED I]
-"\u1D09" => "i"
-
-# \u1d62 [LATIN SUBSCRIPT SMALL LETTER I]
-"\u1D62" => "i"
-
-# \u1d7c [LATIN SMALL LETTER IOTA WITH STROKE]
-"\u1D7C" => "i"
-
-# \u1d96 [LATIN SMALL LETTER I WITH RETROFLEX HOOK]
-"\u1D96" => "i"
-
-# \u1e2d [LATIN SMALL LETTER I WITH TILDE BELOW]
-"\u1E2D" => "i"
-
-# \u1e2f [LATIN SMALL LETTER I WITH DIAERESIS AND ACUTE]
-"\u1E2F" => "i"
-
-# \u1ec9 [LATIN SMALL LETTER I WITH HOOK ABOVE]
-"\u1EC9" => "i"
-
-# \u1ecb [LATIN SMALL LETTER I WITH DOT BELOW]
-"\u1ECB" => "i"
-
-# \u2071 [SUPERSCRIPT LATIN SMALL LETTER I]
-"\u2071" => "i"
-
-# \u24d8 [CIRCLED LATIN SMALL LETTER I]
-"\u24D8" => "i"
-
-# \uff49 [FULLWIDTH LATIN SMALL LETTER I]
-"\uFF49" => "i"
-
-# \u0132 [LATIN CAPITAL LIGATURE IJ]
-"\u0132" => "IJ"
-
-# \u24a4 [PARENTHESIZED LATIN SMALL LETTER I]
-"\u24A4" => "(i)"
-
-# \u0133 [LATIN SMALL LIGATURE IJ]
-"\u0133" => "ij"
-
-# \u0134 [LATIN CAPITAL LETTER J WITH CIRCUMFLEX]
-"\u0134" => "J"
-
-# \u0248 [LATIN CAPITAL LETTER J WITH STROKE]
-"\u0248" => "J"
-
-# \u1d0a [LATIN LETTER SMALL CAPITAL J]
-"\u1D0A" => "J"
-
-# \u24bf [CIRCLED LATIN CAPITAL LETTER J]
-"\u24BF" => "J"
-
-# \uff2a [FULLWIDTH LATIN CAPITAL LETTER J]
-"\uFF2A" => "J"
-
-# \u0135 [LATIN SMALL LETTER J WITH CIRCUMFLEX]
-"\u0135" => "j"
-
-# \u01f0 [LATIN SMALL LETTER J WITH CARON]
-"\u01F0" => "j"
-
-# \u0237 [LATIN SMALL LETTER DOTLESS J]
-"\u0237" => "j"
-
-# \u0249 [LATIN SMALL LETTER J WITH STROKE]
-"\u0249" => "j"
-
-# \u025f [LATIN SMALL LETTER DOTLESS J WITH STROKE]
-"\u025F" => "j"
-
-# \u0284 [LATIN SMALL LETTER DOTLESS J WITH STROKE AND HOOK]
-"\u0284" => "j"
-
-# \u029d [LATIN SMALL LETTER J WITH CROSSED-TAIL]
-"\u029D" => "j"
-
-# \u24d9 [CIRCLED LATIN SMALL LETTER J]
-"\u24D9" => "j"
-
-# \u2c7c [LATIN SUBSCRIPT SMALL LETTER J]
-"\u2C7C" => "j"
-
-# \uff4a [FULLWIDTH LATIN SMALL LETTER J]
-"\uFF4A" => "j"
-
-# \u24a5 [PARENTHESIZED LATIN SMALL LETTER J]
-"\u24A5" => "(j)"
-
-# \u0136 [LATIN CAPITAL LETTER K WITH CEDILLA]
-"\u0136" => "K"
-
-# \u0198 [LATIN CAPITAL LETTER K WITH HOOK]
-"\u0198" => "K"
-
-# \u01e8 [LATIN CAPITAL LETTER K WITH CARON]
-"\u01E8" => "K"
-
-# \u1d0b [LATIN LETTER SMALL CAPITAL K]
-"\u1D0B" => "K"
-
-# \u1e30 [LATIN CAPITAL LETTER K WITH ACUTE]
-"\u1E30" => "K"
-
-# \u1e32 [LATIN CAPITAL LETTER K WITH DOT BELOW]
-"\u1E32" => "K"
-
-# \u1e34 [LATIN CAPITAL LETTER K WITH LINE BELOW]
-"\u1E34" => "K"
-
-# \u24c0 [CIRCLED LATIN CAPITAL LETTER K]
-"\u24C0" => "K"
-
-# \u2c69 [LATIN CAPITAL LETTER K WITH DESCENDER]
-"\u2C69" => "K"
-
-# \ua740 [LATIN CAPITAL LETTER K WITH STROKE]
-"\uA740" => "K"
-
-# \ua742 [LATIN CAPITAL LETTER K WITH DIAGONAL STROKE]
-"\uA742" => "K"
-
-# \ua744 [LATIN CAPITAL LETTER K WITH STROKE AND DIAGONAL STROKE]
-"\uA744" => "K"
-
-# \uff2b [FULLWIDTH LATIN CAPITAL LETTER K]
-"\uFF2B" => "K"
-
-# \u0137 [LATIN SMALL LETTER K WITH CEDILLA]
-"\u0137" => "k"
-
-# \u0199 [LATIN SMALL LETTER K WITH HOOK]
-"\u0199" => "k"
-
-# \u01e9 [LATIN SMALL LETTER K WITH CARON]
-"\u01E9" => "k"
-
-# \u029e [LATIN SMALL LETTER TURNED K]
-"\u029E" => "k"
-
-# \u1d84 [LATIN SMALL LETTER K WITH PALATAL HOOK]
-"\u1D84" => "k"
-
-# \u1e31 [LATIN SMALL LETTER K WITH ACUTE]
-"\u1E31" => "k"
-
-# \u1e33 [LATIN SMALL LETTER K WITH DOT BELOW]
-"\u1E33" => "k"
-
-# \u1e35 [LATIN SMALL LETTER K WITH LINE BELOW]
-"\u1E35" => "k"
-
-# \u24da [CIRCLED LATIN SMALL LETTER K]
-"\u24DA" => "k"
-
-# \u2c6a [LATIN SMALL LETTER K WITH DESCENDER]
-"\u2C6A" => "k"
-
-# \ua741 [LATIN SMALL LETTER K WITH STROKE]
-"\uA741" => "k"
-
-# \ua743 [LATIN SMALL LETTER K WITH DIAGONAL STROKE]
-"\uA743" => "k"
-
-# \ua745 [LATIN SMALL LETTER K WITH STROKE AND DIAGONAL STROKE]
-"\uA745" => "k"
-
-# \uff4b [FULLWIDTH LATIN SMALL LETTER K]
-"\uFF4B" => "k"
-
-# \u24a6 [PARENTHESIZED LATIN SMALL LETTER K]
-"\u24A6" => "(k)"
-
-# \u0139 [LATIN CAPITAL LETTER L WITH ACUTE]
-"\u0139" => "L"
-
-# \u013b [LATIN CAPITAL LETTER L WITH CEDILLA]
-"\u013B" => "L"
-
-# \u013d [LATIN CAPITAL LETTER L WITH CARON]
-"\u013D" => "L"
-
-# \u013f [LATIN CAPITAL LETTER L WITH MIDDLE DOT]
-"\u013F" => "L"
-
-# \u0141 [LATIN CAPITAL LETTER L WITH STROKE]
-"\u0141" => "L"
-
-# \u023d [LATIN CAPITAL LETTER L WITH BAR]
-"\u023D" => "L"
-
-# \u029f [LATIN LETTER SMALL CAPITAL L]
-"\u029F" => "L"
-
-# \u1d0c [LATIN LETTER SMALL CAPITAL L WITH STROKE]
-"\u1D0C" => "L"
-
-# \u1e36 [LATIN CAPITAL LETTER L WITH DOT BELOW]
-"\u1E36" => "L"
-
-# \u1e38 [LATIN CAPITAL LETTER L WITH DOT BELOW AND MACRON]
-"\u1E38" => "L"
-
-# \u1e3a [LATIN CAPITAL LETTER L WITH LINE BELOW]
-"\u1E3A" => "L"
-
-# \u1e3c [LATIN CAPITAL LETTER L WITH CIRCUMFLEX BELOW]
-"\u1E3C" => "L"
-
-# \u24c1 [CIRCLED LATIN CAPITAL LETTER L]
-"\u24C1" => "L"
-
-# \u2c60 [LATIN CAPITAL LETTER L WITH DOUBLE BAR]
-"\u2C60" => "L"
-
-# \u2c62 [LATIN CAPITAL LETTER L WITH MIDDLE TILDE]
-"\u2C62" => "L"
-
-# \ua746 [LATIN CAPITAL LETTER BROKEN L]
-"\uA746" => "L"
-
-# \ua748 [LATIN CAPITAL LETTER L WITH HIGH STROKE]
-"\uA748" => "L"
-
-# \ua780 [LATIN CAPITAL LETTER TURNED L]
-"\uA780" => "L"
-
-# \uff2c [FULLWIDTH LATIN CAPITAL LETTER L]
-"\uFF2C" => "L"
-
-# \u013a [LATIN SMALL LETTER L WITH ACUTE]
-"\u013A" => "l"
-
-# \u013c [LATIN SMALL LETTER L WITH CEDILLA]
-"\u013C" => "l"
-
-# \u013e [LATIN SMALL LETTER L WITH CARON]
-"\u013E" => "l"
-
-# \u0140 [LATIN SMALL LETTER L WITH MIDDLE DOT]
-"\u0140" => "l"
-
-# \u0142 [LATIN SMALL LETTER L WITH STROKE]
-"\u0142" => "l"
-
-# \u019a [LATIN SMALL LETTER L WITH BAR]
-"\u019A" => "l"
-
-# \u0234 [LATIN SMALL LETTER L WITH CURL]
-"\u0234" => "l"
-
-# \u026b [LATIN SMALL LETTER L WITH MIDDLE TILDE]
-"\u026B" => "l"
-
-# \u026c [LATIN SMALL LETTER L WITH BELT]
-"\u026C" => "l"
-
-# \u026d [LATIN SMALL LETTER L WITH RETROFLEX HOOK]
-"\u026D" => "l"
-
-# \u1d85 [LATIN SMALL LETTER L WITH PALATAL HOOK]
-"\u1D85" => "l"
-
-# \u1e37 [LATIN SMALL LETTER L WITH DOT BELOW]
-"\u1E37" => "l"
-
-# \u1e39 [LATIN SMALL LETTER L WITH DOT BELOW AND MACRON]
-"\u1E39" => "l"
-
-# \u1e3b [LATIN SMALL LETTER L WITH LINE BELOW]
-"\u1E3B" => "l"
-
-# \u1e3d [LATIN SMALL LETTER L WITH CIRCUMFLEX BELOW]
-"\u1E3D" => "l"
-
-# \u24db [CIRCLED LATIN SMALL LETTER L]
-"\u24DB" => "l"
-
-# \u2c61 [LATIN SMALL LETTER L WITH DOUBLE BAR]
-"\u2C61" => "l"
-
-# \ua747 [LATIN SMALL LETTER BROKEN L]
-"\uA747" => "l"
-
-# \ua749 [LATIN SMALL LETTER L WITH HIGH STROKE]
-"\uA749" => "l"
-
-# \ua781 [LATIN SMALL LETTER TURNED L]
-"\uA781" => "l"
-
-# \uff4c [FULLWIDTH LATIN SMALL LETTER L]
-"\uFF4C" => "l"
-
-# \u01c7 [LATIN CAPITAL LETTER LJ]
-"\u01C7" => "LJ"
-
-# \u1efa [LATIN CAPITAL LETTER MIDDLE-WELSH LL]
-"\u1EFA" => "LL"
-
-# \u01c8 [LATIN CAPITAL LETTER L WITH SMALL LETTER J]
-"\u01C8" => "Lj"
-
-# \u24a7 [PARENTHESIZED LATIN SMALL LETTER L]
-"\u24A7" => "(l)"
-
-# \u01c9 [LATIN SMALL LETTER LJ]
-"\u01C9" => "lj"
-
-# \u1efb [LATIN SMALL LETTER MIDDLE-WELSH LL]
-"\u1EFB" => "ll"
-
-# \u02aa [LATIN SMALL LETTER LS DIGRAPH]
-"\u02AA" => "ls"
-
-# \u02ab [LATIN SMALL LETTER LZ DIGRAPH]
-"\u02AB" => "lz"
-
-# \u019c [LATIN CAPITAL LETTER TURNED M]
-"\u019C" => "M"
-
-# \u1d0d [LATIN LETTER SMALL CAPITAL M]
-"\u1D0D" => "M"
-
-# \u1e3e [LATIN CAPITAL LETTER M WITH ACUTE]
-"\u1E3E" => "M"
-
-# \u1e40 [LATIN CAPITAL LETTER M WITH DOT ABOVE]
-"\u1E40" => "M"
-
-# \u1e42 [LATIN CAPITAL LETTER M WITH DOT BELOW]
-"\u1E42" => "M"
-
-# \u24c2 [CIRCLED LATIN CAPITAL LETTER M]
-"\u24C2" => "M"
-
-# \u2c6e [LATIN CAPITAL LETTER M WITH HOOK]
-"\u2C6E" => "M"
-
-# \ua7fd [LATIN EPIGRAPHIC LETTER INVERTED M]
-"\uA7FD" => "M"
-
-# \ua7ff [LATIN EPIGRAPHIC LETTER ARCHAIC M]
-"\uA7FF" => "M"
-
-# \uff2d [FULLWIDTH LATIN CAPITAL LETTER M]
-"\uFF2D" => "M"
-
-# \u026f [LATIN SMALL LETTER TURNED M]
-"\u026F" => "m"
-
-# \u0270 [LATIN SMALL LETTER TURNED M WITH LONG LEG]
-"\u0270" => "m"
-
-# \u0271 [LATIN SMALL LETTER M WITH HOOK]
-"\u0271" => "m"
-
-# \u1d6f [LATIN SMALL LETTER M WITH MIDDLE TILDE]
-"\u1D6F" => "m"
-
-# \u1d86 [LATIN SMALL LETTER M WITH PALATAL HOOK]
-"\u1D86" => "m"
-
-# \u1e3f [LATIN SMALL LETTER M WITH ACUTE]
-"\u1E3F" => "m"
-
-# \u1e41 [LATIN SMALL LETTER M WITH DOT ABOVE]
-"\u1E41" => "m"
-
-# \u1e43 [LATIN SMALL LETTER M WITH DOT BELOW]
-"\u1E43" => "m"
-
-# \u24dc [CIRCLED LATIN SMALL LETTER M]
-"\u24DC" => "m"
-
-# \uff4d [FULLWIDTH LATIN SMALL LETTER M]
-"\uFF4D" => "m"
-
-# \u24a8 [PARENTHESIZED LATIN SMALL LETTER M]
-"\u24A8" => "(m)"
-
-# � [LATIN CAPITAL LETTER N WITH TILDE]
-"\u00D1" => "N"
-
-# \u0143 [LATIN CAPITAL LETTER N WITH ACUTE]
-"\u0143" => "N"
-
-# \u0145 [LATIN CAPITAL LETTER N WITH CEDILLA]
-"\u0145" => "N"
-
-# \u0147 [LATIN CAPITAL LETTER N WITH CARON]
-"\u0147" => "N"
-
-# \u014a http://en.wikipedia.org/wiki/Eng_(letter) [LATIN CAPITAL LETTER ENG]
-"\u014A" => "N"
-
-# \u019d [LATIN CAPITAL LETTER N WITH LEFT HOOK]
-"\u019D" => "N"
-
-# \u01f8 [LATIN CAPITAL LETTER N WITH GRAVE]
-"\u01F8" => "N"
-
-# \u0220 [LATIN CAPITAL LETTER N WITH LONG RIGHT LEG]
-"\u0220" => "N"
-
-# \u0274 [LATIN LETTER SMALL CAPITAL N]
-"\u0274" => "N"
-
-# \u1d0e [LATIN LETTER SMALL CAPITAL REVERSED N]
-"\u1D0E" => "N"
-
-# \u1e44 [LATIN CAPITAL LETTER N WITH DOT ABOVE]
-"\u1E44" => "N"
-
-# \u1e46 [LATIN CAPITAL LETTER N WITH DOT BELOW]
-"\u1E46" => "N"
-
-# \u1e48 [LATIN CAPITAL LETTER N WITH LINE BELOW]
-"\u1E48" => "N"
-
-# \u1e4a [LATIN CAPITAL LETTER N WITH CIRCUMFLEX BELOW]
-"\u1E4A" => "N"
-
-# \u24c3 [CIRCLED LATIN CAPITAL LETTER N]
-"\u24C3" => "N"
-
-# \uff2e [FULLWIDTH LATIN CAPITAL LETTER N]
-"\uFF2E" => "N"
-
-# � [LATIN SMALL LETTER N WITH TILDE]
-"\u00F1" => "n"
-
-# \u0144 [LATIN SMALL LETTER N WITH ACUTE]
-"\u0144" => "n"
-
-# \u0146 [LATIN SMALL LETTER N WITH CEDILLA]
-"\u0146" => "n"
-
-# \u0148 [LATIN SMALL LETTER N WITH CARON]
-"\u0148" => "n"
-
-# \u0149 [LATIN SMALL LETTER N PRECEDED BY APOSTROPHE]
-"\u0149" => "n"
-
-# \u014b http://en.wikipedia.org/wiki/Eng_(letter) [LATIN SMALL LETTER ENG]
-"\u014B" => "n"
-
-# \u019e [LATIN SMALL LETTER N WITH LONG RIGHT LEG]
-"\u019E" => "n"
-
-# \u01f9 [LATIN SMALL LETTER N WITH GRAVE]
-"\u01F9" => "n"
-
-# \u0235 [LATIN SMALL LETTER N WITH CURL]
-"\u0235" => "n"
-
-# \u0272 [LATIN SMALL LETTER N WITH LEFT HOOK]
-"\u0272" => "n"
-
-# \u0273 [LATIN SMALL LETTER N WITH RETROFLEX HOOK]
-"\u0273" => "n"
-
-# \u1d70 [LATIN SMALL LETTER N WITH MIDDLE TILDE]
-"\u1D70" => "n"
-
-# \u1d87 [LATIN SMALL LETTER N WITH PALATAL HOOK]
-"\u1D87" => "n"
-
-# \u1e45 [LATIN SMALL LETTER N WITH DOT ABOVE]
-"\u1E45" => "n"
-
-# \u1e47 [LATIN SMALL LETTER N WITH DOT BELOW]
-"\u1E47" => "n"
-
-# \u1e49 [LATIN SMALL LETTER N WITH LINE BELOW]
-"\u1E49" => "n"
-
-# \u1e4b [LATIN SMALL LETTER N WITH CIRCUMFLEX BELOW]
-"\u1E4B" => "n"
-
-# \u207f [SUPERSCRIPT LATIN SMALL LETTER N]
-"\u207F" => "n"
-
-# \u24dd [CIRCLED LATIN SMALL LETTER N]
-"\u24DD" => "n"
-
-# \uff4e [FULLWIDTH LATIN SMALL LETTER N]
-"\uFF4E" => "n"
-
-# \u01ca [LATIN CAPITAL LETTER NJ]
-"\u01CA" => "NJ"
-
-# \u01cb [LATIN CAPITAL LETTER N WITH SMALL LETTER J]
-"\u01CB" => "Nj"
-
-# \u24a9 [PARENTHESIZED LATIN SMALL LETTER N]
-"\u24A9" => "(n)"
-
-# \u01cc [LATIN SMALL LETTER NJ]
-"\u01CC" => "nj"
-
-# � [LATIN CAPITAL LETTER O WITH GRAVE]
-"\u00D2" => "O"
-
-# � [LATIN CAPITAL LETTER O WITH ACUTE]
-"\u00D3" => "O"
-
-# � [LATIN CAPITAL LETTER O WITH CIRCUMFLEX]
-"\u00D4" => "O"
-
-# � [LATIN CAPITAL LETTER O WITH TILDE]
-"\u00D5" => "O"
-
-# � [LATIN CAPITAL LETTER O WITH DIAERESIS]
-"\u00D6" => "O"
-
-# � [LATIN CAPITAL LETTER O WITH STROKE]
-"\u00D8" => "O"
-
-# \u014c [LATIN CAPITAL LETTER O WITH MACRON]
-"\u014C" => "O"
-
-# \u014e [LATIN CAPITAL LETTER O WITH BREVE]
-"\u014E" => "O"
-
-# \u0150 [LATIN CAPITAL LETTER O WITH DOUBLE ACUTE]
-"\u0150" => "O"
-
-# \u0186 [LATIN CAPITAL LETTER OPEN O]
-"\u0186" => "O"
-
-# \u019f [LATIN CAPITAL LETTER O WITH MIDDLE TILDE]
-"\u019F" => "O"
-
-# \u01a0 [LATIN CAPITAL LETTER O WITH HORN]
-"\u01A0" => "O"
-
-# \u01d1 [LATIN CAPITAL LETTER O WITH CARON]
-"\u01D1" => "O"
-
-# \u01ea [LATIN CAPITAL LETTER O WITH OGONEK]
-"\u01EA" => "O"
-
-# \u01ec [LATIN CAPITAL LETTER O WITH OGONEK AND MACRON]
-"\u01EC" => "O"
-
-# \u01fe [LATIN CAPITAL LETTER O WITH STROKE AND ACUTE]
-"\u01FE" => "O"
-
-# \u020c [LATIN CAPITAL LETTER O WITH DOUBLE GRAVE]
-"\u020C" => "O"
-
-# \u020e [LATIN CAPITAL LETTER O WITH INVERTED BREVE]
-"\u020E" => "O"
-
-# \u022a [LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON]
-"\u022A" => "O"
-
-# \u022c [LATIN CAPITAL LETTER O WITH TILDE AND MACRON]
-"\u022C" => "O"
-
-# \u022e [LATIN CAPITAL LETTER O WITH DOT ABOVE]
-"\u022E" => "O"
-
-# \u0230 [LATIN CAPITAL LETTER O WITH DOT ABOVE AND MACRON]
-"\u0230" => "O"
-
-# \u1d0f [LATIN LETTER SMALL CAPITAL O]
-"\u1D0F" => "O"
-
-# \u1d10 [LATIN LETTER SMALL CAPITAL OPEN O]
-"\u1D10" => "O"
-
-# \u1e4c [LATIN CAPITAL LETTER O WITH TILDE AND ACUTE]
-"\u1E4C" => "O"
-
-# \u1e4e [LATIN CAPITAL LETTER O WITH TILDE AND DIAERESIS]
-"\u1E4E" => "O"
-
-# \u1e50 [LATIN CAPITAL LETTER O WITH MACRON AND GRAVE]
-"\u1E50" => "O"
-
-# \u1e52 [LATIN CAPITAL LETTER O WITH MACRON AND ACUTE]
-"\u1E52" => "O"
-
-# \u1ecc [LATIN CAPITAL LETTER O WITH DOT BELOW]
-"\u1ECC" => "O"
-
-# \u1ece [LATIN CAPITAL LETTER O WITH HOOK ABOVE]
-"\u1ECE" => "O"
-
-# \u1ed0 [LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND ACUTE]
-"\u1ED0" => "O"
-
-# \u1ed2 [LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND GRAVE]
-"\u1ED2" => "O"
-
-# \u1ed4 [LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND HOOK ABOVE]
-"\u1ED4" => "O"
-
-# \u1ed6 [LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND TILDE]
-"\u1ED6" => "O"
-
-# \u1ed8 [LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND DOT BELOW]
-"\u1ED8" => "O"
-
-# \u1eda [LATIN CAPITAL LETTER O WITH HORN AND ACUTE]
-"\u1EDA" => "O"
-
-# \u1edc [LATIN CAPITAL LETTER O WITH HORN AND GRAVE]
-"\u1EDC" => "O"
-
-# \u1ede [LATIN CAPITAL LETTER O WITH HORN AND HOOK ABOVE]
-"\u1EDE" => "O"
-
-# \u1ee0 [LATIN CAPITAL LETTER O WITH HORN AND TILDE]
-"\u1EE0" => "O"
-
-# \u1ee2 [LATIN CAPITAL LETTER O WITH HORN AND DOT BELOW]
-"\u1EE2" => "O"
-
-# \u24c4 [CIRCLED LATIN CAPITAL LETTER O]
-"\u24C4" => "O"
-
-# \ua74a [LATIN CAPITAL LETTER O WITH LONG STROKE OVERLAY]
-"\uA74A" => "O"
-
-# \ua74c [LATIN CAPITAL LETTER O WITH LOOP]
-"\uA74C" => "O"
-
-# \uff2f [FULLWIDTH LATIN CAPITAL LETTER O]
-"\uFF2F" => "O"
-
-# � [LATIN SMALL LETTER O WITH GRAVE]
-"\u00F2" => "o"
-
-# � [LATIN SMALL LETTER O WITH ACUTE]
-"\u00F3" => "o"
-
-# � [LATIN SMALL LETTER O WITH CIRCUMFLEX]
-"\u00F4" => "o"
-
-# � [LATIN SMALL LETTER O WITH TILDE]
-"\u00F5" => "o"
-
-# � [LATIN SMALL LETTER O WITH DIAERESIS]
-"\u00F6" => "o"
-
-# � [LATIN SMALL LETTER O WITH STROKE]
-"\u00F8" => "o"
-
-# \u014d [LATIN SMALL LETTER O WITH MACRON]
-"\u014D" => "o"
-
-# \u014f [LATIN SMALL LETTER O WITH BREVE]
-"\u014F" => "o"
-
-# \u0151 [LATIN SMALL LETTER O WITH DOUBLE ACUTE]
-"\u0151" => "o"
-
-# \u01a1 [LATIN SMALL LETTER O WITH HORN]
-"\u01A1" => "o"
-
-# \u01d2 [LATIN SMALL LETTER O WITH CARON]
-"\u01D2" => "o"
-
-# \u01eb [LATIN SMALL LETTER O WITH OGONEK]
-"\u01EB" => "o"
-
-# \u01ed [LATIN SMALL LETTER O WITH OGONEK AND MACRON]
-"\u01ED" => "o"
-
-# \u01ff [LATIN SMALL LETTER O WITH STROKE AND ACUTE]
-"\u01FF" => "o"
-
-# \u020d [LATIN SMALL LETTER O WITH DOUBLE GRAVE]
-"\u020D" => "o"
-
-# \u020f [LATIN SMALL LETTER O WITH INVERTED BREVE]
-"\u020F" => "o"
-
-# \u022b [LATIN SMALL LETTER O WITH DIAERESIS AND MACRON]
-"\u022B" => "o"
-
-# \u022d [LATIN SMALL LETTER O WITH TILDE AND MACRON]
-"\u022D" => "o"
-
-# \u022f [LATIN SMALL LETTER O WITH DOT ABOVE]
-"\u022F" => "o"
-
-# \u0231 [LATIN SMALL LETTER O WITH DOT ABOVE AND MACRON]
-"\u0231" => "o"
-
-# \u0254 [LATIN SMALL LETTER OPEN O]
-"\u0254" => "o"
-
-# \u0275 [LATIN SMALL LETTER BARRED O]
-"\u0275" => "o"
-
-# \u1d16 [LATIN SMALL LETTER TOP HALF O]
-"\u1D16" => "o"
-
-# \u1d17 [LATIN SMALL LETTER BOTTOM HALF O]
-"\u1D17" => "o"
-
-# \u1d97 [LATIN SMALL LETTER OPEN O WITH RETROFLEX HOOK]
-"\u1D97" => "o"
-
-# \u1e4d [LATIN SMALL LETTER O WITH TILDE AND ACUTE]
-"\u1E4D" => "o"
-
-# \u1e4f [LATIN SMALL LETTER O WITH TILDE AND DIAERESIS]
-"\u1E4F" => "o"
-
-# \u1e51 [LATIN SMALL LETTER O WITH MACRON AND GRAVE]
-"\u1E51" => "o"
-
-# \u1e53 [LATIN SMALL LETTER O WITH MACRON AND ACUTE]
-"\u1E53" => "o"
-
-# \u1ecd [LATIN SMALL LETTER O WITH DOT BELOW]
-"\u1ECD" => "o"
-
-# \u1ecf [LATIN SMALL LETTER O WITH HOOK ABOVE]
-"\u1ECF" => "o"
-
-# \u1ed1 [LATIN SMALL LETTER O WITH CIRCUMFLEX AND ACUTE]
-"\u1ED1" => "o"
-
-# \u1ed3 [LATIN SMALL LETTER O WITH CIRCUMFLEX AND GRAVE]
-"\u1ED3" => "o"
-
-# \u1ed5 [LATIN SMALL LETTER O WITH CIRCUMFLEX AND HOOK ABOVE]
-"\u1ED5" => "o"
-
-# \u1ed7 [LATIN SMALL LETTER O WITH CIRCUMFLEX AND TILDE]
-"\u1ED7" => "o"
-
-# \u1ed9 [LATIN SMALL LETTER O WITH CIRCUMFLEX AND DOT BELOW]
-"\u1ED9" => "o"
-
-# \u1edb [LATIN SMALL LETTER O WITH HORN AND ACUTE]
-"\u1EDB" => "o"
-
-# \u1edd [LATIN SMALL LETTER O WITH HORN AND GRAVE]
-"\u1EDD" => "o"
-
-# \u1edf [LATIN SMALL LETTER O WITH HORN AND HOOK ABOVE]
-"\u1EDF" => "o"
-
-# \u1ee1 [LATIN SMALL LETTER O WITH HORN AND TILDE]
-"\u1EE1" => "o"
-
-# \u1ee3 [LATIN SMALL LETTER O WITH HORN AND DOT BELOW]
-"\u1EE3" => "o"
-
-# \u2092 [LATIN SUBSCRIPT SMALL LETTER O]
-"\u2092" => "o"
-
-# \u24de [CIRCLED LATIN SMALL LETTER O]
-"\u24DE" => "o"
-
-# \u2c7a [LATIN SMALL LETTER O WITH LOW RING INSIDE]
-"\u2C7A" => "o"
-
-# \ua74b [LATIN SMALL LETTER O WITH LONG STROKE OVERLAY]
-"\uA74B" => "o"
-
-# \ua74d [LATIN SMALL LETTER O WITH LOOP]
-"\uA74D" => "o"
-
-# \uff4f [FULLWIDTH LATIN SMALL LETTER O]
-"\uFF4F" => "o"
-
-# \u0152 [LATIN CAPITAL LIGATURE OE]
-"\u0152" => "OE"
-
-# \u0276 [LATIN LETTER SMALL CAPITAL OE]
-"\u0276" => "OE"
-
-# \ua74e [LATIN CAPITAL LETTER OO]
-"\uA74E" => "OO"
-
-# \u0222 http://en.wikipedia.org/wiki/OU [LATIN CAPITAL LETTER OU]
-"\u0222" => "OU"
-
-# \u1d15 [LATIN LETTER SMALL CAPITAL OU]
-"\u1D15" => "OU"
-
-# \u24aa [PARENTHESIZED LATIN SMALL LETTER O]
-"\u24AA" => "(o)"
-
-# \u0153 [LATIN SMALL LIGATURE OE]
-"\u0153" => "oe"
-
-# \u1d14 [LATIN SMALL LETTER TURNED OE]
-"\u1D14" => "oe"
-
-# \ua74f [LATIN SMALL LETTER OO]
-"\uA74F" => "oo"
-
-# \u0223 http://en.wikipedia.org/wiki/OU [LATIN SMALL LETTER OU]
-"\u0223" => "ou"
-
-# \u01a4 [LATIN CAPITAL LETTER P WITH HOOK]
-"\u01A4" => "P"
-
-# \u1d18 [LATIN LETTER SMALL CAPITAL P]
-"\u1D18" => "P"
-
-# \u1e54 [LATIN CAPITAL LETTER P WITH ACUTE]
-"\u1E54" => "P"
-
-# \u1e56 [LATIN CAPITAL LETTER P WITH DOT ABOVE]
-"\u1E56" => "P"
-
-# \u24c5 [CIRCLED LATIN CAPITAL LETTER P]
-"\u24C5" => "P"
-
-# \u2c63 [LATIN CAPITAL LETTER P WITH STROKE]
-"\u2C63" => "P"
-
-# \ua750 [LATIN CAPITAL LETTER P WITH STROKE THROUGH DESCENDER]
-"\uA750" => "P"
-
-# \ua752 [LATIN CAPITAL LETTER P WITH FLOURISH]
-"\uA752" => "P"
-
-# \ua754 [LATIN CAPITAL LETTER P WITH SQUIRREL TAIL]
-"\uA754" => "P"
-
-# \uff30 [FULLWIDTH LATIN CAPITAL LETTER P]
-"\uFF30" => "P"
-
-# \u01a5 [LATIN SMALL LETTER P WITH HOOK]
-"\u01A5" => "p"
-
-# \u1d71 [LATIN SMALL LETTER P WITH MIDDLE TILDE]
-"\u1D71" => "p"
-
-# \u1d7d [LATIN SMALL LETTER P WITH STROKE]
-"\u1D7D" => "p"
-
-# \u1d88 [LATIN SMALL LETTER P WITH PALATAL HOOK]
-"\u1D88" => "p"
-
-# \u1e55 [LATIN SMALL LETTER P WITH ACUTE]
-"\u1E55" => "p"
-
-# \u1e57 [LATIN SMALL LETTER P WITH DOT ABOVE]
-"\u1E57" => "p"
-
-# \u24df [CIRCLED LATIN SMALL LETTER P]
-"\u24DF" => "p"
-
-# \ua751 [LATIN SMALL LETTER P WITH STROKE THROUGH DESCENDER]
-"\uA751" => "p"
-
-# \ua753 [LATIN SMALL LETTER P WITH FLOURISH]
-"\uA753" => "p"
-
-# \ua755 [LATIN SMALL LETTER P WITH SQUIRREL TAIL]
-"\uA755" => "p"
-
-# \ua7fc [LATIN EPIGRAPHIC LETTER REVERSED P]
-"\uA7FC" => "p"
-
-# \uff50 [FULLWIDTH LATIN SMALL LETTER P]
-"\uFF50" => "p"
-
-# \u24ab [PARENTHESIZED LATIN SMALL LETTER P]
-"\u24AB" => "(p)"
-
-# \u024a [LATIN CAPITAL LETTER SMALL Q WITH HOOK TAIL]
-"\u024A" => "Q"
-
-# \u24c6 [CIRCLED LATIN CAPITAL LETTER Q]
-"\u24C6" => "Q"
-
-# \ua756 [LATIN CAPITAL LETTER Q WITH STROKE THROUGH DESCENDER]
-"\uA756" => "Q"
-
-# \ua758 [LATIN CAPITAL LETTER Q WITH DIAGONAL STROKE]
-"\uA758" => "Q"
-
-# \uff31 [FULLWIDTH LATIN CAPITAL LETTER Q]
-"\uFF31" => "Q"
-
-# \u0138 http://en.wikipedia.org/wiki/Kra_(letter) [LATIN SMALL LETTER KRA]
-"\u0138" => "q"
-
-# \u024b [LATIN SMALL LETTER Q WITH HOOK TAIL]
-"\u024B" => "q"
-
-# \u02a0 [LATIN SMALL LETTER Q WITH HOOK]
-"\u02A0" => "q"
-
-# \u24e0 [CIRCLED LATIN SMALL LETTER Q]
-"\u24E0" => "q"
-
-# \ua757 [LATIN SMALL LETTER Q WITH STROKE THROUGH DESCENDER]
-"\uA757" => "q"
-
-# \ua759 [LATIN SMALL LETTER Q WITH DIAGONAL STROKE]
-"\uA759" => "q"
-
-# \uff51 [FULLWIDTH LATIN SMALL LETTER Q]
-"\uFF51" => "q"
-
-# \u24ac [PARENTHESIZED LATIN SMALL LETTER Q]
-"\u24AC" => "(q)"
-
-# \u0239 [LATIN SMALL LETTER QP DIGRAPH]
-"\u0239" => "qp"
-
-# \u0154 [LATIN CAPITAL LETTER R WITH ACUTE]
-"\u0154" => "R"
-
-# \u0156 [LATIN CAPITAL LETTER R WITH CEDILLA]
-"\u0156" => "R"
-
-# \u0158 [LATIN CAPITAL LETTER R WITH CARON]
-"\u0158" => "R"
-
-# \u0212 [LATIN CAPITAL LETTER R WITH DOUBLE GRAVE]
-"\u0210" => "R"
-
-# \u0212 [LATIN CAPITAL LETTER R WITH INVERTED BREVE]
-"\u0212" => "R"
-
-# \u024c [LATIN CAPITAL LETTER R WITH STROKE]
-"\u024C" => "R"
-
-# \u0280 [LATIN LETTER SMALL CAPITAL R]
-"\u0280" => "R"
-
-# \u0281 [LATIN LETTER SMALL CAPITAL INVERTED R]
-"\u0281" => "R"
-
-# \u1d19 [LATIN LETTER SMALL CAPITAL REVERSED R]
-"\u1D19" => "R"
-
-# \u1d1a [LATIN LETTER SMALL CAPITAL TURNED R]
-"\u1D1A" => "R"
-
-# \u1e58 [LATIN CAPITAL LETTER R WITH DOT ABOVE]
-"\u1E58" => "R"
-
-# \u1e5a [LATIN CAPITAL LETTER R WITH DOT BELOW]
-"\u1E5A" => "R"
-
-# \u1e5c [LATIN CAPITAL LETTER R WITH DOT BELOW AND MACRON]
-"\u1E5C" => "R"
-
-# \u1e5e [LATIN CAPITAL LETTER R WITH LINE BELOW]
-"\u1E5E" => "R"
-
-# \u24c7 [CIRCLED LATIN CAPITAL LETTER R]
-"\u24C7" => "R"
-
-# \u2c64 [LATIN CAPITAL LETTER R WITH TAIL]
-"\u2C64" => "R"
-
-# \ua75a [LATIN CAPITAL LETTER R ROTUNDA]
-"\uA75A" => "R"
-
-# \ua782 [LATIN CAPITAL LETTER INSULAR R]
-"\uA782" => "R"
-
-# \uff32 [FULLWIDTH LATIN CAPITAL LETTER R]
-"\uFF32" => "R"
-
-# \u0155 [LATIN SMALL LETTER R WITH ACUTE]
-"\u0155" => "r"
-
-# \u0157 [LATIN SMALL LETTER R WITH CEDILLA]
-"\u0157" => "r"
-
-# \u0159 [LATIN SMALL LETTER R WITH CARON]
-"\u0159" => "r"
-
-# \u0211 [LATIN SMALL LETTER R WITH DOUBLE GRAVE]
-"\u0211" => "r"
-
-# \u0213 [LATIN SMALL LETTER R WITH INVERTED BREVE]
-"\u0213" => "r"
-
-# \u024d [LATIN SMALL LETTER R WITH STROKE]
-"\u024D" => "r"
-
-# \u027c [LATIN SMALL LETTER R WITH LONG LEG]
-"\u027C" => "r"
-
-# \u027d [LATIN SMALL LETTER R WITH TAIL]
-"\u027D" => "r"
-
-# \u027e [LATIN SMALL LETTER R WITH FISHHOOK]
-"\u027E" => "r"
-
-# \u027f [LATIN SMALL LETTER REVERSED R WITH FISHHOOK]
-"\u027F" => "r"
-
-# \u1d63 [LATIN SUBSCRIPT SMALL LETTER R]
-"\u1D63" => "r"
-
-# \u1d72 [LATIN SMALL LETTER R WITH MIDDLE TILDE]
-"\u1D72" => "r"
-
-# \u1d73 [LATIN SMALL LETTER R WITH FISHHOOK AND MIDDLE TILDE]
-"\u1D73" => "r"
-
-# \u1d89 [LATIN SMALL LETTER R WITH PALATAL HOOK]
-"\u1D89" => "r"
-
-# \u1e59 [LATIN SMALL LETTER R WITH DOT ABOVE]
-"\u1E59" => "r"
-
-# \u1e5b [LATIN SMALL LETTER R WITH DOT BELOW]
-"\u1E5B" => "r"
-
-# \u1e5d [LATIN SMALL LETTER R WITH DOT BELOW AND MACRON]
-"\u1E5D" => "r"
-
-# \u1e5f [LATIN SMALL LETTER R WITH LINE BELOW]
-"\u1E5F" => "r"
-
-# \u24e1 [CIRCLED LATIN SMALL LETTER R]
-"\u24E1" => "r"
-
-# \ua75b [LATIN SMALL LETTER R ROTUNDA]
-"\uA75B" => "r"
-
-# \ua783 [LATIN SMALL LETTER INSULAR R]
-"\uA783" => "r"
-
-# \uff52 [FULLWIDTH LATIN SMALL LETTER R]
-"\uFF52" => "r"
-
-# \u24ad [PARENTHESIZED LATIN SMALL LETTER R]
-"\u24AD" => "(r)"
-
-# \u015a [LATIN CAPITAL LETTER S WITH ACUTE]
-"\u015A" => "S"
-
-# \u015c [LATIN CAPITAL LETTER S WITH CIRCUMFLEX]
-"\u015C" => "S"
-
-# \u015e [LATIN CAPITAL LETTER S WITH CEDILLA]
-"\u015E" => "S"
-
-# \u0160 [LATIN CAPITAL LETTER S WITH CARON]
-"\u0160" => "S"
-
-# \u0218 [LATIN CAPITAL LETTER S WITH COMMA BELOW]
-"\u0218" => "S"
-
-# \u1e60 [LATIN CAPITAL LETTER S WITH DOT ABOVE]
-"\u1E60" => "S"
-
-# \u1e62 [LATIN CAPITAL LETTER S WITH DOT BELOW]
-"\u1E62" => "S"
-
-# \u1e64 [LATIN CAPITAL LETTER S WITH ACUTE AND DOT ABOVE]
-"\u1E64" => "S"
-
-# \u1e66 [LATIN CAPITAL LETTER S WITH CARON AND DOT ABOVE]
-"\u1E66" => "S"
-
-# \u1e68 [LATIN CAPITAL LETTER S WITH DOT BELOW AND DOT ABOVE]
-"\u1E68" => "S"
-
-# \u24c8 [CIRCLED LATIN CAPITAL LETTER S]
-"\u24C8" => "S"
-
-# \ua731 [LATIN LETTER SMALL CAPITAL S]
-"\uA731" => "S"
-
-# \ua785 [LATIN SMALL LETTER INSULAR S]
-"\uA785" => "S"
-
-# \uff33 [FULLWIDTH LATIN CAPITAL LETTER S]
-"\uFF33" => "S"
-
-# \u015b [LATIN SMALL LETTER S WITH ACUTE]
-"\u015B" => "s"
-
-# \u015d [LATIN SMALL LETTER S WITH CIRCUMFLEX]
-"\u015D" => "s"
-
-# \u015f [LATIN SMALL LETTER S WITH CEDILLA]
-"\u015F" => "s"
-
-# \u0161 [LATIN SMALL LETTER S WITH CARON]
-"\u0161" => "s"
-
-# \u017f http://en.wikipedia.org/wiki/Long_S [LATIN SMALL LETTER LONG S]
-"\u017F" => "s"
-
-# \u0219 [LATIN SMALL LETTER S WITH COMMA BELOW]
-"\u0219" => "s"
-
-# \u023f [LATIN SMALL LETTER S WITH SWASH TAIL]
-"\u023F" => "s"
-
-# \u0282 [LATIN SMALL LETTER S WITH HOOK]
-"\u0282" => "s"
-
-# \u1d74 [LATIN SMALL LETTER S WITH MIDDLE TILDE]
-"\u1D74" => "s"
-
-# \u1d8a [LATIN SMALL LETTER S WITH PALATAL HOOK]
-"\u1D8A" => "s"
-
-# \u1e61 [LATIN SMALL LETTER S WITH DOT ABOVE]
-"\u1E61" => "s"
-
-# \u1e63 [LATIN SMALL LETTER S WITH DOT BELOW]
-"\u1E63" => "s"
-
-# \u1e65 [LATIN SMALL LETTER S WITH ACUTE AND DOT ABOVE]
-"\u1E65" => "s"
-
-# \u1e67 [LATIN SMALL LETTER S WITH CARON AND DOT ABOVE]
-"\u1E67" => "s"
-
-# \u1e69 [LATIN SMALL LETTER S WITH DOT BELOW AND DOT ABOVE]
-"\u1E69" => "s"
-
-# \u1e9c [LATIN SMALL LETTER LONG S WITH DIAGONAL STROKE]
-"\u1E9C" => "s"
-
-# \u1e9d [LATIN SMALL LETTER LONG S WITH HIGH STROKE]
-"\u1E9D" => "s"
-
-# \u24e2 [CIRCLED LATIN SMALL LETTER S]
-"\u24E2" => "s"
-
-# \ua784 [LATIN CAPITAL LETTER INSULAR S]
-"\uA784" => "s"
-
-# \uff53 [FULLWIDTH LATIN SMALL LETTER S]
-"\uFF53" => "s"
-
-# \u1e9e [LATIN CAPITAL LETTER SHARP S]
-"\u1E9E" => "SS"
-
-# \u24ae [PARENTHESIZED LATIN SMALL LETTER S]
-"\u24AE" => "(s)"
-
-# � [LATIN SMALL LETTER SHARP S]
-"\u00DF" => "ss"
-
-# \ufb06 [LATIN SMALL LIGATURE ST]
-"\uFB06" => "st"
-
-# \u0162 [LATIN CAPITAL LETTER T WITH CEDILLA]
-"\u0162" => "T"
-
-# \u0164 [LATIN CAPITAL LETTER T WITH CARON]
-"\u0164" => "T"
-
-# \u0166 [LATIN CAPITAL LETTER T WITH STROKE]
-"\u0166" => "T"
-
-# \u01ac [LATIN CAPITAL LETTER T WITH HOOK]
-"\u01AC" => "T"
-
-# \u01ae [LATIN CAPITAL LETTER T WITH RETROFLEX HOOK]
-"\u01AE" => "T"
-
-# \u021a [LATIN CAPITAL LETTER T WITH COMMA BELOW]
-"\u021A" => "T"
-
-# \u023e [LATIN CAPITAL LETTER T WITH DIAGONAL STROKE]
-"\u023E" => "T"
-
-# \u1d1b [LATIN LETTER SMALL CAPITAL T]
-"\u1D1B" => "T"
-
-# \u1e6a [LATIN CAPITAL LETTER T WITH DOT ABOVE]
-"\u1E6A" => "T"
-
-# \u1e6c [LATIN CAPITAL LETTER T WITH DOT BELOW]
-"\u1E6C" => "T"
-
-# \u1e6e [LATIN CAPITAL LETTER T WITH LINE BELOW]
-"\u1E6E" => "T"
-
-# \u1e70 [LATIN CAPITAL LETTER T WITH CIRCUMFLEX BELOW]
-"\u1E70" => "T"
-
-# \u24c9 [CIRCLED LATIN CAPITAL LETTER T]
-"\u24C9" => "T"
-
-# \ua786 [LATIN CAPITAL LETTER INSULAR T]
-"\uA786" => "T"
-
-# \uff34 [FULLWIDTH LATIN CAPITAL LETTER T]
-"\uFF34" => "T"
-
-# \u0163 [LATIN SMALL LETTER T WITH CEDILLA]
-"\u0163" => "t"
-
-# \u0165 [LATIN SMALL LETTER T WITH CARON]
-"\u0165" => "t"
-
-# \u0167 [LATIN SMALL LETTER T WITH STROKE]
-"\u0167" => "t"
-
-# \u01ab [LATIN SMALL LETTER T WITH PALATAL HOOK]
-"\u01AB" => "t"
-
-# \u01ad [LATIN SMALL LETTER T WITH HOOK]
-"\u01AD" => "t"
-
-# \u021b [LATIN SMALL LETTER T WITH COMMA BELOW]
-"\u021B" => "t"
-
-# \u0236 [LATIN SMALL LETTER T WITH CURL]
-"\u0236" => "t"
-
-# \u0287 [LATIN SMALL LETTER TURNED T]
-"\u0287" => "t"
-
-# \u0288 [LATIN SMALL LETTER T WITH RETROFLEX HOOK]
-"\u0288" => "t"
-
-# \u1d75 [LATIN SMALL LETTER T WITH MIDDLE TILDE]
-"\u1D75" => "t"
-
-# \u1e6b [LATIN SMALL LETTER T WITH DOT ABOVE]
-"\u1E6B" => "t"
-
-# \u1e6d [LATIN SMALL LETTER T WITH DOT BELOW]
-"\u1E6D" => "t"
-
-# \u1e6f [LATIN SMALL LETTER T WITH LINE BELOW]
-"\u1E6F" => "t"
-
-# \u1e71 [LATIN SMALL LETTER T WITH CIRCUMFLEX BELOW]
-"\u1E71" => "t"
-
-# \u1e97 [LATIN SMALL LETTER T WITH DIAERESIS]
-"\u1E97" => "t"
-
-# \u24e3 [CIRCLED LATIN SMALL LETTER T]
-"\u24E3" => "t"
-
-# \u2c66 [LATIN SMALL LETTER T WITH DIAGONAL STROKE]
-"\u2C66" => "t"
-
-# \uff54 [FULLWIDTH LATIN SMALL LETTER T]
-"\uFF54" => "t"
-
-# � [LATIN CAPITAL LETTER THORN]
-"\u00DE" => "TH"
-
-# \ua766 [LATIN CAPITAL LETTER THORN WITH STROKE THROUGH DESCENDER]
-"\uA766" => "TH"
-
-# \ua728 [LATIN CAPITAL LETTER TZ]
-"\uA728" => "TZ"
-
-# \u24af [PARENTHESIZED LATIN SMALL LETTER T]
-"\u24AF" => "(t)"
-
-# \u02a8 [LATIN SMALL LETTER TC DIGRAPH WITH CURL]
-"\u02A8" => "tc"
-
-# � [LATIN SMALL LETTER THORN]
-"\u00FE" => "th"
-
-# \u1d7a [LATIN SMALL LETTER TH WITH STRIKETHROUGH]
-"\u1D7A" => "th"
-
-# \ua767 [LATIN SMALL LETTER THORN WITH STROKE THROUGH DESCENDER]
-"\uA767" => "th"
-
-# \u02a6 [LATIN SMALL LETTER TS DIGRAPH]
-"\u02A6" => "ts"
-
-# \ua729 [LATIN SMALL LETTER TZ]
-"\uA729" => "tz"
-
-# � [LATIN CAPITAL LETTER U WITH GRAVE]
-"\u00D9" => "U"
-
-# � [LATIN CAPITAL LETTER U WITH ACUTE]
-"\u00DA" => "U"
-
-# � [LATIN CAPITAL LETTER U WITH CIRCUMFLEX]
-"\u00DB" => "U"
-
-# � [LATIN CAPITAL LETTER U WITH DIAERESIS]
-"\u00DC" => "U"
-
-# \u0168 [LATIN CAPITAL LETTER U WITH TILDE]
-"\u0168" => "U"
-
-# \u016a [LATIN CAPITAL LETTER U WITH MACRON]
-"\u016A" => "U"
-
-# \u016c [LATIN CAPITAL LETTER U WITH BREVE]
-"\u016C" => "U"
-
-# \u016e [LATIN CAPITAL LETTER U WITH RING ABOVE]
-"\u016E" => "U"
-
-# \u0170 [LATIN CAPITAL LETTER U WITH DOUBLE ACUTE]
-"\u0170" => "U"
-
-# \u0172 [LATIN CAPITAL LETTER U WITH OGONEK]
-"\u0172" => "U"
-
-# \u01af [LATIN CAPITAL LETTER U WITH HORN]
-"\u01AF" => "U"
-
-# \u01d3 [LATIN CAPITAL LETTER U WITH CARON]
-"\u01D3" => "U"
-
-# \u01d5 [LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON]
-"\u01D5" => "U"
-
-# \u01d7 [LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE]
-"\u01D7" => "U"
-
-# \u01d9 [LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON]
-"\u01D9" => "U"
-
-# \u01db [LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE]
-"\u01DB" => "U"
-
-# \u0214 [LATIN CAPITAL LETTER U WITH DOUBLE GRAVE]
-"\u0214" => "U"
-
-# \u0216 [LATIN CAPITAL LETTER U WITH INVERTED BREVE]
-"\u0216" => "U"
-
-# \u0244 [LATIN CAPITAL LETTER U BAR]
-"\u0244" => "U"
-
-# \u1d1c [LATIN LETTER SMALL CAPITAL U]
-"\u1D1C" => "U"
-
-# \u1d7e [LATIN SMALL CAPITAL LETTER U WITH STROKE]
-"\u1D7E" => "U"
-
-# \u1e72 [LATIN CAPITAL LETTER U WITH DIAERESIS BELOW]
-"\u1E72" => "U"
-
-# \u1e74 [LATIN CAPITAL LETTER U WITH TILDE BELOW]
-"\u1E74" => "U"
-
-# \u1e76 [LATIN CAPITAL LETTER U WITH CIRCUMFLEX BELOW]
-"\u1E76" => "U"
-
-# \u1e78 [LATIN CAPITAL LETTER U WITH TILDE AND ACUTE]
-"\u1E78" => "U"
-
-# \u1e7a [LATIN CAPITAL LETTER U WITH MACRON AND DIAERESIS]
-"\u1E7A" => "U"
-
-# \u1ee4 [LATIN CAPITAL LETTER U WITH DOT BELOW]
-"\u1EE4" => "U"
-
-# \u1ee6 [LATIN CAPITAL LETTER U WITH HOOK ABOVE]
-"\u1EE6" => "U"
-
-# \u1ee8 [LATIN CAPITAL LETTER U WITH HORN AND ACUTE]
-"\u1EE8" => "U"
-
-# \u1eea [LATIN CAPITAL LETTER U WITH HORN AND GRAVE]
-"\u1EEA" => "U"
-
-# \u1eec [LATIN CAPITAL LETTER U WITH HORN AND HOOK ABOVE]
-"\u1EEC" => "U"
-
-# \u1eee [LATIN CAPITAL LETTER U WITH HORN AND TILDE]
-"\u1EEE" => "U"
-
-# \u1ef0 [LATIN CAPITAL LETTER U WITH HORN AND DOT BELOW]
-"\u1EF0" => "U"
-
-# \u24ca [CIRCLED LATIN CAPITAL LETTER U]
-"\u24CA" => "U"
-
-# \uff35 [FULLWIDTH LATIN CAPITAL LETTER U]
-"\uFF35" => "U"
-
-# � [LATIN SMALL LETTER U WITH GRAVE]
-"\u00F9" => "u"
-
-# � [LATIN SMALL LETTER U WITH ACUTE]
-"\u00FA" => "u"
-
-# � [LATIN SMALL LETTER U WITH CIRCUMFLEX]
-"\u00FB" => "u"
-
-# � [LATIN SMALL LETTER U WITH DIAERESIS]
-"\u00FC" => "u"
-
-# \u0169 [LATIN SMALL LETTER U WITH TILDE]
-"\u0169" => "u"
-
-# \u016b [LATIN SMALL LETTER U WITH MACRON]
-"\u016B" => "u"
-
-# \u016d [LATIN SMALL LETTER U WITH BREVE]
-"\u016D" => "u"
-
-# \u016f [LATIN SMALL LETTER U WITH RING ABOVE]
-"\u016F" => "u"
-
-# \u0171 [LATIN SMALL LETTER U WITH DOUBLE ACUTE]
-"\u0171" => "u"
-
-# \u0173 [LATIN SMALL LETTER U WITH OGONEK]
-"\u0173" => "u"
-
-# \u01b0 [LATIN SMALL LETTER U WITH HORN]
-"\u01B0" => "u"
-
-# \u01d4 [LATIN SMALL LETTER U WITH CARON]
-"\u01D4" => "u"
-
-# \u01d6 [LATIN SMALL LETTER U WITH DIAERESIS AND MACRON]
-"\u01D6" => "u"
-
-# \u01d8 [LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE]
-"\u01D8" => "u"
-
-# \u01da [LATIN SMALL LETTER U WITH DIAERESIS AND CARON]
-"\u01DA" => "u"
-
-# \u01dc [LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE]
-"\u01DC" => "u"
-
-# \u0215 [LATIN SMALL LETTER U WITH DOUBLE GRAVE]
-"\u0215" => "u"
-
-# \u0217 [LATIN SMALL LETTER U WITH INVERTED BREVE]
-"\u0217" => "u"
-
-# \u0289 [LATIN SMALL LETTER U BAR]
-"\u0289" => "u"
-
-# \u1d64 [LATIN SUBSCRIPT SMALL LETTER U]
-"\u1D64" => "u"
-
-# \u1d99 [LATIN SMALL LETTER U WITH RETROFLEX HOOK]
-"\u1D99" => "u"
-
-# \u1e73 [LATIN SMALL LETTER U WITH DIAERESIS BELOW]
-"\u1E73" => "u"
-
-# \u1e75 [LATIN SMALL LETTER U WITH TILDE BELOW]
-"\u1E75" => "u"
-
-# \u1e77 [LATIN SMALL LETTER U WITH CIRCUMFLEX BELOW]
-"\u1E77" => "u"
-
-# \u1e79 [LATIN SMALL LETTER U WITH TILDE AND ACUTE]
-"\u1E79" => "u"
-
-# \u1e7b [LATIN SMALL LETTER U WITH MACRON AND DIAERESIS]
-"\u1E7B" => "u"
-
-# \u1ee5 [LATIN SMALL LETTER U WITH DOT BELOW]
-"\u1EE5" => "u"
-
-# \u1ee7 [LATIN SMALL LETTER U WITH HOOK ABOVE]
-"\u1EE7" => "u"
-
-# \u1ee9 [LATIN SMALL LETTER U WITH HORN AND ACUTE]
-"\u1EE9" => "u"
-
-# \u1eeb [LATIN SMALL LETTER U WITH HORN AND GRAVE]
-"\u1EEB" => "u"
-
-# \u1eed [LATIN SMALL LETTER U WITH HORN AND HOOK ABOVE]
-"\u1EED" => "u"
-
-# \u1eef [LATIN SMALL LETTER U WITH HORN AND TILDE]
-"\u1EEF" => "u"
-
-# \u1ef1 [LATIN SMALL LETTER U WITH HORN AND DOT BELOW]
-"\u1EF1" => "u"
-
-# \u24e4 [CIRCLED LATIN SMALL LETTER U]
-"\u24E4" => "u"
-
-# \uff55 [FULLWIDTH LATIN SMALL LETTER U]
-"\uFF55" => "u"
-
-# \u24b0 [PARENTHESIZED LATIN SMALL LETTER U]
-"\u24B0" => "(u)"
-
-# \u1d6b [LATIN SMALL LETTER UE]
-"\u1D6B" => "ue"
-
-# \u01b2 [LATIN CAPITAL LETTER V WITH HOOK]
-"\u01B2" => "V"
-
-# \u0245 [LATIN CAPITAL LETTER TURNED V]
-"\u0245" => "V"
-
-# \u1d20 [LATIN LETTER SMALL CAPITAL V]
-"\u1D20" => "V"
-
-# \u1e7c [LATIN CAPITAL LETTER V WITH TILDE]
-"\u1E7C" => "V"
-
-# \u1e7e [LATIN CAPITAL LETTER V WITH DOT BELOW]
-"\u1E7E" => "V"
-
-# \u1efc [LATIN CAPITAL LETTER MIDDLE-WELSH V]
-"\u1EFC" => "V"
-
-# \u24cb [CIRCLED LATIN CAPITAL LETTER V]
-"\u24CB" => "V"
-
-# \ua75e [LATIN CAPITAL LETTER V WITH DIAGONAL STROKE]
-"\uA75E" => "V"
-
-# \ua768 [LATIN CAPITAL LETTER VEND]
-"\uA768" => "V"
-
-# \uff36 [FULLWIDTH LATIN CAPITAL LETTER V]
-"\uFF36" => "V"
-
-# \u028b [LATIN SMALL LETTER V WITH HOOK]
-"\u028B" => "v"
-
-# \u028c [LATIN SMALL LETTER TURNED V]
-"\u028C" => "v"
-
-# \u1d65 [LATIN SUBSCRIPT SMALL LETTER V]
-"\u1D65" => "v"
-
-# \u1d8c [LATIN SMALL LETTER V WITH PALATAL HOOK]
-"\u1D8C" => "v"
-
-# \u1e7d [LATIN SMALL LETTER V WITH TILDE]
-"\u1E7D" => "v"
-
-# \u1e7f [LATIN SMALL LETTER V WITH DOT BELOW]
-"\u1E7F" => "v"
-
-# \u24e5 [CIRCLED LATIN SMALL LETTER V]
-"\u24E5" => "v"
-
-# \u2c71 [LATIN SMALL LETTER V WITH RIGHT HOOK]
-"\u2C71" => "v"
-
-# \u2c74 [LATIN SMALL LETTER V WITH CURL]
-"\u2C74" => "v"
-
-# \ua75f [LATIN SMALL LETTER V WITH DIAGONAL STROKE]
-"\uA75F" => "v"
-
-# \uff56 [FULLWIDTH LATIN SMALL LETTER V]
-"\uFF56" => "v"
-
-# \ua760 [LATIN CAPITAL LETTER VY]
-"\uA760" => "VY"
-
-# \u24b1 [PARENTHESIZED LATIN SMALL LETTER V]
-"\u24B1" => "(v)"
-
-# \ua761 [LATIN SMALL LETTER VY]
-"\uA761" => "vy"
-
-# \u0174 [LATIN CAPITAL LETTER W WITH CIRCUMFLEX]
-"\u0174" => "W"
-
-# \u01f7 http://en.wikipedia.org/wiki/Wynn [LATIN CAPITAL LETTER WYNN]
-"\u01F7" => "W"
-
-# \u1d21 [LATIN LETTER SMALL CAPITAL W]
-"\u1D21" => "W"
-
-# \u1e80 [LATIN CAPITAL LETTER W WITH GRAVE]
-"\u1E80" => "W"
-
-# \u1e82 [LATIN CAPITAL LETTER W WITH ACUTE]
-"\u1E82" => "W"
-
-# \u1e84 [LATIN CAPITAL LETTER W WITH DIAERESIS]
-"\u1E84" => "W"
-
-# \u1e86 [LATIN CAPITAL LETTER W WITH DOT ABOVE]
-"\u1E86" => "W"
-
-# \u1e88 [LATIN CAPITAL LETTER W WITH DOT BELOW]
-"\u1E88" => "W"
-
-# \u24cc [CIRCLED LATIN CAPITAL LETTER W]
-"\u24CC" => "W"
-
-# \u2c72 [LATIN CAPITAL LETTER W WITH HOOK]
-"\u2C72" => "W"
-
-# \uff37 [FULLWIDTH LATIN CAPITAL LETTER W]
-"\uFF37" => "W"
-
-# \u0175 [LATIN SMALL LETTER W WITH CIRCUMFLEX]
-"\u0175" => "w"
-
-# \u01bf http://en.wikipedia.org/wiki/Wynn [LATIN LETTER WYNN]
-"\u01BF" => "w"
-
-# \u028d [LATIN SMALL LETTER TURNED W]
-"\u028D" => "w"
-
-# \u1e81 [LATIN SMALL LETTER W WITH GRAVE]
-"\u1E81" => "w"
-
-# \u1e83 [LATIN SMALL LETTER W WITH ACUTE]
-"\u1E83" => "w"
-
-# \u1e85 [LATIN SMALL LETTER W WITH DIAERESIS]
-"\u1E85" => "w"
-
-# \u1e87 [LATIN SMALL LETTER W WITH DOT ABOVE]
-"\u1E87" => "w"
-
-# \u1e89 [LATIN SMALL LETTER W WITH DOT BELOW]
-"\u1E89" => "w"
-
-# \u1e98 [LATIN SMALL LETTER W WITH RING ABOVE]
-"\u1E98" => "w"
-
-# \u24e6 [CIRCLED LATIN SMALL LETTER W]
-"\u24E6" => "w"
-
-# \u2c73 [LATIN SMALL LETTER W WITH HOOK]
-"\u2C73" => "w"
-
-# \uff57 [FULLWIDTH LATIN SMALL LETTER W]
-"\uFF57" => "w"
-
-# \u24b2 [PARENTHESIZED LATIN SMALL LETTER W]
-"\u24B2" => "(w)"
-
-# \u1e8a [LATIN CAPITAL LETTER X WITH DOT ABOVE]
-"\u1E8A" => "X"
-
-# \u1e8c [LATIN CAPITAL LETTER X WITH DIAERESIS]
-"\u1E8C" => "X"
-
-# \u24cd [CIRCLED LATIN CAPITAL LETTER X]
-"\u24CD" => "X"
-
-# \uff38 [FULLWIDTH LATIN CAPITAL LETTER X]
-"\uFF38" => "X"
-
-# \u1d8d [LATIN SMALL LETTER X WITH PALATAL HOOK]
-"\u1D8D" => "x"
-
-# \u1e8b [LATIN SMALL LETTER X WITH DOT ABOVE]
-"\u1E8B" => "x"
-
-# \u1e8d [LATIN SMALL LETTER X WITH DIAERESIS]
-"\u1E8D" => "x"
-
-# \u2093 [LATIN SUBSCRIPT SMALL LETTER X]
-"\u2093" => "x"
-
-# \u24e7 [CIRCLED LATIN SMALL LETTER X]
-"\u24E7" => "x"
-
-# \uff58 [FULLWIDTH LATIN SMALL LETTER X]
-"\uFF58" => "x"
-
-# \u24b3 [PARENTHESIZED LATIN SMALL LETTER X]
-"\u24B3" => "(x)"
-
-# � [LATIN CAPITAL LETTER Y WITH ACUTE]
-"\u00DD" => "Y"
-
-# \u0176 [LATIN CAPITAL LETTER Y WITH CIRCUMFLEX]
-"\u0176" => "Y"
-
-# \u0178 [LATIN CAPITAL LETTER Y WITH DIAERESIS]
-"\u0178" => "Y"
-
-# \u01b3 [LATIN CAPITAL LETTER Y WITH HOOK]
-"\u01B3" => "Y"
-
-# \u0232 [LATIN CAPITAL LETTER Y WITH MACRON]
-"\u0232" => "Y"
-
-# \u024e [LATIN CAPITAL LETTER Y WITH STROKE]
-"\u024E" => "Y"
-
-# \u028f [LATIN LETTER SMALL CAPITAL Y]
-"\u028F" => "Y"
-
-# \u1e8e [LATIN CAPITAL LETTER Y WITH DOT ABOVE]
-"\u1E8E" => "Y"
-
-# \u1ef2 [LATIN CAPITAL LETTER Y WITH GRAVE]
-"\u1EF2" => "Y"
-
-# \u1ef4 [LATIN CAPITAL LETTER Y WITH DOT BELOW]
-"\u1EF4" => "Y"
-
-# \u1ef6 [LATIN CAPITAL LETTER Y WITH HOOK ABOVE]
-"\u1EF6" => "Y"
-
-# \u1ef8 [LATIN CAPITAL LETTER Y WITH TILDE]
-"\u1EF8" => "Y"
-
-# \u1efe [LATIN CAPITAL LETTER Y WITH LOOP]
-"\u1EFE" => "Y"
-
-# \u24ce [CIRCLED LATIN CAPITAL LETTER Y]
-"\u24CE" => "Y"
-
-# \uff39 [FULLWIDTH LATIN CAPITAL LETTER Y]
-"\uFF39" => "Y"
-
-# � [LATIN SMALL LETTER Y WITH ACUTE]
-"\u00FD" => "y"
-
-# � [LATIN SMALL LETTER Y WITH DIAERESIS]
-"\u00FF" => "y"
-
-# \u0177 [LATIN SMALL LETTER Y WITH CIRCUMFLEX]
-"\u0177" => "y"
-
-# \u01b4 [LATIN SMALL LETTER Y WITH HOOK]
-"\u01B4" => "y"
-
-# \u0233 [LATIN SMALL LETTER Y WITH MACRON]
-"\u0233" => "y"
-
-# \u024f [LATIN SMALL LETTER Y WITH STROKE]
-"\u024F" => "y"
-
-# \u028e [LATIN SMALL LETTER TURNED Y]
-"\u028E" => "y"
-
-# \u1e8f [LATIN SMALL LETTER Y WITH DOT ABOVE]
-"\u1E8F" => "y"
-
-# \u1e99 [LATIN SMALL LETTER Y WITH RING ABOVE]
-"\u1E99" => "y"
-
-# \u1ef3 [LATIN SMALL LETTER Y WITH GRAVE]
-"\u1EF3" => "y"
-
-# \u1ef5 [LATIN SMALL LETTER Y WITH DOT BELOW]
-"\u1EF5" => "y"
-
-# \u1ef7 [LATIN SMALL LETTER Y WITH HOOK ABOVE]
-"\u1EF7" => "y"
-
-# \u1ef9 [LATIN SMALL LETTER Y WITH TILDE]
-"\u1EF9" => "y"
-
-# \u1eff [LATIN SMALL LETTER Y WITH LOOP]
-"\u1EFF" => "y"
-
-# \u24e8 [CIRCLED LATIN SMALL LETTER Y]
-"\u24E8" => "y"
-
-# \uff59 [FULLWIDTH LATIN SMALL LETTER Y]
-"\uFF59" => "y"
-
-# \u24b4 [PARENTHESIZED LATIN SMALL LETTER Y]
-"\u24B4" => "(y)"
-
-# \u0179 [LATIN CAPITAL LETTER Z WITH ACUTE]
-"\u0179" => "Z"
-
-# \u017b [LATIN CAPITAL LETTER Z WITH DOT ABOVE]
-"\u017B" => "Z"
-
-# \u017d [LATIN CAPITAL LETTER Z WITH CARON]
-"\u017D" => "Z"
-
-# \u01b5 [LATIN CAPITAL LETTER Z WITH STROKE]
-"\u01B5" => "Z"
-
-# \u021c http://en.wikipedia.org/wiki/Yogh [LATIN CAPITAL LETTER YOGH]
-"\u021C" => "Z"
-
-# \u0224 [LATIN CAPITAL LETTER Z WITH HOOK]
-"\u0224" => "Z"
-
-# \u1d22 [LATIN LETTER SMALL CAPITAL Z]
-"\u1D22" => "Z"
-
-# \u1e90 [LATIN CAPITAL LETTER Z WITH CIRCUMFLEX]
-"\u1E90" => "Z"
-
-# \u1e92 [LATIN CAPITAL LETTER Z WITH DOT BELOW]
-"\u1E92" => "Z"
-
-# \u1e94 [LATIN CAPITAL LETTER Z WITH LINE BELOW]
-"\u1E94" => "Z"
-
-# \u24cf [CIRCLED LATIN CAPITAL LETTER Z]
-"\u24CF" => "Z"
-
-# \u2c6b [LATIN CAPITAL LETTER Z WITH DESCENDER]
-"\u2C6B" => "Z"
-
-# \ua762 [LATIN CAPITAL LETTER VISIGOTHIC Z]
-"\uA762" => "Z"
-
-# \uff3a [FULLWIDTH LATIN CAPITAL LETTER Z]
-"\uFF3A" => "Z"
-
-# \u017a [LATIN SMALL LETTER Z WITH ACUTE]
-"\u017A" => "z"
-
-# \u017c [LATIN SMALL LETTER Z WITH DOT ABOVE]
-"\u017C" => "z"
-
-# \u017e [LATIN SMALL LETTER Z WITH CARON]
-"\u017E" => "z"
-
-# \u01b6 [LATIN SMALL LETTER Z WITH STROKE]
-"\u01B6" => "z"
-
-# \u021d http://en.wikipedia.org/wiki/Yogh [LATIN SMALL LETTER YOGH]
-"\u021D" => "z"
-
-# \u0225 [LATIN SMALL LETTER Z WITH HOOK]
-"\u0225" => "z"
-
-# \u0240 [LATIN SMALL LETTER Z WITH SWASH TAIL]
-"\u0240" => "z"
-
-# \u0290 [LATIN SMALL LETTER Z WITH RETROFLEX HOOK]
-"\u0290" => "z"
-
-# \u0291 [LATIN SMALL LETTER Z WITH CURL]
-"\u0291" => "z"
-
-# \u1d76 [LATIN SMALL LETTER Z WITH MIDDLE TILDE]
-"\u1D76" => "z"
-
-# \u1d8e [LATIN SMALL LETTER Z WITH PALATAL HOOK]
-"\u1D8E" => "z"
-
-# \u1e91 [LATIN SMALL LETTER Z WITH CIRCUMFLEX]
-"\u1E91" => "z"
-
-# \u1e93 [LATIN SMALL LETTER Z WITH DOT BELOW]
-"\u1E93" => "z"
-
-# \u1e95 [LATIN SMALL LETTER Z WITH LINE BELOW]
-"\u1E95" => "z"
-
-# \u24e9 [CIRCLED LATIN SMALL LETTER Z]
-"\u24E9" => "z"
-
-# \u2c6c [LATIN SMALL LETTER Z WITH DESCENDER]
-"\u2C6C" => "z"
-
-# \ua763 [LATIN SMALL LETTER VISIGOTHIC Z]
-"\uA763" => "z"
-
-# \uff5a [FULLWIDTH LATIN SMALL LETTER Z]
-"\uFF5A" => "z"
-
-# \u24b5 [PARENTHESIZED LATIN SMALL LETTER Z]
-"\u24B5" => "(z)"
-
-# \u2070 [SUPERSCRIPT ZERO]
-"\u2070" => "0"
-
-# \u2080 [SUBSCRIPT ZERO]
-"\u2080" => "0"
-
-# \u24ea [CIRCLED DIGIT ZERO]
-"\u24EA" => "0"
-
-# \u24ff [NEGATIVE CIRCLED DIGIT ZERO]
-"\u24FF" => "0"
-
-# \uff10 [FULLWIDTH DIGIT ZERO]
-"\uFF10" => "0"
-
-# � [SUPERSCRIPT ONE]
-"\u00B9" => "1"
-
-# \u2081 [SUBSCRIPT ONE]
-"\u2081" => "1"
-
-# \u2460 [CIRCLED DIGIT ONE]
-"\u2460" => "1"
-
-# \u24f5 [DOUBLE CIRCLED DIGIT ONE]
-"\u24F5" => "1"
-
-# \u2776 [DINGBAT NEGATIVE CIRCLED DIGIT ONE]
-"\u2776" => "1"
-
-# \u2780 [DINGBAT CIRCLED SANS-SERIF DIGIT ONE]
-"\u2780" => "1"
-
-# \u278a [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT ONE]
-"\u278A" => "1"
-
-# \uff11 [FULLWIDTH DIGIT ONE]
-"\uFF11" => "1"
-
-# \u2488 [DIGIT ONE FULL STOP]
-"\u2488" => "1."
-
-# \u2474 [PARENTHESIZED DIGIT ONE]
-"\u2474" => "(1)"
-
-# � [SUPERSCRIPT TWO]
-"\u00B2" => "2"
-
-# \u2082 [SUBSCRIPT TWO]
-"\u2082" => "2"
-
-# \u2461 [CIRCLED DIGIT TWO]
-"\u2461" => "2"
-
-# \u24f6 [DOUBLE CIRCLED DIGIT TWO]
-"\u24F6" => "2"
-
-# \u2777 [DINGBAT NEGATIVE CIRCLED DIGIT TWO]
-"\u2777" => "2"
-
-# \u2781 [DINGBAT CIRCLED SANS-SERIF DIGIT TWO]
-"\u2781" => "2"
-
-# \u278b [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT TWO]
-"\u278B" => "2"
-
-# \uff12 [FULLWIDTH DIGIT TWO]
-"\uFF12" => "2"
-
-# \u2489 [DIGIT TWO FULL STOP]
-"\u2489" => "2."
-
-# \u2475 [PARENTHESIZED DIGIT TWO]
-"\u2475" => "(2)"
-
-# � [SUPERSCRIPT THREE]
-"\u00B3" => "3"
-
-# \u2083 [SUBSCRIPT THREE]
-"\u2083" => "3"
-
-# \u2462 [CIRCLED DIGIT THREE]
-"\u2462" => "3"
-
-# \u24f7 [DOUBLE CIRCLED DIGIT THREE]
-"\u24F7" => "3"
-
-# \u2778 [DINGBAT NEGATIVE CIRCLED DIGIT THREE]
-"\u2778" => "3"
-
-# \u2782 [DINGBAT CIRCLED SANS-SERIF DIGIT THREE]
-"\u2782" => "3"
-
-# \u278c [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT THREE]
-"\u278C" => "3"
-
-# \uff13 [FULLWIDTH DIGIT THREE]
-"\uFF13" => "3"
-
-# \u248a [DIGIT THREE FULL STOP]
-"\u248A" => "3."
-
-# \u2476 [PARENTHESIZED DIGIT THREE]
-"\u2476" => "(3)"
-
-# \u2074 [SUPERSCRIPT FOUR]
-"\u2074" => "4"
-
-# \u2084 [SUBSCRIPT FOUR]
-"\u2084" => "4"
-
-# \u2463 [CIRCLED DIGIT FOUR]
-"\u2463" => "4"
-
-# \u24f8 [DOUBLE CIRCLED DIGIT FOUR]
-"\u24F8" => "4"
-
-# \u2779 [DINGBAT NEGATIVE CIRCLED DIGIT FOUR]
-"\u2779" => "4"
-
-# \u2783 [DINGBAT CIRCLED SANS-SERIF DIGIT FOUR]
-"\u2783" => "4"
-
-# \u278d [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT FOUR]
-"\u278D" => "4"
-
-# \uff14 [FULLWIDTH DIGIT FOUR]
-"\uFF14" => "4"
-
-# \u248b [DIGIT FOUR FULL STOP]
-"\u248B" => "4."
-
-# \u2477 [PARENTHESIZED DIGIT FOUR]
-"\u2477" => "(4)"
-
-# \u2075 [SUPERSCRIPT FIVE]
-"\u2075" => "5"
-
-# \u2085 [SUBSCRIPT FIVE]
-"\u2085" => "5"
-
-# \u2464 [CIRCLED DIGIT FIVE]
-"\u2464" => "5"
-
-# \u24f9 [DOUBLE CIRCLED DIGIT FIVE]
-"\u24F9" => "5"
-
-# \u277a [DINGBAT NEGATIVE CIRCLED DIGIT FIVE]
-"\u277A" => "5"
-
-# \u2784 [DINGBAT CIRCLED SANS-SERIF DIGIT FIVE]
-"\u2784" => "5"
-
-# \u278e [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT FIVE]
-"\u278E" => "5"
-
-# \uff15 [FULLWIDTH DIGIT FIVE]
-"\uFF15" => "5"
-
-# \u248c [DIGIT FIVE FULL STOP]
-"\u248C" => "5."
-
-# \u2478 [PARENTHESIZED DIGIT FIVE]
-"\u2478" => "(5)"
-
-# \u2076 [SUPERSCRIPT SIX]
-"\u2076" => "6"
-
-# \u2086 [SUBSCRIPT SIX]
-"\u2086" => "6"
-
-# \u2465 [CIRCLED DIGIT SIX]
-"\u2465" => "6"
-
-# \u24fa [DOUBLE CIRCLED DIGIT SIX]
-"\u24FA" => "6"
-
-# \u277b [DINGBAT NEGATIVE CIRCLED DIGIT SIX]
-"\u277B" => "6"
-
-# \u2785 [DINGBAT CIRCLED SANS-SERIF DIGIT SIX]
-"\u2785" => "6"
-
-# \u278f [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT SIX]
-"\u278F" => "6"
-
-# \uff16 [FULLWIDTH DIGIT SIX]
-"\uFF16" => "6"
-
-# \u248d [DIGIT SIX FULL STOP]
-"\u248D" => "6."
-
-# \u2479 [PARENTHESIZED DIGIT SIX]
-"\u2479" => "(6)"
-
-# \u2077 [SUPERSCRIPT SEVEN]
-"\u2077" => "7"
-
-# \u2087 [SUBSCRIPT SEVEN]
-"\u2087" => "7"
-
-# \u2466 [CIRCLED DIGIT SEVEN]
-"\u2466" => "7"
-
-# \u24fb [DOUBLE CIRCLED DIGIT SEVEN]
-"\u24FB" => "7"
-
-# \u277c [DINGBAT NEGATIVE CIRCLED DIGIT SEVEN]
-"\u277C" => "7"
-
-# \u2786 [DINGBAT CIRCLED SANS-SERIF DIGIT SEVEN]
-"\u2786" => "7"
-
-# \u2790 [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT SEVEN]
-"\u2790" => "7"
-
-# \uff17 [FULLWIDTH DIGIT SEVEN]
-"\uFF17" => "7"
-
-# \u248e [DIGIT SEVEN FULL STOP]
-"\u248E" => "7."
-
-# \u247a [PARENTHESIZED DIGIT SEVEN]
-"\u247A" => "(7)"
-
-# \u2078 [SUPERSCRIPT EIGHT]
-"\u2078" => "8"
-
-# \u2088 [SUBSCRIPT EIGHT]
-"\u2088" => "8"
-
-# \u2467 [CIRCLED DIGIT EIGHT]
-"\u2467" => "8"
-
-# \u24fc [DOUBLE CIRCLED DIGIT EIGHT]
-"\u24FC" => "8"
-
-# \u277d [DINGBAT NEGATIVE CIRCLED DIGIT EIGHT]
-"\u277D" => "8"
-
-# \u2787 [DINGBAT CIRCLED SANS-SERIF DIGIT EIGHT]
-"\u2787" => "8"
-
-# \u2791 [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT EIGHT]
-"\u2791" => "8"
-
-# \uff18 [FULLWIDTH DIGIT EIGHT]
-"\uFF18" => "8"
-
-# \u248f [DIGIT EIGHT FULL STOP]
-"\u248F" => "8."
-
-# \u247b [PARENTHESIZED DIGIT EIGHT]
-"\u247B" => "(8)"
-
-# \u2079 [SUPERSCRIPT NINE]
-"\u2079" => "9"
-
-# \u2089 [SUBSCRIPT NINE]
-"\u2089" => "9"
-
-# \u2468 [CIRCLED DIGIT NINE]
-"\u2468" => "9"
-
-# \u24fd [DOUBLE CIRCLED DIGIT NINE]
-"\u24FD" => "9"
-
-# \u277e [DINGBAT NEGATIVE CIRCLED DIGIT NINE]
-"\u277E" => "9"
-
-# \u2788 [DINGBAT CIRCLED SANS-SERIF DIGIT NINE]
-"\u2788" => "9"
-
-# \u2792 [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT NINE]
-"\u2792" => "9"
-
-# \uff19 [FULLWIDTH DIGIT NINE]
-"\uFF19" => "9"
-
-# \u2490 [DIGIT NINE FULL STOP]
-"\u2490" => "9."
-
-# \u247c [PARENTHESIZED DIGIT NINE]
-"\u247C" => "(9)"
-
-# \u2469 [CIRCLED NUMBER TEN]
-"\u2469" => "10"
-
-# \u24fe [DOUBLE CIRCLED NUMBER TEN]
-"\u24FE" => "10"
-
-# \u277f [DINGBAT NEGATIVE CIRCLED NUMBER TEN]
-"\u277F" => "10"
-
-# \u2789 [DINGBAT CIRCLED SANS-SERIF NUMBER TEN]
-"\u2789" => "10"
-
-# \u2793 [DINGBAT NEGATIVE CIRCLED SANS-SERIF NUMBER TEN]
-"\u2793" => "10"
-
-# \u2491 [NUMBER TEN FULL STOP]
-"\u2491" => "10."
-
-# \u247d [PARENTHESIZED NUMBER TEN]
-"\u247D" => "(10)"
-
-# \u246a [CIRCLED NUMBER ELEVEN]
-"\u246A" => "11"
-
-# \u24eb [NEGATIVE CIRCLED NUMBER ELEVEN]
-"\u24EB" => "11"
-
-# \u2492 [NUMBER ELEVEN FULL STOP]
-"\u2492" => "11."
-
-# \u247e [PARENTHESIZED NUMBER ELEVEN]
-"\u247E" => "(11)"
-
-# \u246b [CIRCLED NUMBER TWELVE]
-"\u246B" => "12"
-
-# \u24ec [NEGATIVE CIRCLED NUMBER TWELVE]
-"\u24EC" => "12"
-
-# \u2493 [NUMBER TWELVE FULL STOP]
-"\u2493" => "12."
-
-# \u247f [PARENTHESIZED NUMBER TWELVE]
-"\u247F" => "(12)"
-
-# \u246c [CIRCLED NUMBER THIRTEEN]
-"\u246C" => "13"
-
-# \u24ed [NEGATIVE CIRCLED NUMBER THIRTEEN]
-"\u24ED" => "13"
-
-# \u2494 [NUMBER THIRTEEN FULL STOP]
-"\u2494" => "13."
-
-# \u2480 [PARENTHESIZED NUMBER THIRTEEN]
-"\u2480" => "(13)"
-
-# \u246d [CIRCLED NUMBER FOURTEEN]
-"\u246D" => "14"
-
-# \u24ee [NEGATIVE CIRCLED NUMBER FOURTEEN]
-"\u24EE" => "14"
-
-# \u2495 [NUMBER FOURTEEN FULL STOP]
-"\u2495" => "14."
-
-# \u2481 [PARENTHESIZED NUMBER FOURTEEN]
-"\u2481" => "(14)"
-
-# \u246e [CIRCLED NUMBER FIFTEEN]
-"\u246E" => "15"
-
-# \u24ef [NEGATIVE CIRCLED NUMBER FIFTEEN]
-"\u24EF" => "15"
-
-# \u2496 [NUMBER FIFTEEN FULL STOP]
-"\u2496" => "15."
-
-# \u2482 [PARENTHESIZED NUMBER FIFTEEN]
-"\u2482" => "(15)"
-
-# \u246f [CIRCLED NUMBER SIXTEEN]
-"\u246F" => "16"
-
-# \u24f0 [NEGATIVE CIRCLED NUMBER SIXTEEN]
-"\u24F0" => "16"
-
-# \u2497 [NUMBER SIXTEEN FULL STOP]
-"\u2497" => "16."
-
-# \u2483 [PARENTHESIZED NUMBER SIXTEEN]
-"\u2483" => "(16)"
-
-# \u2470 [CIRCLED NUMBER SEVENTEEN]
-"\u2470" => "17"
-
-# \u24f1 [NEGATIVE CIRCLED NUMBER SEVENTEEN]
-"\u24F1" => "17"
-
-# \u2498 [NUMBER SEVENTEEN FULL STOP]
-"\u2498" => "17."
-
-# \u2484 [PARENTHESIZED NUMBER SEVENTEEN]
-"\u2484" => "(17)"
-
-# \u2471 [CIRCLED NUMBER EIGHTEEN]
-"\u2471" => "18"
-
-# \u24f2 [NEGATIVE CIRCLED NUMBER EIGHTEEN]
-"\u24F2" => "18"
-
-# \u2499 [NUMBER EIGHTEEN FULL STOP]
-"\u2499" => "18."
-
-# \u2485 [PARENTHESIZED NUMBER EIGHTEEN]
-"\u2485" => "(18)"
-
-# \u2472 [CIRCLED NUMBER NINETEEN]
-"\u2472" => "19"
-
-# \u24f3 [NEGATIVE CIRCLED NUMBER NINETEEN]
-"\u24F3" => "19"
-
-# \u249a [NUMBER NINETEEN FULL STOP]
-"\u249A" => "19."
-
-# \u2486 [PARENTHESIZED NUMBER NINETEEN]
-"\u2486" => "(19)"
-
-# \u2473 [CIRCLED NUMBER TWENTY]
-"\u2473" => "20"
-
-# \u24f4 [NEGATIVE CIRCLED NUMBER TWENTY]
-"\u24F4" => "20"
-
-# \u249b [NUMBER TWENTY FULL STOP]
-"\u249B" => "20."
-
-# \u2487 [PARENTHESIZED NUMBER TWENTY]
-"\u2487" => "(20)"
-
-# � [LEFT-POINTING DOUBLE ANGLE QUOTATION MARK]
-"\u00AB" => "\""
-
-# � [RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK]
-"\u00BB" => "\""
-
-# \u201c [LEFT DOUBLE QUOTATION MARK]
-"\u201C" => "\""
-
-# \u201d [RIGHT DOUBLE QUOTATION MARK]
-"\u201D" => "\""
-
-# \u201e [DOUBLE LOW-9 QUOTATION MARK]
-"\u201E" => "\""
-
-# \u2033 [DOUBLE PRIME]
-"\u2033" => "\""
-
-# \u2036 [REVERSED DOUBLE PRIME]
-"\u2036" => "\""
-
-# \u275d [HEAVY DOUBLE TURNED COMMA QUOTATION MARK ORNAMENT]
-"\u275D" => "\""
-
-# \u275e [HEAVY DOUBLE COMMA QUOTATION MARK ORNAMENT]
-"\u275E" => "\""
-
-# \u276e [HEAVY LEFT-POINTING ANGLE QUOTATION MARK ORNAMENT]
-"\u276E" => "\""
-
-# \u276f [HEAVY RIGHT-POINTING ANGLE QUOTATION MARK ORNAMENT]
-"\u276F" => "\""
-
-# \uff02 [FULLWIDTH QUOTATION MARK]
-"\uFF02" => "\""
-
-# \u2018 [LEFT SINGLE QUOTATION MARK]
-"\u2018" => "\'"
-
-# \u2019 [RIGHT SINGLE QUOTATION MARK]
-"\u2019" => "\'"
-
-# \u201a [SINGLE LOW-9 QUOTATION MARK]
-"\u201A" => "\'"
-
-# \u201b [SINGLE HIGH-REVERSED-9 QUOTATION MARK]
-"\u201B" => "\'"
-
-# \u2032 [PRIME]
-"\u2032" => "\'"
-
-# \u2035 [REVERSED PRIME]
-"\u2035" => "\'"
-
-# \u2039 [SINGLE LEFT-POINTING ANGLE QUOTATION MARK]
-"\u2039" => "\'"
-
-# \u203a [SINGLE RIGHT-POINTING ANGLE QUOTATION MARK]
-"\u203A" => "\'"
-
-# \u275b [HEAVY SINGLE TURNED COMMA QUOTATION MARK ORNAMENT]
-"\u275B" => "\'"
-
-# \u275c [HEAVY SINGLE COMMA QUOTATION MARK ORNAMENT]
-"\u275C" => "\'"
-
-# \uff07 [FULLWIDTH APOSTROPHE]
-"\uFF07" => "\'"
-
-# \u2010 [HYPHEN]
-"\u2010" => "-"
-
-# \u2011 [NON-BREAKING HYPHEN]
-"\u2011" => "-"
-
-# \u2012 [FIGURE DASH]
-"\u2012" => "-"
-
-# \u2013 [EN DASH]
-"\u2013" => "-"
-
-# \u2014 [EM DASH]
-"\u2014" => "-"
-
-# \u207b [SUPERSCRIPT MINUS]
-"\u207B" => "-"
-
-# \u208b [SUBSCRIPT MINUS]
-"\u208B" => "-"
-
-# \uff0d [FULLWIDTH HYPHEN-MINUS]
-"\uFF0D" => "-"
-
-# \u2045 [LEFT SQUARE BRACKET WITH QUILL]
-"\u2045" => "["
-
-# \u2772 [LIGHT LEFT TORTOISE SHELL BRACKET ORNAMENT]
-"\u2772" => "["
-
-# \uff3b [FULLWIDTH LEFT SQUARE BRACKET]
-"\uFF3B" => "["
-
-# \u2046 [RIGHT SQUARE BRACKET WITH QUILL]
-"\u2046" => "]"
-
-# \u2773 [LIGHT RIGHT TORTOISE SHELL BRACKET ORNAMENT]
-"\u2773" => "]"
-
-# \uff3d [FULLWIDTH RIGHT SQUARE BRACKET]
-"\uFF3D" => "]"
-
-# \u207d [SUPERSCRIPT LEFT PARENTHESIS]
-"\u207D" => "("
-
-# \u208d [SUBSCRIPT LEFT PARENTHESIS]
-"\u208D" => "("
-
-# \u2768 [MEDIUM LEFT PARENTHESIS ORNAMENT]
-"\u2768" => "("
-
-# \u276a [MEDIUM FLATTENED LEFT PARENTHESIS ORNAMENT]
-"\u276A" => "("
-
-# \uff08 [FULLWIDTH LEFT PARENTHESIS]
-"\uFF08" => "("
-
-# \u2e28 [LEFT DOUBLE PARENTHESIS]
-"\u2E28" => "(("
-
-# \u207e [SUPERSCRIPT RIGHT PARENTHESIS]
-"\u207E" => ")"
-
-# \u208e [SUBSCRIPT RIGHT PARENTHESIS]
-"\u208E" => ")"
-
-# \u2769 [MEDIUM RIGHT PARENTHESIS ORNAMENT]
-"\u2769" => ")"
-
-# \u276b [MEDIUM FLATTENED RIGHT PARENTHESIS ORNAMENT]
-"\u276B" => ")"
-
-# \uff09 [FULLWIDTH RIGHT PARENTHESIS]
-"\uFF09" => ")"
-
-# \u2e29 [RIGHT DOUBLE PARENTHESIS]
-"\u2E29" => "))"
-
-# \u276c [MEDIUM LEFT-POINTING ANGLE BRACKET ORNAMENT]
-"\u276C" => "<"
-
-# \u2770 [HEAVY LEFT-POINTING ANGLE BRACKET ORNAMENT]
-"\u2770" => "<"
-
-# \uff1c [FULLWIDTH LESS-THAN SIGN]
-"\uFF1C" => "<"
-
-# \u276d [MEDIUM RIGHT-POINTING ANGLE BRACKET ORNAMENT]
-"\u276D" => ">"
-
-# \u2771 [HEAVY RIGHT-POINTING ANGLE BRACKET ORNAMENT]
-"\u2771" => ">"
-
-# \uff1e [FULLWIDTH GREATER-THAN SIGN]
-"\uFF1E" => ">"
-
-# \u2774 [MEDIUM LEFT CURLY BRACKET ORNAMENT]
-"\u2774" => "{"
-
-# \uff5b [FULLWIDTH LEFT CURLY BRACKET]
-"\uFF5B" => "{"
-
-# \u2775 [MEDIUM RIGHT CURLY BRACKET ORNAMENT]
-"\u2775" => "}"
-
-# \uff5d [FULLWIDTH RIGHT CURLY BRACKET]
-"\uFF5D" => "}"
-
-# \u207a [SUPERSCRIPT PLUS SIGN]
-"\u207A" => "+"
-
-# \u208a [SUBSCRIPT PLUS SIGN]
-"\u208A" => "+"
-
-# \uff0b [FULLWIDTH PLUS SIGN]
-"\uFF0B" => "+"
-
-# \u207c [SUPERSCRIPT EQUALS SIGN]
-"\u207C" => "="
-
-# \u208c [SUBSCRIPT EQUALS SIGN]
-"\u208C" => "="
-
-# \uff1d [FULLWIDTH EQUALS SIGN]
-"\uFF1D" => "="
-
-# \uff01 [FULLWIDTH EXCLAMATION MARK]
-"\uFF01" => "!"
-
-# \u203c [DOUBLE EXCLAMATION MARK]
-"\u203C" => "!!"
-
-# \u2049 [EXCLAMATION QUESTION MARK]
-"\u2049" => "!?"
-
-# \uff03 [FULLWIDTH NUMBER SIGN]
-"\uFF03" => "#"
-
-# \uff04 [FULLWIDTH DOLLAR SIGN]
-"\uFF04" => "$"
-
-# \u2052 [COMMERCIAL MINUS SIGN]
-"\u2052" => "%"
-
-# \uff05 [FULLWIDTH PERCENT SIGN]
-"\uFF05" => "%"
-
-# \uff06 [FULLWIDTH AMPERSAND]
-"\uFF06" => "&"
-
-# \u204e [LOW ASTERISK]
-"\u204E" => "*"
-
-# \uff0a [FULLWIDTH ASTERISK]
-"\uFF0A" => "*"
-
-# \uff0c [FULLWIDTH COMMA]
-"\uFF0C" => ","
-
-# \uff0e [FULLWIDTH FULL STOP]
-"\uFF0E" => "."
-
-# \u2044 [FRACTION SLASH]
-"\u2044" => "/"
-
-# \uff0f [FULLWIDTH SOLIDUS]
-"\uFF0F" => "/"
-
-# \uff1a [FULLWIDTH COLON]
-"\uFF1A" => ":"
-
-# \u204f [REVERSED SEMICOLON]
-"\u204F" => ";"
-
-# \uff1b [FULLWIDTH SEMICOLON]
-"\uFF1B" => ";"
-
-# \uff1f [FULLWIDTH QUESTION MARK]
-"\uFF1F" => "?"
-
-# \u2047 [DOUBLE QUESTION MARK]
-"\u2047" => "??"
-
-# \u2048 [QUESTION EXCLAMATION MARK]
-"\u2048" => "?!"
-
-# \uff20 [FULLWIDTH COMMERCIAL AT]
-"\uFF20" => "@"
-
-# \uff3c [FULLWIDTH REVERSE SOLIDUS]
-"\uFF3C" => "\\"
-
-# \u2038 [CARET]
-"\u2038" => "^"
-
-# \uff3e [FULLWIDTH CIRCUMFLEX ACCENT]
-"\uFF3E" => "^"
-
-# \uff3f [FULLWIDTH LOW LINE]
-"\uFF3F" => "_"
-
-# \u2053 [SWUNG DASH]
-"\u2053" => "~"
-
-# \uff5e [FULLWIDTH TILDE]
-"\uFF5E" => "~"
-
-################################################################
-# Below is the Perl script used to generate the above mappings #
-# from ASCIIFoldingFilter.java: #
-################################################################
-#
-# #!/usr/bin/perl
-#
-# use warnings;
-# use strict;
-#
-# my @source_chars = ();
-# my @source_char_descriptions = ();
-# my $target = '';
-#
-# while (<>) {
-# if (/case\s+'(\\u[A-F0-9]+)':\s*\/\/\s*(.*)/i) {
-# push @source_chars, $1;
-# push @source_char_descriptions, $2;
-# next;
-# }
-# if (/output\[[^\]]+\]\s*=\s*'(\\'|\\\\|.)'/) {
-# $target .= $1;
-# next;
-# }
-# if (/break;/) {
-# $target = "\\\"" if ($target eq '"');
-# for my $source_char_num (0..$#source_chars) {
-# print "# $source_char_descriptions[$source_char_num]\n";
-# print "\"$source_chars[$source_char_num]\" => \"$target\"\n\n";
-# }
-# @source_chars = ();
-# @source_char_descriptions = ();
-# $target = '';
-# }
-# }
http://git-wip-us.apache.org/repos/asf/lucene-solr/blob/580f6e98/solr/example/example-DIH/solr/rss/conf/mapping-ISOLatin1Accent.txt
----------------------------------------------------------------------
diff --git a/solr/example/example-DIH/solr/rss/conf/mapping-ISOLatin1Accent.txt b/solr/example/example-DIH/solr/rss/conf/mapping-ISOLatin1Accent.txt
deleted file mode 100644
index ede7742..0000000
--- a/solr/example/example-DIH/solr/rss/conf/mapping-ISOLatin1Accent.txt
+++ /dev/null
@@ -1,246 +0,0 @@
-# The ASF licenses this file to You under the Apache License, Version 2.0
-# (the "License"); you may not use this file except in compliance with
-# the License. You may obtain a copy of the License at
-#
-# http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-# Syntax:
-# "source" => "target"
-# "source".length() > 0 (source cannot be empty.)
-# "target".length() >= 0 (target can be empty.)
-
-# example:
-# "�" => "A"
-# "\u00C0" => "A"
-# "\u00C0" => "\u0041"
-# "�" => "ss"
-# "\t" => " "
-# "\n" => ""
-
-# � => A
-"\u00C0" => "A"
-
-# � => A
-"\u00C1" => "A"
-
-# � => A
-"\u00C2" => "A"
-
-# � => A
-"\u00C3" => "A"
-
-# � => A
-"\u00C4" => "A"
-
-# � => A
-"\u00C5" => "A"
-
-# � => AE
-"\u00C6" => "AE"
-
-# � => C
-"\u00C7" => "C"
-
-# � => E
-"\u00C8" => "E"
-
-# � => E
-"\u00C9" => "E"
-
-# � => E
-"\u00CA" => "E"
-
-# � => E
-"\u00CB" => "E"
-
-# � => I
-"\u00CC" => "I"
-
-# � => I
-"\u00CD" => "I"
-
-# � => I
-"\u00CE" => "I"
-
-# � => I
-"\u00CF" => "I"
-
-# \u0132 => IJ
-"\u0132" => "IJ"
-
-# � => D
-"\u00D0" => "D"
-
-# � => N
-"\u00D1" => "N"
-
-# � => O
-"\u00D2" => "O"
-
-# � => O
-"\u00D3" => "O"
-
-# � => O
-"\u00D4" => "O"
-
-# � => O
-"\u00D5" => "O"
-
-# � => O
-"\u00D6" => "O"
-
-# � => O
-"\u00D8" => "O"
-
-# \u0152 => OE
-"\u0152" => "OE"
-
-# �
-"\u00DE" => "TH"
-
-# � => U
-"\u00D9" => "U"
-
-# � => U
-"\u00DA" => "U"
-
-# � => U
-"\u00DB" => "U"
-
-# � => U
-"\u00DC" => "U"
-
-# � => Y
-"\u00DD" => "Y"
-
-# \u0178 => Y
-"\u0178" => "Y"
-
-# � => a
-"\u00E0" => "a"
-
-# � => a
-"\u00E1" => "a"
-
-# � => a
-"\u00E2" => "a"
-
-# � => a
-"\u00E3" => "a"
-
-# � => a
-"\u00E4" => "a"
-
-# � => a
-"\u00E5" => "a"
-
-# � => ae
-"\u00E6" => "ae"
-
-# � => c
-"\u00E7" => "c"
-
-# � => e
-"\u00E8" => "e"
-
-# � => e
-"\u00E9" => "e"
-
-# � => e
-"\u00EA" => "e"
-
-# � => e
-"\u00EB" => "e"
-
-# � => i
-"\u00EC" => "i"
-
-# � => i
-"\u00ED" => "i"
-
-# � => i
-"\u00EE" => "i"
-
-# � => i
-"\u00EF" => "i"
-
-# \u0133 => ij
-"\u0133" => "ij"
-
-# � => d
-"\u00F0" => "d"
-
-# � => n
-"\u00F1" => "n"
-
-# � => o
-"\u00F2" => "o"
-
-# � => o
-"\u00F3" => "o"
-
-# � => o
-"\u00F4" => "o"
-
-# � => o
-"\u00F5" => "o"
-
-# � => o
-"\u00F6" => "o"
-
-# � => o
-"\u00F8" => "o"
-
-# \u0153 => oe
-"\u0153" => "oe"
-
-# � => ss
-"\u00DF" => "ss"
-
-# � => th
-"\u00FE" => "th"
-
-# � => u
-"\u00F9" => "u"
-
-# � => u
-"\u00FA" => "u"
-
-# � => u
-"\u00FB" => "u"
-
-# � => u
-"\u00FC" => "u"
-
-# � => y
-"\u00FD" => "y"
-
-# � => y
-"\u00FF" => "y"
-
-# \ufb00 => ff
-"\uFB00" => "ff"
-
-# \ufb01 => fi
-"\uFB01" => "fi"
-
-# \ufb02 => fl
-"\uFB02" => "fl"
-
-# \ufb03 => ffi
-"\uFB03" => "ffi"
-
-# \ufb04 => ffl
-"\uFB04" => "ffl"
-
-# \ufb05 => ft
-"\uFB05" => "ft"
-
-# \ufb06 => st
-"\uFB06" => "st"
http://git-wip-us.apache.org/repos/asf/lucene-solr/blob/580f6e98/solr/example/example-DIH/solr/rss/conf/protwords.txt
----------------------------------------------------------------------
diff --git a/solr/example/example-DIH/solr/rss/conf/protwords.txt b/solr/example/example-DIH/solr/rss/conf/protwords.txt
deleted file mode 100644
index 1dfc0ab..0000000
--- a/solr/example/example-DIH/solr/rss/conf/protwords.txt
+++ /dev/null
@@ -1,21 +0,0 @@
-# The ASF licenses this file to You under the Apache License, Version 2.0
-# (the "License"); you may not use this file except in compliance with
-# the License. You may obtain a copy of the License at
-#
-# http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-#-----------------------------------------------------------------------
-# Use a protected word file to protect against the stemmer reducing two
-# unrelated words to the same base word.
-
-# Some non-words that normally won't be encountered,
-# just to test that they won't be stemmed.
-dontstems
-zwhacky
-
http://git-wip-us.apache.org/repos/asf/lucene-solr/blob/580f6e98/solr/example/example-DIH/solr/rss/conf/rss-data-config.xml
----------------------------------------------------------------------
diff --git a/solr/example/example-DIH/solr/rss/conf/rss-data-config.xml b/solr/example/example-DIH/solr/rss/conf/rss-data-config.xml
deleted file mode 100644
index 704325b..0000000
--- a/solr/example/example-DIH/solr/rss/conf/rss-data-config.xml
+++ /dev/null
@@ -1,26 +0,0 @@
-<dataConfig>
- <dataSource type="URLDataSource" />
- <document>
- <entity name="slashdot"
- pk="link"
- url="http://rss.slashdot.org/Slashdot/slashdot"
- processor="XPathEntityProcessor"
- forEach="/rss/channel/item"
- transformer="DateFormatTransformer">
-
- <field column="source" xpath="/rss/channel/title" commonField="true" />
- <field column="source-link" xpath="/rss/channel/link" commonField="true" />
- <field column="subject" xpath="/rss/channel/subject" commonField="true" />
-
- <field column="title" xpath="/rss/channel/item/title" />
- <field column="link" xpath="/rss/channel/item/link" />
- <field column="description" xpath="/rss/channel/item/description" />
- <field column="creator" xpath="/rss/channel/item/creator" />
- <field column="item-subject" xpath="/rss/channel/item/subject" />
- <field column="date" xpath="/rss/channel/item/date" dateTimeFormat="yyyy-MM-dd'T'HH:mm:ss" />
- <field column="slash-department" xpath="/rss/channel/item/department" />
- <field column="slash-section" xpath="/rss/channel/item/section" />
- <field column="slash-comments" xpath="/rss/channel/item/comments" />
- </entity>
- </document>
-</dataConfig>