# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# This map converts alphabetic, numeric, and symbolic Unicode characters
# which are not in the first 128 ASCII characters (the "Basic Latin" Unicode
# block) into their ASCII equivalents, if one exists.
#
# Characters from the following Unicode blocks are converted; however, only
# those characters with reasonable ASCII alternatives are converted:
#
# - C1 Controls and Latin-1 Supplement: http://www.unicode.org/charts/PDF/U0080.pdf
# - Latin Extended-A: http://www.unicode.org/charts/PDF/U0100.pdf
# - Latin Extended-B: http://www.unicode.org/charts/PDF/U0180.pdf
# - Latin Extended Additional: http://www.unicode.org/charts/PDF/U1E00.pdf
# - Latin Extended-C: http://www.unicode.org/charts/PDF/U2C60.pdf
# - Latin Extended-D: http://www.unicode.org/charts/PDF/UA720.pdf
# - IPA Extensions: http://www.unicode.org/charts/PDF/U0250.pdf
# - Phonetic Extensions: http://www.unicode.org/charts/PDF/U1D00.pdf
# - Phonetic Extensions Supplement: http://www.unicode.org/charts/PDF/U1D80.pdf
# - General Punctuation: http://www.unicode.org/charts/PDF/U2000.pdf
# - Superscripts and Subscripts: http://www.unicode.org/charts/PDF/U2070.pdf
# - Enclosed Alphanumerics: http://www.unicode.org/charts/PDF/U2460.pdf
# - Dingbats: http://www.unicode.org/charts/PDF/U2700.pdf
# - Supplemental Punctuation: http://www.unicode.org/charts/PDF/U2E00.pdf
# - Alphabetic Presentation Forms: http://www.unicode.org/charts/PDF/UFB00.pdf
# - Halfwidth and Fullwidth Forms: http://www.unicode.org/charts/PDF/UFF00.pdf
#
# See: http://en.wikipedia.org/wiki/Latin_characters_in_Unicode
#
# The set of character conversions supported by this map is a superset of
# those supported by the map represented by mapping-ISOLatin1Accent.txt.
#
# See the bottom of this file for the Perl script used to generate the contents
# of this file (without this header) from ASCIIFoldingFilter.java.
# Syntax:
# "source" => "target"
# "source".length() > 0 (source cannot be empty.)
# "target".length() >= 0 (target can be empty.)
# À [LATIN CAPITAL LETTER A WITH GRAVE]
"\u00C0" => "A"
# Á [LATIN CAPITAL LETTER A WITH ACUTE]
"\u00C1" => "A"
# Â [LATIN CAPITAL LETTER A WITH CIRCUMFLEX]
"\u00C2" => "A"
# Ã [LATIN CAPITAL LETTER A WITH TILDE]
"\u00C3" => "A"
# Ä [LATIN CAPITAL LETTER A WITH DIAERESIS]
"\u00C4" => "A"
# Å [LATIN CAPITAL LETTER A WITH RING ABOVE]
"\u00C5" => "A"
# Ā [LATIN CAPITAL LETTER A WITH MACRON]
"\u0100" => "A"
# Ă [LATIN CAPITAL LETTER A WITH BREVE]
"\u0102" => "A"
# Ą [LATIN CAPITAL LETTER A WITH OGONEK]
"\u0104" => "A"
# Ə http://en.wikipedia.org/wiki/Schwa [LATIN CAPITAL LETTER SCHWA]
"\u018F" => "A"
# Ǎ [LATIN CAPITAL LETTER A WITH CARON]
"\u01CD" => "A"
# Ǟ [LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON]
"\u01DE" => "A"
# Ǡ [LATIN CAPITAL LETTER A WITH DOT ABOVE AND MACRON]
"\u01E0" => "A"
# Ǻ [LATIN CAPITAL LETTER A WITH RING ABOVE AND ACUTE]
"\u01FA" => "A"
# Ȁ [LATIN CAPITAL LETTER A WITH DOUBLE GRAVE]
"\u0200" => "A"
# Ȃ [LATIN CAPITAL LETTER A WITH INVERTED BREVE]
"\u0202" => "A"
# Ȧ [LATIN CAPITAL LETTER A WITH DOT ABOVE]
"\u0226" => "A"
# Ⱥ [LATIN CAPITAL LETTER A WITH STROKE]
"\u023A" => "A"
# ᴀ [LATIN LETTER SMALL CAPITAL A]
"\u1D00" => "A"
# Ḁ [LATIN CAPITAL LETTER A WITH RING BELOW]
"\u1E00" => "A"
# Ạ [LATIN CAPITAL LETTER A WITH DOT BELOW]
"\u1EA0" => "A"
# Ả [LATIN CAPITAL LETTER A WITH HOOK ABOVE]
"\u1EA2" => "A"
# Ấ [LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND ACUTE]
"\u1EA4" => "A"
# Ầ [LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND GRAVE]
"\u1EA6" => "A"
# Ẩ [LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND HOOK ABOVE]
"\u1EA8" => "A"
# Ẫ [LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND TILDE]
"\u1EAA" => "A"
# Ậ [LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND DOT BELOW]
"\u1EAC" => "A"
# Ắ [LATIN CAPITAL LETTER A WITH BREVE AND ACUTE]
"\u1EAE" => "A"
# Ằ [LATIN CAPITAL LETTER A WITH BREVE AND GRAVE]
"\u1EB0" => "A"
# Ẳ [LATIN CAPITAL LETTER A WITH BREVE AND HOOK ABOVE]
"\u1EB2" => "A"
# Ẵ [LATIN CAPITAL LETTER A WITH BREVE AND TILDE]
"\u1EB4" => "A"
# Ặ [LATIN CAPITAL LETTER A WITH BREVE AND DOT BELOW]
"\u1EB6" => "A"
# Ⓐ [CIRCLED LATIN CAPITAL LETTER A]
"\u24B6" => "A"
# Ａ [FULLWIDTH LATIN CAPITAL LETTER A]
"\uFF21" => "A"
# à [LATIN SMALL LETTER A WITH GRAVE]
"\u00E0" => "a"
# á [LATIN SMALL LETTER A WITH ACUTE]
"\u00E1" => "a"
# â [LATIN SMALL LETTER A WITH CIRCUMFLEX]
"\u00E2" => "a"
# ã [LATIN SMALL LETTER A WITH TILDE]
"\u00E3" => "a"
# ä [LATIN SMALL LETTER A WITH DIAERESIS]
"\u00E4" => "a"
# å [LATIN SMALL LETTER A WITH RING ABOVE]
"\u00E5" => "a"
# ā [LATIN SMALL LETTER A WITH MACRON]
"\u0101" => "a"
# ă [LATIN SMALL LETTER A WITH BREVE]
"\u0103" => "a"
# ą [LATIN SMALL LETTER A WITH OGONEK]
"\u0105" => "a"
# ǎ [LATIN SMALL LETTER A WITH CARON]
"\u01CE" => "a"
# ǟ [LATIN SMALL LETTER A WITH DIAERESIS AND MACRON]
"\u01DF" => "a"
# ǡ [LATIN SMALL LETTER A WITH DOT ABOVE AND MACRON]
"\u01E1" => "a"
# ǻ [LATIN SMALL LETTER A WITH RING ABOVE AND ACUTE]
"\u01FB" => "a"
# ȁ [LATIN SMALL LETTER A WITH DOUBLE GRAVE]
"\u0201" => "a"
# ȃ [LATIN SMALL LETTER A WITH INVERTED BREVE]
"\u0203" => "a"
# ȧ [LATIN SMALL LETTER A WITH DOT ABOVE]
"\u0227" => "a"
# ɐ [LATIN SMALL LETTER TURNED A]
"\u0250" => "a"
# ə [LATIN SMALL LETTER SCHWA]
"\u0259" => "a"
# ɚ [LATIN SMALL LETTER SCHWA WITH HOOK]
"\u025A" => "a"
# ᶏ [LATIN SMALL LETTER A WITH RETROFLEX HOOK]
"\u1D8F" => "a"
# ᶕ [LATIN SMALL LETTER SCHWA WITH RETROFLEX HOOK]
"\u1D95" => "a"
# ḁ [LATIN SMALL LETTER A WITH RING BELOW]
"\u1E01" => "a"
# ẚ [LATIN SMALL LETTER A WITH RIGHT HALF RING]
"\u1E9A" => "a"
# ạ [LATIN SMALL LETTER A WITH DOT BELOW]
"\u1EA1" => "a"
# ả [LATIN SMALL LETTER A WITH HOOK ABOVE]
"\u1EA3" => "a"
# ấ [LATIN SMALL LETTER A WITH CIRCUMFLEX AND ACUTE]
"\u1EA5" => "a"
# ầ [LATIN SMALL LETTER A WITH CIRCUMFLEX AND GRAVE]
"\u1EA7" => "a"
# ẩ [LATIN SMALL LETTER A WITH CIRCUMFLEX AND HOOK ABOVE]
"\u1EA9" => "a"
# ẫ [LATIN SMALL LETTER A WITH CIRCUMFLEX AND TILDE]
"\u1EAB" => "a"
# ậ [LATIN SMALL LETTER A WITH CIRCUMFLEX AND DOT BELOW]
"\u1EAD" => "a"
# ắ [LATIN SMALL LETTER A WITH BREVE AND ACUTE]
"\u1EAF" => "a"
# ằ [LATIN SMALL LETTER A WITH BREVE AND GRAVE]
"\u1EB1" => "a"
# ẳ [LATIN SMALL LETTER A WITH BREVE AND HOOK ABOVE]
"\u1EB3" => "a"
# ẵ [LATIN SMALL LETTER A WITH BREVE AND TILDE]
"\u1EB5" => "a"
# ặ [LATIN SMALL LETTER A WITH BREVE AND DOT BELOW]
"\u1EB7" => "a"
# ₐ [LATIN SUBSCRIPT SMALL LETTER A]
"\u2090" => "a"
# ₔ [LATIN SUBSCRIPT SMALL LETTER SCHWA]
"\u2094" => "a"
# ⓐ [CIRCLED LATIN SMALL LETTER A]
"\u24D0" => "a"
# ⱥ [LATIN SMALL LETTER A WITH STROKE]
"\u2C65" => "a"
# Ɐ [LATIN CAPITAL LETTER TURNED A]
"\u2C6F" => "a"
# ａ [FULLWIDTH LATIN SMALL LETTER A]
"\uFF41" => "a"
# Ꜳ [LATIN CAPITAL LETTER AA]
"\uA732" => "AA"
# Æ [LATIN CAPITAL LETTER AE]
"\u00C6" => "AE"
# Ǣ [LATIN CAPITAL LETTER AE WITH MACRON]
"\u01E2" => "AE"
# Ǽ [LATIN CAPITAL LETTER AE WITH ACUTE]
"\u01FC" => "AE"
# ᴁ [LATIN LETTER SMALL CAPITAL AE]
没有合适的资源?快使用搜索试试~ 我知道了~
资源推荐
资源详情
资源评论
收起资源包目录
conf_parsed.rar (11个子文件)
conf
spellings.txt 16B
solrconfig_parsing.xml 8KB
schema.xml 2KB
protwords.txt 894B
mapping-FoldToASCII.txt 80KB
stopwords.txt 1KB
schema_parsing.xml 4KB
scripts.conf 921B
solrconfig.xml 4KB
synonyms.txt 1KB
mapping-ISOLatin1Accent.txt 3KB
共 11 条
- 1
2哥的成长记录
- 粉丝: 28
- 资源: 53
上传资源 快速赚钱
- 我的内容管理 展开
- 我的资源 快来上传第一个资源
- 我的收益 登录查看自己的收益
- 我的积分 登录查看自己的积分
- 我的C币 登录后查看C币余额
- 我的收藏
- 我的下载
- 下载帮助
安全验证
文档复制为VIP权益,开通VIP直接复制
信息提交成功
- 1
- 2
前往页