X-Git-Url: https://git.mdrn.pl/pylucene.git/blobdiff_plain/a2e61f0c04805cfcb8706176758d1283c7e3a55c..aaeed5504b982cf3545252ab528713250aa33eed:/lucene-java-3.5.0/lucene/contrib/icu/src/data/utr30/BasicFoldings.txt diff --git a/lucene-java-3.5.0/lucene/contrib/icu/src/data/utr30/BasicFoldings.txt b/lucene-java-3.5.0/lucene/contrib/icu/src/data/utr30/BasicFoldings.txt new file mode 100644 index 0000000..6045b5f --- /dev/null +++ b/lucene-java-3.5.0/lucene/contrib/icu/src/data/utr30/BasicFoldings.txt @@ -0,0 +1,111 @@ +# Copyright 2001-2010 Unicode, Inc. +# +# Disclaimer +# +# This source code is provided as is by Unicode, Inc. No claims are +# made as to fitness for any particular purpose. No warranties of any +# kind are expressed or implied. The recipient agrees to determine +# applicability of information provided. If this file has been +# purchased on magnetic or optical media from Unicode, Inc., the +# sole remedy for any claim will be exchange of defective media +# within 90 days of receipt. +# +# Limitations on Rights to Redistribute This Code +# +# Unicode, Inc. hereby grants the right to freely use the information +# supplied in this file in the creation of products supporting the +# Unicode Standard, and to make copies of this file in any form +# for internal or external distribution as long as this notice +# remains attached. 
+
+### Custom Normalization mappings for UTR#30
+### (http://www.unicode.org/reports/tr30/tr30-4.html)
+###
+### Created from Unicode 5.2 UCD
+###
+
+## Accent removal
+# See DiacriticFolding.txt
+## Case Folding (done by cf)
+## Canonical Duplicates Folding (done by cd)
+## Dashes folding
+# [[:Dash:][:Pd:]]-2053(swung dash) > U+002D
+058A>002D
+05BE>002D
+1400>002D
+1806>002D
+2010..2015>002D
+2E17>002D
+2E1A>002D
+301C>002D
+3030>002D
+30A0>002D
+#2053>002D
+2212>002D
+# FE31,FE32,FE58,FE63,FF0D done by kd
+
+## Greek letterforms folding (done by kd)
+## Hebrew alternates folding (done by kd)
+## Jamo folding (done by kd)
+## Math symbol folding (done by kd)
+## Native digit folding
+# See NativeDigitFolding.txt
+## Nobreak folding (done by kd)
+## Overline Folding
+FE49..FE4C>203E
+## Positional forms folding (done by kd)
+## Small forms folding (done by kd)
+## Space Folding
+# [:Zs:] > U+0020
+1680>0020
+180E>0020
+# 00A0, 2000..200A,202F,205F,3000 done by kd
+## Spacing Accents folding (done by kd)
+## Subscript folding (done by kd)
+## Symbol folding (done by kd)
+## Underline Folding (low-line variants > U+005F LOW LINE; U+005E is the circumflex, used only for the caret below)
+2017>005F
+FE4D..FE4F>005F
+## Diacritic Folding
+#
+
+## Vertical forms folding (done by kd)
+## Han Radical Folding
+# See HanRadicalFolding.txt
+## Letter Form Folding (done by kd)
+## Superscript folding
+# Additions to kd:
+02C0>0294
+02C1>0295
+06E5>0648
+06E6>064A
+## Suzhou Numeral Folding
+# Additions to kd:
+3021>4E00
+3022>4E8C
+3023>4E09
+3024>56DB
+3025>4E94
+3026>516D
+3027>4E03
+3028>516B
+3029>4E5D
+## Width Folding (done by kd)
+# Punctuation Folding
+00AB>0022
+00BB>0022
+201C..201E>0022
+2018..201B>0027
+2032>0027
+2035>0027
+2039..203A>0027
+2045>005B
+2046>005D
+2E28>0028 0028
+2E29>0029 0029
+2052>0025
+204E>002A
+2044>002F
+204F>003B
+2038>005E
+2053>007E