Index: solr/contrib/extraction/lib/icu4j-4_6.jar =================================================================== Cannot display: file marked as a binary type. svn:mime-type = application/octet-stream Property changes on: solr\contrib\extraction\lib\icu4j-4_6.jar ___________________________________________________________________ Added: svn:mime-type + application/octet-stream Index: solr/contrib/extraction/lib/icu4j-4_4_2.jar =================================================================== Cannot display: file marked as a binary type. svn:mime-type = application/octet-stream Index: solr/contrib/analysis-extras/lib/icu4j-4_6.jar =================================================================== Cannot display: file marked as a binary type. svn:mime-type = application/octet-stream Property changes on: solr\contrib\analysis-extras\lib\icu4j-4_6.jar ___________________________________________________________________ Added: svn:mime-type + application/octet-stream Index: solr/contrib/analysis-extras/lib/icu4j-4_4_2.jar =================================================================== Cannot display: file marked as a binary type. svn:mime-type = application/octet-stream Index: modules/analysis/icu/lib/icu4j-4_6.jar =================================================================== Cannot display: file marked as a binary type. svn:mime-type = application/octet-stream Property changes on: modules\analysis\icu\lib\icu4j-4_6.jar ___________________________________________________________________ Added: svn:mime-type + application/octet-stream Index: modules/analysis/icu/lib/icu4j-4_4_2.jar =================================================================== Cannot display: file marked as a binary type. svn:mime-type = application/octet-stream Index: modules/analysis/icu/src/test/org/apache/lucene/collation/TestICUCollationKeyAnalyzer.java =================================================================== --- modules/analysis/icu/src/test/org/apache/lucene/collation/TestICUCollationKeyAnalyzer.java (revision 1042050) +++ modules/analysis/icu/src/test/org/apache/lucene/collation/TestICUCollationKeyAnalyzer.java (working copy) @@ -73,6 +73,7 @@ // The ICU Collator and java.text.Collator implementations differ in their // orderings - "BFJHD" is the ordering for the ICU Collator for Locale.US. testCollationKeySort - (usAnalyzer, franceAnalyzer, swedenAnalyzer, denmarkAnalyzer, "BFJHD"); + (usAnalyzer, franceAnalyzer, swedenAnalyzer, denmarkAnalyzer, + "BFJHD", "ECAGI", "BJDFH", "BJDHF"); } } Index: modules/analysis/icu/src/test/org/apache/lucene/collation/TestICUCollationKeyFilter.java =================================================================== --- modules/analysis/icu/src/test/org/apache/lucene/collation/TestICUCollationKeyFilter.java (revision 1042050) +++ modules/analysis/icu/src/test/org/apache/lucene/collation/TestICUCollationKeyFilter.java (working copy) @@ -91,6 +91,7 @@ // The ICU Collator and java.text.Collator implementations differ in their // orderings - "BFJHD" is the ordering for the ICU Collator for Locale.US. testCollationKeySort - (usAnalyzer, franceAnalyzer, swedenAnalyzer, denmarkAnalyzer, "BFJHD"); + (usAnalyzer, franceAnalyzer, swedenAnalyzer, denmarkAnalyzer, + "BFJHD", "ECAGI", "BJDFH", "BJDHF"); } } Index: modules/analysis/icu/src/java/overview.html =================================================================== --- modules/analysis/icu/src/java/overview.html (revision 1042050) +++ modules/analysis/icu/src/java/overview.html (working copy) @@ -358,7 +358,7 @@
This module exists to provide up-to-date Unicode functionality that supports
-the most recent version of Unicode (currently 5.2). However, some users who wish
+the most recent version of Unicode (currently 6.0). However, some users who wish
for stronger backwards compatibility can restrict
{@link org.apache.lucene.analysis.icu.ICUNormalizer2Filter} to operate on only
a specific Unicode Version by using a {@link com.ibm.icu.text.FilteredNormalizer2}.
Index: modules/analysis/icu/src/data/utr30/nfkc.txt
===================================================================
--- modules/analysis/icu/src/data/utr30/nfkc.txt (revision 1042050)
+++ modules/analysis/icu/src/data/utr30/nfkc.txt (working copy)
@@ -26,7 +26,7 @@
#
# file name: nfkc.txt
#
-# machine-generated on: 2009-11-30
+# machine-generated on: 2010-07-23
#
# Round-trip mappings (=) containing [:Diacritic:] (see DiacriticFolding.txt)
# were changed to one-way decompositions, as their non-starters now decompose.
@@ -114,6 +114,7 @@
0657..065B:230
065C:220
065D..065E:230
+065F:220
0670:35
06D6..06DC:230
06DF..06E2:230
@@ -150,6 +151,7 @@
081B..0823:230
0825..0827:230
0829..082D:230
+0859..085B:220
093C:7
094D:9
0951:230
@@ -192,7 +194,7 @@
1037:7
1039..103A:9
108D:220
-135F:230
+135D..135F:230
1714:9
1734:9
17D2:9
@@ -212,6 +214,8 @@
1B6C:220
1B6D..1B73:230
1BAA:9
+1BE6:7
+1BF2..1BF3:9
1C37:7
1CD0..1CD2:230
1CD4:1
@@ -231,6 +235,7 @@
1DCF:220
1DD0:202
1DD1..1DE6:230
+1DFC:233
1DFD:220
1DFE:230
1DFF:220
@@ -248,6 +253,7 @@
20EC..20EF:220
20F0:230
2CEF..2CF1:230
+2D7F:9
2DE0..2DFF:230
302A:218
302B:228
@@ -281,6 +287,7 @@
10A39:1
10A3A:220
10A3F:9
+11046:9
110B9:9
110BA:7
1D165..1D166:216
@@ -1426,6 +1433,14 @@
2092>006F
2093>0078
2094>0259
+2095>0068
+2096>006B
+2097>006C
+2098>006D
+2099>006E
+209A>0070
+209B>0073
+209C>0074
20A8>0052 0073
2100>0061 002F 0063
2101>0061 002F 0073
@@ -5213,18 +5228,42 @@
1F12C>0052
1F12D>0043 0044
1F12E>0057 005A
+1F130>0041
1F131>0042
+1F132>0043
+1F133>0044
+1F134>0045
+1F135>0046
+1F136>0047
+1F137>0048
+1F138>0049
+1F139>004A
+1F13A>004B
+1F13B>004C
+1F13C>004D
1F13D>004E
+1F13E>004F
1F13F>0050
+1F140>0051
+1F141>0052
1F142>0053
+1F143>0054
+1F144>0055
+1F145>0056
1F146>0057
+1F147>0058
+1F148>0059
+1F149>005A
1F14A>0048 0056
1F14B>004D 0056
1F14C>0053 0044
1F14D>0053 0053
1F14E>0050 0050 0056
+1F14F>0057 0043
1F190>0044 004A
1F200>307B 304B
+1F201>30B3 30B3
+1F202>30B5
1F210>624B
1F211>5B57
1F212>53CC
@@ -5259,6 +5298,15 @@
1F22F>6307
1F230>8D70
1F231>6253
+1F232>7981
+1F233>7A7A
+1F234>5408
+1F235>6E80
+1F236>6709
+1F237>6708
+1F238>7533
+1F239>5272
+1F23A>55B6
1F240>3014 672C 3015
1F241>3014 4E09 3015
1F242>3014 4E8C 3015
@@ -5268,6 +5316,8 @@
1F246>3014 76D7 3015
1F247>3014 52DD 3015
1F248>3014 6557 3015
+1F250>5F97
+1F251>53EF
2F800>4E3D
2F801>4E38
2F802>4E41
Index: modules/analysis/icu/src/data/utr30/nfkc_cf.txt
===================================================================
--- modules/analysis/icu/src/data/utr30/nfkc_cf.txt (revision 1042050)
+++ modules/analysis/icu/src/data/utr30/nfkc_cf.txt (working copy)
@@ -19,11 +19,11 @@
# remains attached.
#
# Extracted from:
-# DerivedNormalizationProps-5.2.0.txt
-# Date: 2009-08-26, 18:18:50 GMT [MD]
+# DerivedNormalizationProps-6.0.0.txt
+# Date: 2010-05-20, 15:14:12 GMT [MD]
#
# Unicode Character Database
-# Copyright (c) 1991-2009 Unicode, Inc.
+# Copyright (c) 1991-2010 Unicode, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
# For documentation, see http://www.unicode.org/reports/tr44/
@@ -43,7 +43,7 @@
# WARNING: Application to STRINGS must apply NFC after mapping each character, because characters may interact.
# For more information, see [http://www.unicode.org/reports/tr44/]
# Omitted code points are unchanged by this mapping.
-# @missing: 0000..10FFFF>
+# @missing: 0000..10FFFF; NFKC_CF;
# All code points not explicitly listed for NFKC_Casefold
# have the value