X-Git-Url: http://wien.tomnetworks.com/gitweb/?a=blobdiff_plain;f=mcs%2Fclass%2Fcorlib%2FMono.Globalization.Unicode%2FSimpleCollator.cs;h=cbe4d904eb17cdb8836bd2eb0ef914f839aff62b;hb=623803f165f9917497606d5e514609a71963fffa;hp=8fbe000b55ba5efecd033d39964d4a837ad3363b;hpb=6b9fb84c41e08d187f40a83e9084589b3a91a2d8;p=mono.git

diff --git a/mcs/class/corlib/Mono.Globalization.Unicode/SimpleCollator.cs b/mcs/class/corlib/Mono.Globalization.Unicode/SimpleCollator.cs
index 8fbe000b55b..cbe4d904eb1 100644
--- a/mcs/class/corlib/Mono.Globalization.Unicode/SimpleCollator.cs
+++ b/mcs/class/corlib/Mono.Globalization.Unicode/SimpleCollator.cs
@@ -4,16 +4,60 @@
 // This class will demonstrate CompareInfo functionality that will just work.
 //
 
+//
+// Here's a summary for supporting contractions, expansions and diacritical 
+// remappings.
+//
+// Diacritical mapping is a simple tailoring rule that "remaps" diacritical
+// weight value from one to another. For now it applies to all range of
+// characters, but at some stage we might need to limit the remapping ranges.
+//
+// A Contraction consists of a string (actually char[]) and a sortkey entry
+// (i.e. byte[]). It indicates that a sequence of characters is interpreted
+// as a single character that has the mapped sortkey value. There is no
+// character which goes across "special rules". When the collator encountered
+// such a sequence of characters, it just returns the sortkey value without
+// further replacement.
+//
+// Since it is still likely to happen that a contraction sequence matches
+// other character than the identical sequence (depending on CompareOptions
+// and of course, defined sortkey value itself), comparison cannot be done
+// at source char[] level.
+//
+// In IndexOf(), the first character in the target string or the target char
+// itself is turned into sortkey bytes. If the character has a contraction and
+// that is sortkey map, then it is used instead. If the contraction exists and
+// that is replacement map, then the first character of the replacement string
+// is searched instead. IndexOf() always searches only for the top character,
+// and if it returned negative value, then it returns -1. Otherwise, it then
+// tries IsPrefix() from that location. If it returns true, then it returns
+// the index.
+//
+// LAMESPEC: IndexOf() is lame as a whole API. It never matches in the middle
+// of expansion and there is no proper way to return such indexes within
+// a single int return value.
+//
+// For example, try below in .NET:
+//	IndexOf("\u00E6", "a")
+//	IndexOf("\u00E6", "e")
+//
+
+
 using System;
+using System.Collections;
 using System.Globalization;
 
 using Uni = Mono.Globalization.Unicode.MSCompatUnicodeTable;
+using UUtil = Mono.Globalization.Unicode.MSCompatUnicodeTableUtil;
 
 namespace Mono.Globalization.Unicode
 {
 	internal class SimpleCollator
 	{
-		SortKeyBuffer buf = new SortKeyBuffer ();
+		static SimpleCollator invariant =
+			new SimpleCollator (CultureInfo.InvariantCulture);
+
+		SortKeyBuffer buf;
 		// CompareOptions expanded.
 		bool ignoreNonSpace; // used in IndexOf()
 		bool ignoreSymbols;
@@ -22,11 +66,141 @@ namespace Mono.Globalization.Unicode
 		bool ignoreKanaType;
 		TextInfo textInfo; // for ToLower().
 		bool frenchSort;
+		unsafe readonly byte* cjkCatTable;
+		unsafe readonly byte* cjkLv1Table;
+		readonly CodePointIndexer cjkIndexer;
+		unsafe readonly byte* cjkLv2Table;
+		readonly CodePointIndexer cjkLv2Indexer;
+		readonly int lcid;
+		readonly Contraction [] contractions;
+		readonly Level2Map [] level2Maps;
+
+		// This flag marks characters as "unsafe", where the character
+		// could be used as part of a contraction (whose length > 1).
+		readonly bool [] unsafeFlags;
+
+		const int UnsafeFlagLength = 0x300;
+
+		// temporary sortkey buffer for index search/comparison
+		byte [] charSortKey = new byte [4];
+		byte [] charSortKey2 = new byte [4];
+		byte [] charSortKeyIndexTarget = new byte [4];
+
+		#region .ctor() and split functions
 
 		public SimpleCollator (CultureInfo culture)
 		{
+			lcid = culture.LCID;
 			textInfo = culture.TextInfo;
-			// FIXME: fill frenchSort from CultureInfo.
+			buf = new SortKeyBuffer (culture.LCID);
+
+			unsafe {
+				SetCJKTable (culture, ref cjkIndexer,
+					ref cjkCatTable, ref cjkLv1Table,
+					ref cjkLv2Indexer, ref cjkLv2Table);
+			}
+
+			// Get tailoring info
+			TailoringInfo t = null;
+			for (CultureInfo ci = culture; ci.LCID != 127; ci = ci.Parent) {
+				t = Uni.GetTailoringInfo (ci.LCID);
+				if (t != null)
+					break;
+			}
+			if (t == null) // then use invariant
+				t = Uni.GetTailoringInfo (127);
+
+			frenchSort = t.FrenchSort;
+			Uni.BuildTailoringTables (culture, t, ref contractions,
+				ref level2Maps);
+			unsafeFlags = new bool [UnsafeFlagLength];
+			foreach (Contraction c in contractions)
+				if (c.Source.Length > 1)
+					foreach (char ch in c.Source)
+						unsafeFlags [(int) ch] = true;
+
+			// FIXME: Since tailorings are mostly for latin
+			// (and in some cases Cyrillic) characters, it would
+			// be much better for performance to store "start 
+			// indexes" for > 370 (culture-specific letters).
+
+/*
+// dump tailoring table
+Console.WriteLine ("******** building table for {0} : c - {1} d - {2}",
+culture.LCID, contractions.Length, level2Maps.Length);
+foreach (Contraction c in contractions) {
+foreach (char cc in c.Source)
+Console.Write ("{0:X4} ", (int) cc);
+Console.WriteLine (" -> '{0}'", c.Replacement);
+}
+*/
+		}
+
+		unsafe private void SetCJKTable (
+			CultureInfo culture, ref CodePointIndexer cjkIndexer,
+			ref byte* catTable, ref byte* lv1Table,
+			ref CodePointIndexer lv2Indexer, ref byte* lv2Table)
+		{
+			string name = GetNeutralCulture (culture).Name;
+
+			Uni.FillCJK (name, ref cjkIndexer, ref catTable,
+				ref lv1Table, ref lv2Indexer, ref lv2Table);
+		}
+
+		static CultureInfo GetNeutralCulture (CultureInfo info)
+		{
+			CultureInfo ret = info;
+			while (ret.Parent != null && ret.Parent.LCID != 127)
+				ret = ret.Parent;
+			return ret;
+		}
+
+		#endregion
+
+		unsafe byte Category (int cp)
+		{
+			if (cp < 0x3000 || cjkCatTable == null)
+				return Uni.Category (cp);
+			int idx = cjkIndexer.ToIndex (cp);
+			return idx < 0 ? Uni.Category (cp) : cjkCatTable [idx];
+		}
+
+		unsafe byte Level1 (int cp)
+		{
+			if (cp < 0x3000 || cjkLv1Table == null)
+				return Uni.Level1 (cp);
+			int idx = cjkIndexer.ToIndex (cp);
+			return idx < 0 ? Uni.Level1 (cp) : cjkLv1Table [idx];
+		}
+
+		unsafe byte Level2 (int cp, ExtenderType ext)
+		{
+			if (ext == ExtenderType.Buggy)
+				return 5;
+			else if (ext == ExtenderType.Conditional)
+				return 0;
+
+			if (cp < 0x3000 || cjkLv2Table == null)
+				return Uni.Level2 (cp);
+			int idx = cjkLv2Indexer.ToIndex (cp);
+			byte ret = idx < 0 ? (byte) 0 : cjkLv2Table [idx];
+			if (ret != 0)
+				return ret;
+			ret = Uni.Level2 (cp);
+			if (level2Maps.Length == 0)
+				return ret;
+			for (int i = 0; i < level2Maps.Length; i++) {
+				if (level2Maps [i].Source == ret)
+					return level2Maps [i].Replace;
+				else if (level2Maps [i].Source > ret)
+					break;
+			}
+			return ret;
+		}
+
+		bool IsHalfKana (int cp)
+		{
+			return ignoreWidth || Uni.IsHalfWidthKana ((char) cp);
 		}
 
 		void SetOptions (CompareOptions options)
@@ -36,18 +210,103 @@ namespace Mono.Globalization.Unicode
 			this.ignoreWidth = (options & CompareOptions.IgnoreWidth) != 0;
 			this.ignoreCase = (options & CompareOptions.IgnoreCase) != 0;
 			this.ignoreKanaType = (options & CompareOptions.IgnoreKanaType) != 0;
+			previousChar = previousChar2 = -1;
+			previousSortKey = previousSortKey2 = null;
+			escape1.Source = escape2.Source = null;
 		}
 
-		string GetExpansion (int i)
+		Contraction GetContraction (string s, int start, int end)
 		{
-			// FIXME: handle tailorings
-			return Uni.GetExpansion ((char) i);
+			Contraction c = GetContraction (s, start, end, contractions);
+			if (c != null || lcid == 127)
+				return c;
+			return GetContraction (s, start, end, invariant.contractions);
+		}
+
+		Contraction GetContraction (string s, int start, int end, Contraction [] clist)
+		{
+			for (int i = 0; i < clist.Length; i++) {
+				Contraction ct = clist [i];
+				int diff = ct.Source [0] - s [start];
+				if (diff > 0)
+					return null; // it's already sorted
+				else if (diff < 0)
+					continue;
+				char [] chars = ct.Source;
+				if (end - start < chars.Length)
+					continue;
+				bool match = true;
+				for (int n = 0; n < chars.Length; n++)
+					if (s [start + n] != chars [n]) {
+						match = false;
+						break;
+					}
+				if (match)
+					return ct;
+			}
+			return null;
+		}
+
+		Contraction GetTailContraction (string s, int start, int end)
+		{
+			Contraction c = GetTailContraction (s, start, end, contractions);
+			if (c != null || lcid == 127)
+				return c;
+			return GetTailContraction (s, start, end, invariant.contractions);
+		}
+
+		Contraction GetTailContraction (string s, int start, int end, Contraction [] clist)
+		{
+			for (int i = 0; i < clist.Length; i++) {
+				Contraction ct = clist [i];
+				int diff = ct.Source [0] - s [end];
+				if (diff > 0)
+					return null; // it's already sorted
+				else if (diff < 0)
+					continue;
+				char [] chars = ct.Source;
+				if (start - end + 1 < chars.Length)
+					continue;
+				bool match = true;
+				int offset = start - chars.Length + 1;
+				for (int n = 0; n < chars.Length; n++)
+					if (s [offset + n] != chars [n]) {
+						match = false;
+						break;
+					}
+				if (match)
+					return ct;
+			}
+			return null;
+		}
+
+		Contraction GetContraction (char c)
+		{
+			Contraction ct = GetContraction (c, contractions);
+			if (ct != null || lcid == 127)
+				return ct;
+			return GetContraction (c, invariant.contractions);
+		}
+
+		Contraction GetContraction (char c, Contraction [] clist)
+		{
+			for (int i = 0; i < clist.Length; i++) {
+				Contraction ct = clist [i];
+				if (ct.Source [0] > c)
+					return null; // it's already sorted
+				if (ct.Source [0] == c && ct.Source.Length == 1)
+					return ct;
+			}
+			return null;
 		}
 
 		int FilterOptions (int i)
 		{
-			if (ignoreWidth)
-				i = Uni.ToWidthCompat (i);
+			if (ignoreWidth) {
+				int x = Uni.ToWidthCompat (i);
+				if (x != 0)
+					i = x;
+			}
 			if (ignoreCase)
 				i = textInfo.ToLower ((char) i);
 			if (ignoreKanaType)
@@ -55,6 +314,114 @@ namespace Mono.Globalization.Unicode
 			return i;
 		}
 
+		int previousChar = -1;
+		byte [] previousSortKey = null;
+		int previousChar2 = -1;
+		byte [] previousSortKey2 = null;
+
+		enum ExtenderType {
+			None,
+			Simple,
+			Voiced,
+			Conditional,
+			Buggy,
+		}
+
+		ExtenderType GetExtenderType (int i)
+		{
+			// LAMESPEC: Windows expects true for U+3005, but 
+			// sometimes it does not represent to repeat just
+			// one character.
+			// Windows also expects true for U+3031 and U+3032,
+			// but they should *never* repeat one character.
+
+			// U+2015 becomes an extender only when it is Japanese
+			if (i == 0x2015)
+				return lcid == 16 ? ExtenderType.Conditional :
+					ExtenderType.None;
+
+			if (i < 0x3005 || i > 0xFF70)
+				return ExtenderType.None;
+			if (i >= 0xFE7C) {
+				switch (i) {
+				case 0xFE7C:
+				case 0xFE7D:
+					return ExtenderType.Simple;
+				case 0xFF70:
+					return ExtenderType.Conditional;
+				case 0xFF9E:
+				case 0xFF9F:
+					return ExtenderType.Voiced;
+				}
+			}
+			if (i > 0x30FE)
+				return ExtenderType.None;
+			switch (i) {
+			case 0x3005: // LAMESPEC: see above.
+				return ExtenderType.Buggy;
+			case 0x3031: // LAMESPEC: see above.
+			case 0x3032: // LAMESPEC: see above.
+			case 0x309D:
+			case 0x30FD:
+				return ExtenderType.Simple;
+			case 0x309E:
+			case 0x30FE:
+				return ExtenderType.Voiced;
+			case 0x30FC:
+				return ExtenderType.Conditional;
+			default:
+				return ExtenderType.None;
+			}
+		}
+
+		byte ToDashTypeValue (ExtenderType ext)
+		{
+			if (ignoreNonSpace) // LAMESPEC: huh, why?
+				return 3;
+			switch (ext) {
+			case ExtenderType.None:
+				return 3;
+			case ExtenderType.Conditional:
+				return 5;
+			default:
+				return 4;
+			}
+		}
+
+		int FilterExtender (int i, ExtenderType ext)
+		{
+			if (ext == ExtenderType.Conditional &&
+				Uni.HasSpecialWeight ((char) i)) {
+				bool half = IsHalfKana ((char) i);
+				bool katakana = !Uni.IsHiragana ((char) i);
+				switch (Level1 (i) & 7) {
+				case 2:
+					return half ? 0xFF71 : katakana ? 0x30A2 : 0x3042;
+				case 3:
+					return half ? 0xFF72 : katakana ? 0x30A4 : 0x3044;
+				case 4:
+					return half ? 0xFF73 : katakana ? 0x30A6 : 0x3046;
+				case 5:
+					return half ? 0xFF74 : katakana ? 0x30A8 : 0x3048;
+				case 6:
+					return half ? 0xFF75 : katakana ? 0x30AA : 0x304A;
+				}
+			}
+			return i;
+		}
+
+		bool IsIgnorable (int i)
+		{
+			return Uni.IsIgnorable (i) ||
+				ignoreSymbols && Uni.IsIgnorableSymbol (i) ||
+				ignoreNonSpace && Uni.IsIgnorableNonSpacing (i);
+		}
+
+		bool IsSafe (int i)
+		{
+			return i >= unsafeFlags.Length ? true : !unsafeFlags [i];
+		}
+
 		#region GetSortKey()
 
 		public SortKey GetSortKey (string s)
@@ -71,32 +438,65 @@ namespace Mono.Globalization.Unicode
 		{
 			SetOptions (options);
 
+			buf.Initialize (options, lcid, s, frenchSort);
 			int end = start + length;
-			buf.Initialize (options, s, frenchSort);
+			GetSortKey (s, start, end);
+			return buf.GetResultAndReset ();
+		}
+
+		void GetSortKey (string s, int start, int end)
+		{
 			for (int n = start; n < end; n++) {
 				int i = s [n];
+
+				ExtenderType ext = GetExtenderType (i);
+				if (ext != ExtenderType.None) {
+					i = FilterExtender (previousChar, ext);
+					if (i >= 0)
+						FillSortKeyRaw (i, ext);
+					else if (previousSortKey != null) {
+						byte [] b = previousSortKey;
+						buf.AppendNormal (
+							b [0],
+							b [1],
+							b [2] != 1 ? b [2] : Level2 (i, ext),
+							b [3] != 1 ? b [3] : Uni.Level3 (i));
+					}
+					// otherwise do nothing.
+					// (if the extender is the first char
+					// in the string, then just ignore.)
+					continue;
+				}
+
 				if (IsIgnorable (i))
 					continue;
 				i = FilterOptions (i);
 
-				string expansion = GetExpansion (i);
-				if (expansion != null) {
-					foreach (char e in expansion)
-						FillSortKeyRaw (e);
+				Contraction ct = GetContraction (s, n, end);
+				if (ct != null) {
+					if (ct.Replacement != null) {
+						GetSortKey (ct.Replacement, 0, ct.Replacement.Length);
+					} else {
+						byte [] b = ct.SortKey;
+						buf.AppendNormal (
+							b [0],
+							b [1],
+							b [2] != 1 ? b [2] : Level2 (i, ext),
+							b [3] != 1 ? b [3] : Uni.Level3 (i));
+						previousSortKey = b;
+						previousChar = -1;
+					}
+					n += ct.Source.Length - 1;
+				}
+				else {
+					if (!Uni.IsIgnorableNonSpacing (i))
+						previousChar = i;
+					FillSortKeyRaw (i, ExtenderType.None);
 				}
-				else
-					FillSortKeyRaw (i);
 			}
-			return buf.GetResultAndReset ();
 		}
 
-		bool IsIgnorable (int i)
-		{
-			return Uni.IsIgnorable (i) ||
-				ignoreSymbols && Uni.IsIgnorableSymbol (i);
-		}
-
-		void FillSortKeyRaw (int i)
+		void FillSortKeyRaw (int i, ExtenderType ext)
 		{
 			if (0x3400 <= i && i <= 0x4DB5) {
 				int diff = i - 0x3400;
@@ -121,22 +521,28 @@ namespace Mono.Globalization.Unicode
 				return;
 			}
 
-			if (Uni.HasSpecialWeight ((char) i))
+			byte level2 = Level2 (i, ext);
+			if (Uni.HasSpecialWeight ((char) i)) {
+				byte level1 = Level1 (i);
 				buf.AppendKana (
-					Uni.Categories (i),
-					Uni.Level1 (i),
-					Uni.Level2 (i),
+					Category (i),
+					level1,
+					level2,
 					Uni.Level3 (i),
 					Uni.IsJapaneseSmallLetter ((char) i),
-					Uni.GetJapaneseDashType ((char) i),
+					ToDashTypeValue (ext),
 					!Uni.IsHiragana ((char) i),
-					Uni.IsHalfWidthKana ((char) i)
+					IsHalfKana ((char) i)
 					);
+				if (!ignoreNonSpace && ext == ExtenderType.Voiced)
+					// Append voice weight
+					buf.AppendNormal (1, 1, 1, 0);
+			}
 			else
 				buf.AppendNormal (
-					Uni.Categories (i),
-					Uni.Level1 (i),
-					Uni.Level2 (i),
+					Category (i),
+					Level1 (i),
+					level2,
 					Uni.Level3 (i));
 		}
 
@@ -186,9 +592,50 @@ namespace Mono.Globalization.Unicode
 			return Compare (s1, 0, s1.Length, s2, 0, s2.Length, options);
 		}
 
+		class Escape
+		{
+			public string Source;
+			public int Index;
+			public int Start;
+			public int End;
+			public int Optional;
+		}
+
+		// Those instances are reused not to invoke instantiation
+		// during Compare().
+		Escape escape1 = new Escape ();
+		Escape escape2 = new Escape ();
+
+		private int CompareOrdinal (string s1, int idx1, int len1,
+			string s2, int idx2, int len2)
+		{
+			int min = len1 < len2 ? len1 : len2;
+			int end1 = idx1 + min;
+			int end2 = idx2 + min;
+			for (int i1 = idx1, i2 = idx2;
+				i1 < end1 && i2 < end2; i1++, i2++)
+				if (s1 [i1] != s2 [i2])
+					return s1 [i1] - s2 [i2];
+			return len1 == len2 ? 0 :
+				len1 == min ? - 1 : 1;
+		}
+
 		public int Compare (string s1, int idx1, int len1,
 			string s2, int idx2, int len2, CompareOptions options)
 		{
+			// quick equality check
+			if (idx1 == idx2 && len1 == len2 &&
+				Object.ReferenceEquals (s1, s2))
+				return 0;
+			// FIXME: this should be done inside Compare() at
+			// any time.
+//			int ord = CompareOrdinal (s1, idx1, len1, s2, idx2, len2);
+//			if (ord == 0)
+//				return 0;
+			if (options == CompareOptions.Ordinal)
+				return CompareOrdinal (s1, idx1, len1, s2, idx2, len2);
+
+#if false // stable easy version, depends on GetSortKey().
 			SortKey sk1 = GetSortKey (s1, idx1, len1, options);
 			SortKey sk2 = GetSortKey (s2, idx2, len2, options);
 			byte [] d1 = sk1.KeyData;
@@ -198,158 +645,555 @@ namespace Mono.Globalization.Unicode
 				if (d1 [i] != d2 [i])
 					return d1 [i] < d2 [i] ? -1 : 1;
 			return d1.Length == d2.Length ? 0 : d1.Length < d2.Length ? -1 : 1;
+#else
+			SetOptions (options);
+			bool dummy, dummy2;
+			int ret = CompareInternal (s1, idx1, len1, s2, idx2, len2, (options & CompareOptions.StringSort) != 0, out dummy, out dummy2, true);
+			return ret == 0 ? 0 : ret < 0 ? -1 : 1;
+#endif
 		}
 
-		#endregion
+		int CompareInternal (string s1, int idx1, int len1, string s2,
+			int idx2, int len2, bool stringSort,
+			out bool targetConsumed, out bool sourceConsumed,
+			bool skipHeadingExtenders)
+		{
+			int start1 = idx1;
+			int start2 = idx2;
+			int end1 = idx1 + len1;
+			int end2 = idx2 + len2;
+			targetConsumed = false;
+			sourceConsumed = false;
+
+			// It holds final result that comes from the comparison
+			// at level 2 or lower. Even if Compare() found the
+			// difference at level 2 or lower, it still has to
+			// continue level 1 comparison. FinalResult is used
+			// when there was no further differences.
+			int finalResult = 0;
+			// It holds the comparison level to do. It starts from
+			// 5, and becomes 1 when we do primary-only comparison.
+			int currentLevel = 5;
+
+			int lv5At1 = -1;
+			int lv5At2 = -1;
+			int lv5Value1 = 0;
+			int lv5Value2 = 0;
+
+			// Skip heading extenders
+			if (skipHeadingExtenders) {
+				for (; idx1 < end1; idx1++)
+					if (GetExtenderType (s1 [idx1]) == ExtenderType.None)
+						break;
+				for (; idx2 < end2; idx2++)
+					if (GetExtenderType (s2 [idx2]) == ExtenderType.None)
+						break;
+			}
 
-		#region IsPrefix()
+			ExtenderType ext1 = ExtenderType.None;
+			ExtenderType ext2 = ExtenderType.None;
+
+			int quickCheckPos1 = idx1;
+			int quickCheckPos2 = idx2;
+
+			while (true) {
+				for (; idx1 < end1; idx1++)
+					if (!IsIgnorable (s1 [idx1]))
+						break;
+				for (; idx2 < end2; idx2++)
+					if (!IsIgnorable (s2 [idx2]))
+						break;
+
+				if (idx1 >= end1) {
+					if (escape1.Source == null)
+						break;
+					s1 = escape1.Source;
+					start1 = escape1.Start;
+					idx1 = escape1.Index;
+					end1 = escape1.End;
+					quickCheckPos1 = escape1.Optional;
+					escape1.Source = null;
+					continue;
+				}
+				if (idx2 >= end2) {
+					if (escape2.Source == null)
+						break;
+					s2 = escape2.Source;
+					start2 = escape2.Start;
+					idx2 = escape2.Index;
+					end2 = escape2.End;
+					quickCheckPos2 = escape2.Optional;
+					escape2.Source = null;
+					continue;
+				}
+#if true
+// If comparison is unstable, then this part is one of the most doubtful part.
+// Here we run quick codepoint comparison and run back to "stable" area to
+// compare characters.
+
+				// Strictly to say, even the first character
+				// could be compared here, but it messed
+				// backward step, so I just avoided mess.
+				if (quickCheckPos1 < idx1 && quickCheckPos2 < idx2) {
+					while (idx1 < end1 && idx2 < end2 &&
+						s1 [idx1] == s2 [idx2]) {
+						idx1++;
+						idx2++;
+					}
+					if (idx1 == end1 || idx2 == end2)
+						continue; // check replacement
+
+					int backwardEnd1 = quickCheckPos1;
+					int backwardEnd2 = quickCheckPos2;
+					quickCheckPos1 = idx1;
+					quickCheckPos2 = idx2;
+
+					idx1--;
+					idx2--;
+
+					for (;idx1 > backwardEnd1; idx1--)
+						if (Category (s1 [idx1]) != 1)
+							break;
+					for (;idx2 > backwardEnd2; idx2--)
+						if (Category (s2 [idx2]) != 1)
+							break;
+					for (;idx1 > backwardEnd1; idx1--)
+						if (IsSafe (s1 [idx1]))
+							break;
+					for (;idx2 > backwardEnd2; idx2--)
+						if (IsSafe (s2 [idx2]))
+							break;
+				}
+#endif
+
+				int cur1 = idx1;
+				int cur2 = idx2;
+				byte [] sk1 = null;
+				byte [] sk2 = null;
+				int i1 = FilterOptions (s1 [idx1]);
+				int i2 = FilterOptions (s2 [idx2]);
+				bool special1 = false;
+				bool special2 = false;
+
+				// If current character is an expander, then
+				// repeat the previous character.
+				ext1 = GetExtenderType (i1);
+				if (ext1 != ExtenderType.None) {
+					if (previousChar < 0) {
+						if (previousSortKey == null) {
+							// nothing to extend
+							idx1++;
+							continue;
+						}
+						sk1 = previousSortKey;
+					}
+					else
+						i1 = FilterExtender (previousChar, ext1);
+				}
+				ext2 = GetExtenderType (i2);
+				if (ext2 != ExtenderType.None) {
+					if (previousChar2 < 0) {
+						if (previousSortKey2 == null) {
+							// nothing to extend
+							idx2++;
+							continue;
+						}
+						sk2 = previousSortKey2;
+					}
+					else
+						i2 = FilterExtender (previousChar2, ext2);
+				}
 
-		public bool IsPrefix (string src, string target, CompareOptions opt)
-		{
-			return IsPrefix (src, target, 0, src.Length, opt);
-		}
+				byte cat1 = Category (i1);
+				byte cat2 = Category (i2);
+
+				// Handle special weight characters
+				if (!stringSort && currentLevel > 4) {
+					if (cat1 == 6) {
+						lv5At1 = escape1.Source != null ?
+							escape1.Index - escape1.Start :
+							cur1 - start1;
+						// here Windows has a bug that it does
+						// not consider thirtiary weight.
+						lv5Value1 = Level1 (i1) << 8 + Uni.Level3 (i1);
+						previousChar = i1;
+						idx1++;
+					}
+					if (cat2 == 6) {
+						lv5At2 = escape2.Source != null ?
+							escape2.Index - escape2.Start :
+							cur2 - start2;
+						// here Windows has a bug that it does
+						// not consider thirtiary weight.
+						lv5Value2 = Level1 (i2) << 8 + Uni.Level3 (i2);
+						previousChar2 = i2;
+						idx2++;
+					}
+					if (cat1 == 6 || cat2 == 6) {
+						currentLevel = 4;
+						continue;
+					}
+				}
 
-		public bool IsPrefix (string s, string target, int start, int length, CompareOptions opt)
-		{
-			SetOptions (opt);
+				Contraction ct1 = null;
+				if (ext1 == ExtenderType.None)
+					ct1 = GetContraction (s1, idx1, end1);
+
+				int offset1 = 1;
+				if (sk1 != null)
+					offset1 = 1;
+				else if (ct1 != null) {
+					offset1 = ct1.Source.Length;
+					if (ct1.SortKey != null) {
+						sk1 = charSortKey;
+						for (int i = 0; i < ct1.SortKey.Length; i++)
+							sk1 [i] = ct1.SortKey [i];
+						previousChar = -1;
+						previousSortKey = sk1;
+					}
+					else if (escape1.Source == null) {
+						escape1.Source = s1;
+						escape1.Start = start1;
+						escape1.Index = cur1 + ct1.Source.Length;
+						escape1.End = end1;
+						escape1.Optional = quickCheckPos1;
+						s1 = ct1.Replacement;
+						idx1 = 0;
+						start1 = 0;
+						end1 = s1.Length;
+						quickCheckPos1 = 0;
+						continue;
+					}
+				}
+				else {
+					sk1 = charSortKey;
+					sk1 [0] = cat1;
+					sk1 [1] = Level1 (i1);
+					if (!ignoreNonSpace && currentLevel > 1)
+						sk1 [2] = Level2 (i1, ext1);
+					if (currentLevel > 2)
+						sk1 [3] = Uni.Level3 (i1);
+					if (currentLevel > 3)
+						special1 = Uni.HasSpecialWeight ((char) i1);
+					if (cat1 > 1)
+						previousChar = i1;
+				}
 
-			int min = length > target.Length ? target.Length : length;
-			int si = start;
+				Contraction ct2 = null;
+				if (ext2 == ExtenderType.None)
+					ct2 = GetContraction (s2, idx2, end2);
+
+				if (sk2 != null)
+					idx2++;
+				else if (ct2 != null) {
+					idx2 += ct2.Source.Length;
+					if (ct2.SortKey != null) {
+						sk2 = charSortKey2;
+						for (int i = 0; i < ct2.SortKey.Length; i++)
+							sk2 [i] = ct2.SortKey [i];
+						previousChar2 = -1;
+						previousSortKey2 = sk2;
+					}
+					else if (escape2.Source == null) {
+						escape2.Source = s2;
+						escape2.Start = start2;
+						escape2.Index = cur2 + ct2.Source.Length;
+						escape2.End = end2;
+						escape2.Optional = quickCheckPos2;
+						s2 = ct2.Replacement;
+						idx2 = 0;
+						start2 = 0;
+						end2 = s2.Length;
+						quickCheckPos2 = 0;
+						continue;
+					}
+				}
+				else {
+					sk2 = charSortKey2;
+					sk2 [0] = cat2;
+					sk2 [1] = Level1 (i2);
+					if (!ignoreNonSpace && currentLevel > 1)
+						sk2 [2] = Level2 (i2, ext2);
+					if (currentLevel > 2)
+						sk2 [3] = Uni.Level3 (i2);
+					if (currentLevel > 3)
+						special2 = Uni.HasSpecialWeight ((char) i2);
+					if (cat2 > 1)
+						previousChar2 = i2;
+					idx2++;
+				}
 
-			// FIXME: this is not enough to handle tailorings.
-			for (int j = 0; j < min; j++, si++) {
-				int ci = FilterOptions (s [si]);
-				int cj = FilterOptions (target [j]);
-				if (ci == cj)
+				// Add offset here so that it does not skip
+				// idx1 while s2 has a replacement.
+				idx1 += offset1;
+
+				// add diacritical marks in s1 here
+				if (!ignoreNonSpace) {
+					while (idx1 < end1) {
+						if (Category (s1 [idx1]) != 1)
+							break;
+						if (sk1 [2] == 0)
+							sk1 [2] = 2;
+						sk1 [2] = (byte) (sk1 [2] + 
+							Level2 (s1 [idx1], ExtenderType.None));
+						idx1++;
+					}
+
+					// add diacritical marks in s2 here
+					while (idx2 < end2) {
+						if (Category (s2 [idx2]) != 1)
+							break;
+						if (sk2 [2] == 0)
+							sk2 [2] = 2;
+						sk2 [2] = (byte) (sk2 [2] + 
+							Level2 (s2 [idx2], ExtenderType.None));
+						idx2++;
+					}
+				}
+
+				int ret = sk1 [0] - sk2 [0];
+				ret = ret != 0 ? ret : sk1 [1] - sk2 [1];
+				if (ret != 0)
+					return ret;
+				if (currentLevel == 1)
+					continue;
+				if (!ignoreNonSpace) {
+					ret = sk1 [2] - sk2 [2];
+					if (ret != 0) {
+						finalResult = ret;
+						currentLevel = frenchSort ? 2 : 1;
+						continue;
+					}
+				}
+				if (currentLevel == 2)
 					continue;
-				if (IsIgnorable (s [si])) {
-					if (!IsIgnorable (target [j]))
-						j--;
+				ret = sk1 [3] - sk2 [3];
+				if (ret != 0) {
+					finalResult = ret;
+					currentLevel = 2;
 					continue;
 				}
-				else if (IsIgnorable (target [j])) {
-					si--;
+				if (currentLevel == 3)
+					continue;
+				if (special1 != special2) {
+					finalResult = special1 ? 1 : -1;
+					currentLevel = 3;
 					continue;
 				}
+				if (special1) {
+					ret = CompareFlagPair (
+						!Uni.IsJapaneseSmallLetter ((char) i1),
+						!Uni.IsJapaneseSmallLetter ((char) i2));
+					ret = ret != 0 ? ret :
+						ToDashTypeValue (ext1) -
+						ToDashTypeValue (ext2);
+					ret = ret != 0 ? ret : CompareFlagPair (
+						Uni.IsHiragana ((char) i1),
+						Uni.IsHiragana ((char) i2));
+					ret = ret != 0 ? ret : CompareFlagPair (
+						!IsHalfKana ((char) i1),
+						!IsHalfKana ((char) i2));
+					if (ret != 0) {
+						finalResult = ret;
+						currentLevel = 3;
+						continue;
+					}
+				}
+			}
 
-				// FIXME: should handle expansions (and it 
-				// should be before codepoint comparison).
-				string expansion = GetExpansion (s [si]);
-				if (expansion != null)
-					return false;
-				expansion = GetExpansion (target [j]);
-				if (expansion != null)
-					return false;
-
-				if (Uni.Categories (ci) != Uni.Categories (cj) ||
-					Uni.Level1 (ci) != Uni.Level1 (cj) ||
-					!ignoreNonSpace && Uni.Level2 (ci) != Uni.Level2 (cj) ||
-					Uni.Level3 (ci) != Uni.Level3 (cj))
-					return false;
-				if (!Uni.HasSpecialWeight ((char) ci))
-					continue;
-				if (Uni.IsJapaneseSmallLetter ((char) ci) !=
-					Uni.IsJapaneseSmallLetter ((char) cj) ||
-					Uni.GetJapaneseDashType ((char) ci) !=
-					Uni.GetJapaneseDashType ((char) cj) ||
-					!Uni.IsHiragana ((char) ci) !=
-					!Uni.IsHiragana ((char) cj) ||
-					Uni.IsHalfWidthKana ((char) ci) !=
-					Uni.IsHalfWidthKana ((char) cj))
-					return false;
+			// If there were only level 3 or lower differences,
+			// then we still have to find diacritical differences
+			// if any.
+			if (!ignoreNonSpace &&
+				finalResult != 0 && currentLevel > 2) {
+				while (idx1 < end1 && idx2 < end2) {
+					if (!Uni.IsIgnorableNonSpacing (s1 [idx1]))
+						break;
+					if (!Uni.IsIgnorableNonSpacing (s2 [idx2]))
+						break;
+					finalResult = Level2 (FilterOptions ((s1 [idx1])), ext1) - Level2 (FilterOptions (s2 [idx2]), ext2);
+					if (finalResult != 0)
+						break;
+					idx1++;
+					idx2++;
+					// they should work only for the first character
+					ext1 = ExtenderType.None;
+					ext2 = ExtenderType.None;
+				}
 			}
-			if (si == min) {
-				// All codepoints in the compared range
-				// matches. In that case, what matters 
-				// is whether the remaining part of 
-				// "target" is ignorable or not.
-				for (int i = min; i < target.Length; i++)
-					if (!IsIgnorable (target [i]))
-						return false;
-				return true;
+			if (currentLevel == 1 && finalResult != 0) {
+				while (idx1 < end1)
+					if (Uni.IsIgnorableNonSpacing (s1 [idx1]))
+						idx1++;
+				while (idx2 < end2)
+					if (Uni.IsIgnorableNonSpacing (s2 [idx2]))
+						idx2++;
 			}
-			return true;
+			// we still have to handle level 5
+			if (finalResult == 0) {
+				finalResult = lv5At1 - lv5At2;
+				if (finalResult == 0)
+					finalResult = lv5Value1 - lv5Value2;
+			}
+			if (finalResult == 0) {
+				if (idx2 == end2)
+					targetConsumed = true;
+				if (idx1 == end1)
+					sourceConsumed = true;
+			}
+			return idx1 != end1 ? 1 : idx2 == end2 ? finalResult : -1;
+		}
+
+		int CompareFlagPair (bool b1, bool b2)
+		{
+			return b1 == b2 ? 0 : b1 ? 1 : -1;
 		}
 
 		#endregion
 
-		#region IsSuffix()
+		#region IsPrefix() and IsSuffix()
 
-		public bool IsSuffix (string src, string target, CompareOptions opt)
+		public bool IsPrefix (string src, string target, CompareOptions opt)
 		{
-			return IsSuffix (src, target, 0, src.Length, opt);
+			return IsPrefix (src, target, 0, src.Length, opt);
 		}
 
-		// It is mostly copy of IsPrefix().
-		public bool IsSuffix (string s, string target, int start, int length, CompareOptions opt)
+		public bool IsPrefix (string s, string target, int start, int length, CompareOptions opt)
 		{
 			SetOptions (opt);
+			return IsPrefix (s, target, start, length, 
+				(opt & CompareOptions.StringSort) != 0, true);
+		}
 
-			int min = length > target.Length ? target.Length : length;
-			int si = start + length - 1;
+		public bool IsPrefix (string s, string target, int start, int length, bool stringSort, bool skipHeadingExtenders)
+		{
+			bool consumed, dummy;
+			int ret = CompareInternal (s, start, length,
+				target, 0, target.Length, stringSort,
+				out consumed, out dummy, skipHeadingExtenders);
+			return consumed;
+		}
 
-			// FIXME: this is not enough to handle tailorings.
-			for (int j = min - 1; j >= 0; j--, si--) {
-				int ci = FilterOptions (s [si]);
-				int cj = FilterOptions (target [j]);
-				if (ci == cj)
-					continue;
-				if (IsIgnorable (s [si])) {
-					if (!IsIgnorable (target [j]))
-						j++;
-					continue;
-				}
-				else if (IsIgnorable (target [j])) {
-					si++;
-					continue;
-				}
+		// IsSuffix()
 
-				// FIXME: should handle expansions (and it 
-				// should be before codepoint comparison).
-				string expansion = GetExpansion (s [si]);
-				if (expansion != null)
-					return false;
-				expansion = GetExpansion (target [j]);
-				if (expansion != null)
-					return false;
+		public bool IsSuffix (string src, string target, CompareOptions opt)
+		{
+			return IsSuffix (src, target, src.Length - 1, src.Length, opt);
+		}
 
-				if (Uni.Categories (ci) != Uni.Categories (cj) ||
-					Uni.Level1 (ci) != Uni.Level1 (cj) ||
-					!ignoreNonSpace && Uni.Level2 (ci) != Uni.Level2 (cj) ||
-					Uni.Level3 (ci) != Uni.Level3 (cj))
+		public bool IsSuffix (string s, string target, int start, int length, CompareOptions opt)
+		{
+			// quick check : simple codepoint comparison
+			if (s.Length >= target.Length) {
+				int si = start;
+				int se = start - length;
+				for (int i = target.Length - 1; si >= se && i >= 0; i--, si--)
+					if (s [si] != target [i])
+						break;
+				if (si == start + target.Length)
+					return true;
+			}
+
+			SetOptions (opt);
+			return IsSuffix (s, target, start, length,
+				(opt & CompareOptions.StringSort) != 0);
+		}
+
+		bool IsSuffix (string s, string t, int start, int length,
+			bool stringSort)
+		{
+			int tstart = 0;
+			for (;tstart < t.Length; tstart++)
+				if (!IsIgnorable (t [tstart]))
+					break;
+			if (tstart == t.Length)
+				return true; // as if target is String.Empty.
+
+#if false
+// This is still not working. If it is not likely to get working, then just remove it.
+			int si = start;
+			int send = start - length;
+			int ti = t.Length - 1;
+			int tend = -1;
+
+			int sStep = start + 1;
+			int tStep = t.Length;
+			bool sourceConsumed, targetConsumed;
+			while (true) {
+				for (; send < si; si--)
+					if (!IsIgnorable (s [si]))
+						break;
+				for (; tend < ti; ti--)
+					if (!IsIgnorable (t [ti]))
+						break;
+				if (tend == ti)
+					break;
+				for (; send < si; si--)
+					if (IsSafe (s [si]))
+						break;
+				for (; tend < ti; ti--)
+					if (IsSafe (t [ti]))
+						break;
+Console.WriteLine ("==== {0} {1} {2} {3} {4} {5} {6} {7} {8}", s, si, send, length, t, ti, tstart, sStep - si, tStep - ti);
+				if (CompareInternal (s, si, sStep - si,
+					t, ti, tStep - ti, stringSort,
+					out targetConsumed, out sourceConsumed,
+					true) != 0)
 					return false;
-				if (!Uni.HasSpecialWeight ((char) ci))
-					continue;
-				if (Uni.IsJapaneseSmallLetter ((char) ci) !=
-					Uni.IsJapaneseSmallLetter ((char) cj) ||
-					Uni.GetJapaneseDashType ((char) ci) !=
-					Uni.GetJapaneseDashType ((char) cj) ||
-					!Uni.IsHiragana ((char) ci) !=
-					!Uni.IsHiragana ((char) cj) ||
-					Uni.IsHalfWidthKana ((char) ci) !=
-					Uni.IsHalfWidthKana ((char) cj))
+				if (send == si)
 					return false;
+				sStep = si;
+				tStep = ti;
+				si--;
+				ti--;
 			}
-			if (si == min) {
-				// All codepoints in the compared range
-				// matches. In that case, what matters 
-				// is whether the remaining part of 
-				// "target" is ignorable or not.
-				for (int i = target.Length - min - 1; i >= 0; i--)
-					if (!IsIgnorable (target [i]))
+			return true;
+#else
+			// FIXME: it is not efficient for very long target.
+			bool sourceConsumed, targetConsumed;
+			int mismatchCount = 0;
+			for (int i = 0; i < length; i++) {
+				escape1.Source = escape2.Source = null;
+				previousSortKey = previousSortKey2 = null;
+				previousChar = previousChar2 = -1;
+
+				int ret = CompareInternal (s, start - i, i + 1,
+					t, tstart, t.Length - tstart,
+					stringSort, out targetConsumed,
+					out sourceConsumed, true);
+				if (ret == 0)
+					return true;
+				if (!sourceConsumed && targetConsumed)
+					return false;
+				if (!targetConsumed) {
+					mismatchCount++;
+					if (mismatchCount > Uni.MaxExpansionLength)
+						// The largest length of an
+						// expansion is 3, so if the
+						// target was not consumed more
+						// than 3 times, then the tail
+						// character does not match.
 						return false;
-				return true;
+				}
 			}
-			return true;
+			return false;
+#endif
 		}
 
 		#endregion
 
-		#region IndexOf()
+		#region IndexOf() / LastIndexOf()
+
+		public int IndexOf (string s, string target, CompareOptions opt)
+		{
+			return IndexOf (s, target, 0, s.Length, opt);
+		}
 
-		public int IndexOf (string s, char target)
+		public int IndexOf (string s, string target, int start, int length, CompareOptions opt)
 		{
-			return IndexOf (s, target, 0, s.Length, CompareOptions.None);
+			SetOptions (opt);
+			return IndexOf (s, target, start, length,
+				(opt & CompareOptions.StringSort) != 0);
 		}
 
 		public int IndexOf (string s, char target, CompareOptions opt)
@@ -359,153 +1203,404 @@ namespace Mono.Globalization.Unicode
 
 		public int IndexOf (string s, char target, int start, int length, CompareOptions opt)
 		{
-			// If target has an expansion, then use string search.
-			string expansion = GetExpansion (target);
-			if (expansion != null)
-				return IndexOf (s, expansion, start, length, opt);
-
 			SetOptions (opt);
 
-			int ti = FilterOptions ((int) target);
-			for (int idx = start; idx < length; idx++) {
-				switch (char.GetUnicodeCategory (s [idx])) {
-				case UnicodeCategory.PrivateUse:
-				case UnicodeCategory.Surrogate:
-					if (s [idx] != target)
-						continue;
-					return idx;
-				}
-
-				expansion = GetExpansion (s [idx]);
-				if (expansion != null)
-					continue; // since target cannot be expansion as conditioned above.
-				if (s [idx] == target)
-					return idx;
-				int si = FilterOptions ((int) s [idx]);
-				if (Uni.Categories (si) != Uni.Categories (ti) ||
-					Uni.Level1 (si) != Uni.Level1 (ti) ||
-					!ignoreNonSpace && Uni.Level2 (si) != Uni.Level2 (ti) ||
-					Uni.Level3 (si) != Uni.Level3 (ti))
-					continue;
-				if (!Uni.HasSpecialWeight ((char) si))
-					return idx;
-				if (Uni.IsJapaneseSmallLetter ((char) si) !=
-					Uni.IsJapaneseSmallLetter ((char) ti) ||
-					Uni.GetJapaneseDashType ((char) si) !=
-					Uni.GetJapaneseDashType ((char) ti) ||
-					!Uni.IsHiragana ((char) si) !=
-					!Uni.IsHiragana ((char) ti) ||
-					Uni.IsHalfWidthKana ((char) si) !=
-					Uni.IsHalfWidthKana ((char) ti))
-					continue;
+			// If target is contraction, then use string search.
+			Contraction ct = GetContraction (target);
+			if (ct != null) {
+				if (ct.Replacement != null)
+					return IndexOf (s, ct.Replacement, start, length,
+						(opt & CompareOptions.StringSort) != 0);
+				else
+					return IndexOfSortKey (s, start, length, ct.SortKey, char.MinValue, -1, true);
+			} else {
+				int ti = FilterOptions ((int) target);
+				charSortKeyIndexTarget [0] = Category (ti);
+				charSortKeyIndexTarget [1] = Level1 (ti);
+				if (!ignoreNonSpace)
+					charSortKeyIndexTarget [2] =
+						Level2 (ti, ExtenderType.None);
+				charSortKeyIndexTarget [3] = Uni.Level3 (ti);
+				return IndexOfSortKey (s, start, length,
+					charSortKeyIndexTarget, target, ti,
+					!Uni.HasSpecialWeight ((char) ti));
 			}
-			return -1;
 		}
 
-		public int IndexOf (string s, string target, CompareOptions opt)
+		// Searches target byte[] keydata
+		int IndexOfSortKey (string s, int start, int length, byte [] sortkey, char target, int ti, bool noLv4)
 		{
-			return IndexOf (s, target, 0, s.Length, opt);
+			int end = start + length;
+			int idx = start;
+			while (idx < end) {
+				int cur = idx;
+				if (MatchesForward (s, ref idx, end, ti, sortkey, noLv4))
+					return cur;
+			}
+			return -1;
 		}
 
-		public int IndexOf (string s, string target, int start, int length, CompareOptions opt)
+		// Searches string. Search head character (or keydata when
+		// the head is contraction sortkey) and try IsPrefix().
+		int IndexOf (string s, string target, int start, int length, bool stringSort)
 		{
-			SetOptions (opt);
+			int tidx = 0;
+			for (; tidx < target.Length; tidx++)
+				if (!IsIgnorable (target [tidx]))
+					break;
+			if (tidx == target.Length)
+				return start;
+			Contraction ct = GetContraction (target, tidx, target.Length - tidx);
+			string replace = ct != null ? ct.Replacement : null;
+			byte [] sk = replace == null ? charSortKeyIndexTarget : null;
+			bool noLv4 = true;
+			char tc = char.MinValue;
+			int ti = -1;
+			if (ct != null && sk != null) {
+				for (int i = 0; i < ct.SortKey.Length; i++)
+					sk [i] = ct.SortKey [i];
+			} else if (sk != null) {
+				tc = target [tidx];
+				ti = FilterOptions (target [tidx]);
+				sk [0] = Category (ti);
+				sk [1] = Level1 (ti);
+				if (!ignoreNonSpace)
+					sk [2] = Level2 (ti, ExtenderType.None);
+				sk [3] = Uni.Level3 (ti);
+				noLv4 = !Uni.HasSpecialWeight ((char) ti);
+			}
+			if (sk != null) {
+				for (tidx++; tidx < target.Length; tidx++) {
+					if (Category (target [tidx]) != 1)
+						break;
+					if (sk [2] == 0)
+						sk [2] = 2;
+					sk [2] = (byte) (sk [2] + Level2 (target [tidx], ExtenderType.None));
+				}
+			}
+
 			do {
-				// FIXME: this should be modified to handle
-				// expansions
-				int idx = IndexOf (s, target [0], start, length, opt);
+				int idx = 0;
+				if (replace != null)
+					idx = IndexOf (s, replace, start, length, stringSort);
+				else
+					idx = IndexOfSortKey (s, start, length, sk, tc, ti, noLv4);
 				if (idx < 0)
 					return -1;
-				if (IsPrefix (s, target, idx, length - (idx - start), opt))
+				length -= idx - start;
+				start = idx;
+				if (IsPrefix (s, target, start, length, stringSort, false))
 					return idx;
-				start++;
-				length--;
+				Contraction cts = GetContraction (s, start, length);
+				if (cts != null) {
+					start += cts.Source.Length;
+					length -= cts.Source.Length;
+				} else {
+					start++;
+					length--;
+				}
 			} while (length > 0);
 			return -1;
 		}
 
-		#endregion
+		//
+		// There are the same number of IndexOf() related methods,
+		// with the same functionalities for each.
+		//
 
-		#region LastIndexOf()
+		public int LastIndexOf (string s, string target, CompareOptions opt)
+		{
+			return LastIndexOf (s, target, s.Length - 1, s.Length, opt);
+		}
 
-		public int LastIndexOf (string s, char target)
+		public int LastIndexOf (string s, string target, int start, int length, CompareOptions opt)
 		{
-			return LastIndexOf (s, target, 0, s.Length, CompareOptions.None);
+			SetOptions (opt);
+			return LastIndexOf (s, target, start, length,
+				(opt & CompareOptions.StringSort) != 0);
 		}
 
 		public int LastIndexOf (string s, char target, CompareOptions opt)
 		{
-			return LastIndexOf (s, target, 0, s.Length, opt);
+			return LastIndexOf (s, target, s.Length - 1, s.Length, opt);
 		}
 
 		public int LastIndexOf (string s, char target, int start, int length, CompareOptions opt)
 		{
-			// If target has an expansion, then use string search.
-			string expansion = GetExpansion (target);
-			if (expansion != null)
-				return LastIndexOf (s, expansion, start, length, opt);
-
 			SetOptions (opt);
 
-			int ti = FilterOptions ((int) target);
-			for (int idx = start + length - 1; idx >= start; idx--) {
-				switch (char.GetUnicodeCategory (s [idx])) {
-				case UnicodeCategory.PrivateUse:
-				case UnicodeCategory.Surrogate:
-					if (s [idx] != target)
-						continue;
-					return idx;
-				}
-
-				expansion = GetExpansion (s [idx]);
-				if (expansion != null)
-					continue; // since target cannot be expansion as conditioned above.
-				if (s [idx] == target)
-					return idx;
-				int si = FilterOptions ((int) s [idx]);
-				if (Uni.Categories (si) != Uni.Categories (ti) ||
-					Uni.Level1 (si) != Uni.Level1 (ti) ||
-					!ignoreNonSpace && Uni.Level2 (si) != Uni.Level2 (ti) ||
-					Uni.Level3 (si) != Uni.Level3 (ti))
-					continue;
-				if (!Uni.HasSpecialWeight ((char) si))
-					return idx;
-				if (Uni.IsJapaneseSmallLetter ((char) si) !=
-					Uni.IsJapaneseSmallLetter ((char) ti) ||
-					Uni.GetJapaneseDashType ((char) si) !=
-					Uni.GetJapaneseDashType ((char) ti) ||
-					!Uni.IsHiragana ((char) si) !=
-					!Uni.IsHiragana ((char) ti) ||
-					Uni.IsHalfWidthKana ((char) si) !=
-					Uni.IsHalfWidthKana ((char) ti))
-					continue;
+			// If target is contraction, then use string search.
+			Contraction ct = GetContraction (target);
+			if (ct != null) {
+				if (ct.Replacement != null)
+					return LastIndexOf (s, ct.Replacement, start, length, (opt & CompareOptions.StringSort) != 0);
+				else
+					return LastIndexOfSortKey (s, start, start, length, ct.SortKey, char.MinValue, -1, true);
+			}
+			else {
+				int ti = FilterOptions ((int) target);
+				charSortKeyIndexTarget [0] = Category (ti);
+				charSortKeyIndexTarget [1] = Level1 (ti);
+				if (!ignoreNonSpace)
+					charSortKeyIndexTarget [2] = Level2 (ti, ExtenderType.None);
+				charSortKeyIndexTarget [3] = Uni.Level3 (ti);
+				return LastIndexOfSortKey (s, start, start, length, charSortKeyIndexTarget, target, ti, !Uni.HasSpecialWeight ((char) ti));
 			}
-			return -1;
 		}
 
-		public int LastIndexOf (string s, string target, CompareOptions opt)
+		// Searches target byte[] keydata
+		int LastIndexOfSortKey (string s, int start, int orgStart, int length, byte [] sortkey, char target, int ti, bool noLv4)
 		{
-			return LastIndexOf (s, target, 0, s.Length, opt);
+			int end = start - length;
+			int idx = start;
+			while (idx > end) {
+				int cur = idx;
+				if (MatchesBackward (s, ref idx, end, orgStart, ti, sortkey, noLv4))
+					return cur;
+			}
+			return -1;
 		}
 
-		public int LastIndexOf (string s, string target, int start, int length, CompareOptions opt)
+		// Searches string. Search head character (or keydata when
+		// the head is contraction sortkey) and try IsPrefix().
+		int LastIndexOf (string s, string target, int start, int length, bool stringSort)
 		{
-			SetOptions (opt);
+			int orgStart = start;
+			int tidx = 0;
+			for (; tidx < target.Length; tidx++)
+				if (!IsIgnorable (target [tidx]))
+					break;
+			if (tidx == target.Length)
+				return start;
+			Contraction ct = GetContraction (target, tidx, target.Length - tidx);
+			string replace = ct != null ? ct.Replacement : null;
+			byte [] sk = replace == null ? charSortKeyIndexTarget : null;
+
+			bool noLv4 = true;
+			char tc = char.MinValue;
+			int ti = -1;
+			if (ct != null && sk != null) {
+				for (int i = 0; i < ct.SortKey.Length; i++)
+					sk [i] = ct.SortKey [i];
+			} else if (sk != null) {
+				tc = target [tidx];
+				ti = FilterOptions (target [tidx]);
+				sk [0] = Category (ti);
+				sk [1] = Level1 (ti);
+				if (!ignoreNonSpace)
+					sk [2] = Level2 (ti, ExtenderType.None);
+				sk [3] = Uni.Level3 (ti);
+				noLv4 = !Uni.HasSpecialWeight ((char) ti);
+			}
+			if (sk != null) {
+				for (tidx++; tidx < target.Length; tidx++) {
+					if (Category (target [tidx]) != 1)
+						break;
+					if (sk [2] == 0)
+						sk [2] = 2;
+					sk [2] = (byte) (sk [2] + Level2 (target [tidx], ExtenderType.None));
+				}
+			}
 
 			do {
-				// FIXME: this should be modified to handle
-				// expansions
-				int idx = LastIndexOf (s, target [0], start, length, opt);
+				int idx = 0;
+
+				if (replace != null)
+					idx = LastIndexOf (s, replace, start, length, stringSort);
+				else
+					idx = LastIndexOfSortKey (s, start, orgStart, length, sk, tc, ti, noLv4);
 				if (idx < 0)
 					return -1;
+				length -= start - idx;
+				start = idx;
 
-				if (IsPrefix (s, target, idx, length - (idx - start), opt))
+				if (IsPrefix (s, target, idx, orgStart - idx + 1, stringSort, false)) {
+					for (;idx < orgStart; idx++)
+						if (!IsIgnorable (s [idx]))
+							break;
 					return idx;
-				length = idx - start - 1;
+				}
+				Contraction cts = GetContraction (s, idx, orgStart - idx + 1);
+				if (cts != null) {
+					start -= cts.Source.Length;
+					length -= cts.Source.Length;
+				} else {
+					start--;
+					length--;
+				}
 			} while (length > 0);
 			return -1;
 		}
 
+		private bool MatchesForward (string s, ref int idx, int end, int ti, byte [] sortkey, bool noLv4)
+		{
+			int si = -1;
+			ExtenderType ext = GetExtenderType (s [idx]);
+			Contraction ct = null;
+			if (ext == ExtenderType.None)
+				ct = GetContraction (s, idx, end);
+			else if (previousChar < 0) {
+				if (previousSortKey == null) {
+					idx++;
+					return false;
+				}
+				charSortKey = previousSortKey;
+			}
+			else
+				si = FilterExtender (previousChar, ext);
+			// if lv4 exists, it never matches contraction
+			if (ct != null) {
+				idx += ct.Source.Length;
+				if (!noLv4)
+					return false;
+				if (ct.SortKey != null) {
+					for (int i = 0; i < sortkey.Length; i++)
+						charSortKey [i] = sortkey [i];
+					previousChar = -1;
+					previousSortKey = charSortKey;
+				} else {
+					// Here is the core of LAMESPEC
+					// described at the top of the source.
+					int dummy = 0;
+					return MatchesForward (ct.Replacement, ref dummy,
+						ct.Replacement.Length, ti, sortkey, noLv4);
+				}
+			} else {
+				if (si < 0)
+					si = FilterOptions (s [idx]);
+				charSortKey [0] = Category (si);
+				charSortKey [1] = Level1 (si);
+				if (!ignoreNonSpace)
+					charSortKey [2] = Level2 (si, ext);
+				charSortKey [3] = Uni.Level3 (si);
+				if (charSortKey [0] != 1)
+					previousChar = si;
+				idx++;
+			}
+			for (; idx < end; idx++) {
+				if (Category (s [idx]) != 1)
+					break;
+				if (ignoreNonSpace)
+					continue;
+				if (charSortKey [2] == 0)
+						charSortKey [2] = 2;
+					charSortKey [2] = (byte) (charSortKey [2]
+						+ Level2 (s [idx], ExtenderType.None));
+			}
+
+			return MatchesPrimitive (charSortKey, si, ext, sortkey, ti, noLv4);
+		}
+
+		private bool MatchesPrimitive (byte [] charSortKey, int si, ExtenderType ext, byte [] sortkey, int ti, bool noLv4)
+		{
+			if (charSortKey [0] != sortkey [0] ||
+				charSortKey [1] != sortkey [1] ||
+				(!ignoreNonSpace && charSortKey [2] != sortkey [2]) ||
+				charSortKey [3] != sortkey [3])
+				return false;
+			if (noLv4 && (si < 0 || !Uni.HasSpecialWeight ((char) si)))
+				return true;
+			else if (noLv4)
+				return false;
+			// Since target can never be an extender, if the source
+			// is an expander and it matters, then they never match.
+			if (!ignoreNonSpace && ext == ExtenderType.Conditional)
+				return false;
+			if (Uni.IsJapaneseSmallLetter ((char) si) !=
+				Uni.IsJapaneseSmallLetter ((char) ti) ||
+				ToDashTypeValue (ext) !=
+				// FIXME: we will have to specify correct value for target
+				ToDashTypeValue (ExtenderType.None) ||
+				!Uni.IsHiragana ((char) si) !=
+				!Uni.IsHiragana ((char) ti) ||
+				IsHalfKana ((char) si) !=
+				IsHalfKana ((char) ti))
+				return false;
+			return true;
+		}
+
+		private bool MatchesBackward (string s, ref int idx, int end, int orgStart, int ti, byte [] sortkey, bool noLv4)
+		{
+			int cur = idx;
+			int si = -1;
+			ExtenderType ext = GetExtenderType (s [idx]);
+			// To handle extenders in source, we need to
+			// check next _primary_ character.
+			if (ext != ExtenderType.None) {
+				byte diacritical = 0;
+				for (int tmp = 0; ; tmp--) {
+					if (tmp < 0) // heading extender
+						return false;
+					if (IsIgnorable (s [tmp]))
+						continue;
+					int tmpi = FilterOptions (s [tmp]);
+					byte category = Category (tmpi);
+					if (category == 1) {
+						diacritical = Level2 (tmpi, ExtenderType.None);
+						continue;
+					}
+					si = FilterExtender (tmpi, ext);
+					charSortKey [0] = category;
+					charSortKey [1] = Level1 (si);
+					if (!ignoreNonSpace)
+						charSortKey [2] = Level2 (si, ext);
+					charSortKey [3] = Uni.Level3 (si);
+					if (ext != ExtenderType.Conditional &&
+						diacritical != 0)
+						charSortKey [2] =
+							(charSortKey [2] == 0) ?
+							(byte) (diacritical + 2) :
+							diacritical;
+					break;
+				}
+				idx--;
+			}
+			Contraction ct = null;
+			if (ext == ExtenderType.None)
+				ct = GetContraction (s, idx, end);
+			// if lv4 exists, it never matches contraction
+			if (ct != null) {
+				idx -= ct.Source.Length;
+				if (!noLv4)
+					return false;
+				if (ct.SortKey != null) {
+					for (int i = 0; i < sortkey.Length; i++)
+						charSortKey [i] = sortkey [i];
+					previousChar = -1;
+					previousSortKey = charSortKey;
+				} else {
+					// Here is the core of LAMESPEC
+					// described at the top of the source.
+					int dummy = ct.Replacement.Length - 1;
+					return MatchesBackward (ct.Replacement, 
+						ref dummy, dummy, -1, ti, sortkey, noLv4);
+				}
+			} else if (ext == ExtenderType.None) {
+				if (si < 0)
+					si = FilterOptions (s [idx]);
+				charSortKey [0] = Category (si);
+				charSortKey [1] = Level1 (si);
+				if (!ignoreNonSpace)
+					charSortKey [2] = Level2 (si, ext);
+				charSortKey [3] = Uni.Level3 (si);
+				if (charSortKey [0] != 1)
+					previousChar = si;
+				idx--;
+			}
+			if (ext == ExtenderType.None) {
+				for (int tmp = cur + 1; tmp < orgStart; tmp++) {
+					if (Category (s [tmp]) != 1)
+						break;
+					if (ignoreNonSpace)
+						continue;
+					if (charSortKey [2] == 0)
+							charSortKey [2] = 2;
+					charSortKey [2] = (byte) (charSortKey [2]
+						+ Level2 (s [tmp], ExtenderType.None));
+				}
+			}
+			return MatchesPrimitive (charSortKey, si, ext, sortkey, ti, noLv4);
+		}
 		#endregion
 	}
 }