/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

using System;

using Pattern = System.Text.RegularExpressions.Regex;

using NUnit.Framework;

using SimpleAnalyzer = Lucene.Net.Analysis.SimpleAnalyzer;
using Document = Lucene.Net.Documents.Document;
using Field = Lucene.Net.Documents.Field;
using IndexReader = Lucene.Net.Index.IndexReader;
using IndexWriter = Lucene.Net.Index.IndexWriter;
using Term = Lucene.Net.Index.Term;
using RAMDirectory = Lucene.Net.Store.RAMDirectory;
using DocIdBitSet = Lucene.Net.Util.DocIdBitSet;

namespace Lucene.Net.Search
{
    /// <summary> Unit tests for sorting code.
    ///
    /// <p>Created: Feb 17, 2004 4:55:10 PM</p>
    /// </summary>
    /// <since>lucene 1.4</since>
    /// <version>$Id: TestSort.java 590530 2007-10-31 01:28:25Z gsingers $</version>
    [Serializable]
    [TestFixture]
    public class TestSort
    {
        /// <summary>
        /// Filter that lets through exactly one document: the first hit of the
        /// <c>TopDocs</c> it was constructed with.
        /// </summary>
        [Serializable]
        private class AnonymousClassFilter : Filter
        {
            private Lucene.Net.Search.TopDocs docs1;
            private TestSort enclosingInstance;

            public AnonymousClassFilter(Lucene.Net.Search.TopDocs docs1, TestSort enclosingInstance)
            {
                InitBlock(docs1, enclosingInstance);
            }

            private void InitBlock(Lucene.Net.Search.TopDocs docs1, TestSort enclosingInstance)
            {
                this.docs1 = docs1;
                this.enclosingInstance = enclosingInstance;
            }

            public TestSort Enclosing_Instance
            {
                get { return enclosingInstance; }
            }

            /// <summary>Returns a doc-id set containing only the first hit of <c>docs1</c>.</summary>
            public override DocIdSet GetDocIdSet(IndexReader reader)
            {
                return new DocIdBitSet(FirstHitBits(reader));
            }

            /// <summary>Returns a bit array with only the bit of the first hit of <c>docs1</c> set.</summary>
            [System.Obsolete()]
            public override System.Collections.BitArray Bits(IndexReader reader)
            {
                return FirstHitBits(reader);
            }

            // Builds a bit array whose length is MaxDoc rounded up to a multiple of 64,
            // with the bit for docs1.scoreDocs[0] set.
            private System.Collections.BitArray FirstHitBits(IndexReader reader)
            {
                int maxDoc = reader.MaxDoc();
                int words = (maxDoc % 64 == 0) ? maxDoc / 64 : maxDoc / 64 + 1;
                System.Collections.BitArray bs = new System.Collections.BitArray(words * 64);
                bs.Set(docs1.scoreDocs[0].doc, true);
                return bs;
            }
        }

        private Searcher full;
        private Searcher searchX;
        private Searcher searchY;
        private Query queryX;
        private Query queryY;
        private Query queryA;
        private Query queryE;
        private Query queryF;
        private Query queryG;
        private Sort sort;

        private bool serverStarted = false;
        private int port;

        /// <summary>
        /// Stand-alone entry point. With the single argument "server" it publishes the
        /// remote searchable and keeps the process alive for 500 seconds.
        /// </summary>
        [STAThread]
        public static void Main(System.String[] argv)
        {
            System.Runtime.Remoting.RemotingConfiguration.Configure("Lucene.Net.Search.TestSort.config", false);
            System.Runtime.Remoting.Channels.ChannelServices.RegisterChannel(new System.Runtime.Remoting.Channels.Http.HttpChannel(8080), false);
            if (argv == null || argv.Length < 1)
            {
                // NUnit.Core.TestRunner.Run(Suite());    // {{Aroush-1.9}} where is "Run" in NUnit?
            }
            else if ("server".Equals(argv[0]))
            {
                TestSort test = new TestSort();
                try
                {
                    test.StartServer();
                    // 500000 ms expressed in ticks.
                    System.Threading.Thread.Sleep(new System.TimeSpan(System.TimeSpan.TicksPerMillisecond * 500000));
                }
                catch (System.Exception e)
                {
                    System.Console.Out.WriteLine(e);
                    System.Console.Error.WriteLine(e.StackTrace);
                }
            }

            System.Console.ReadLine();
        }

        // Decimal separator of the current culture; used to build the numeric test
        // values below so they are written in the culture the test runs under.
        private static readonly string NDS = System.Globalization.CultureInfo.CurrentCulture.NumberFormat.NumberDecimalSeparator;

        // document data:
        // the tracer field is used to determine which document was hit
        // the contents field is used to search and sort by relevance
        // the int field to sort by int
        // the float field to sort by float
        // the string field to sort by string
        // the i18n field includes accented characters for testing locale-specific sorting
        private string[][] data = new string[][]
        {
            // {dougsale-2.4.0}
            // As C# doesn't support a signed byte datatype, the byte values of the data array have been adjusted
            // to work as expected (maintained relative sort-ordering of documents).
            // All the byte values had 51 added to them except MinValue and MaxValue
            // (as -50 was the lowest value apart from MinValue).
            // Note: The inconsistent behavior of fields interpreted as byte for sorting purposes could pose a problem for someone
            // using an index across Lucene and Lucene.NET.

            // tracer  contents         int            float                     string   custom   i18n               long            double, 'short', byte
            new string[] { "A", "x a", "5", "4f", "c", "A-3", "p\u00EAche", "10", "-4" + NDS + "0", "3", "177"/*"126"*/ }, //A,x
            new string[] { "B", "y a", "5", "3" + NDS + "4028235E38", "i", "B-10", "HAT", "1000000000", "40" + NDS + "0", "24", "52"/*"1"*/ }, //B,y
            new string[] { "C", "x a b c", "2147483647", "1" + NDS + "0", "j", "A-2", "p\u00E9ch\u00E9", "99999999", "40" + NDS + "00002343", "125", "66"/*"15"*/ }, //C,x

            // {dougsale-2.4.0}
            // Can't convert from System.Double.MinValue or System.Double.MaxValue to a string and then back to a double
            // without a System.OverflowException occurring on the way back from string to double - so reduced the
            // magnitude of the values while maintaining the relative sort orders.  Perhaps we should be using decimal instead
            // of double...
            // The two literals below use NDS like every other decimal value in this table.
            new string[] { "D", "y a b c", "-1", "0" + NDS + "0f", "a", "C-0", "HUT", System.Int64.MaxValue.ToString(), "-1" + NDS + "77971620351369E+308" /*System.Double.MinValue.ToString()*/, System.Int16.MinValue.ToString(), System.Byte.MinValue.ToString() }, //D,y
            new string[] { "E", "x a b c d", "5", "2f", "h", "B-8", "peach", System.Int64.MinValue.ToString(), "1" + NDS + "77971620351369E+308" /*System.Double.MaxValue.ToString()*/, System.Int16.MaxValue.ToString(), System.Byte.MaxValue.ToString() }, //E,x

            new string[] { "F", "y a b c d", "2", "3" + NDS + "14159f", "g", "B-1", "H\u00C5T", "-44", "343" + NDS + "034435444", "-3", "51"/*"0"*/ }, //F,y
            new string[] { "G", "x a b c d", "3", "-1" + NDS + "0", "f", "C-100", "sin", "323254543543", "4" + NDS + "043544", "5", "151"/*"100"*/ }, //G,x
            new string[] { "H", "y a b c d", "0", "1" + NDS + "4E-45", "e", "C-88", "H\u00D8T", "1023423423005", "4" + NDS + "043545", "10", "1"/*"-50"*/ }, //H,y
            new string[] { "I", "x a b c d e f", "-2147483648", "1" + NDS + "0e+0", "d", "A-10", "s\u00EDn", "332422459999", "4" + NDS + "043546", "-340", "102"/*"51"*/ }, //I,x
            new string[] { "J", "y a b c d e f", "4", "" + NDS + "5", "b", "C-7", "HOT", "34334543543", "4" + NDS + "0000220343", "300", "53"/*"2"*/ }, //J,y
            new string[] { "W", "g", "1", null, null, null, null, null, null, null, null },
            new string[] { "X", "g", "1", "0" + NDS + "1", null, null, null, null, null, null, null },
            new string[] { "Y", "g", "1", "0" + NDS + "2", null, null, null, null, null, null, null },
            new string[] { "Z", "f g", null, null, null, null, null, null, null, null, null }
        };

        // Names of the optional sort fields, in the order of columns 2..10 of the data table.
        private static readonly string[] OptionalFieldNames = new string[]
        {
            "int", "float", "string", "custom", "i18n", "long", "double", "short", "byte"
        };

        /// <summary>
        /// Creates an in-memory index of all the documents, or just the x, or just the y documents.
        /// </summary>
        /// <param name="even">include the rows at even positions of the data table</param>
        /// <param name="odd">include the rows at odd positions of the data table</param>
        /// <returns>a searcher over the newly built index</returns>
        private Searcher GetIndex(bool even, bool odd)
        {
            RAMDirectory indexStore = new RAMDirectory();
            IndexWriter writer = new IndexWriter(indexStore, new SimpleAnalyzer(), true, IndexWriter.MaxFieldLength.LIMITED);
            for (int i = 0; i < data.Length; ++i)
            {
                bool isEvenRow = (i % 2) == 0;
                if ((isEvenRow && even) || (!isEvenRow && odd))
                {
                    Document doc = new Document();
                    doc.Add(new Field("tracer", data[i][0], Field.Store.YES, Field.Index.NO));
                    doc.Add(new Field("contents", data[i][1], Field.Store.NO, Field.Index.ANALYZED));

                    // Each optional field is added only when its own column is non-null.
                    // (Previously "short" and "byte" were guarded by the "double" column.)
                    for (int f = 0; f < OptionalFieldNames.Length; ++f)
                    {
                        string value = data[i][f + 2];
                        if (value != null)
                        {
                            doc.Add(new Field(OptionalFieldNames[f], value, Field.Store.NO, Field.Index.NOT_ANALYZED));
                        }
                    }

                    doc.SetBoost(2); // produce some scores above 1.0
                    writer.AddDocument(doc);
                }
            }
            writer.Optimize();
            writer.Close();
            return new IndexSearcher(indexStore);
        }

        private Searcher GetFullIndex()
        {
            return GetIndex(true, true);
        }

        private Searcher GetXIndex()
        {
            return GetIndex(true, false);
        }

        private Searcher GetYIndex()
        {
            return GetIndex(false, true);
        }

        private Searcher GetEmptyIndex()
        {
            return GetIndex(false, false);
        }

        /// <summary>Builds the three indexes and the queries, and starts the remote server once.</summary>
        [SetUp]
        public virtual void SetUp()
        {
            full = GetFullIndex();
            searchX = GetXIndex();
            searchY = GetYIndex();
            queryX = new TermQuery(new Term("contents", "x"));
            queryY = new TermQuery(new Term("contents", "y"));
            queryA = new TermQuery(new Term("contents", "a"));
            queryE = new TermQuery(new Term("contents", "e"));
            queryF = new TermQuery(new Term("contents", "f"));
            queryG = new TermQuery(new Term("contents", "g"));
            sort = new Sort();

            if (!serverStarted)
            {
                StartServer();
            }
        }

        // test the sorts by score and document number
        [Test]
        public virtual void TestBuiltInSorts()
        {
            sort = new Sort();
            AssertMatches(full, queryX, sort, "ACEGI");
            AssertMatches(full, queryY, sort, "BDFHJ");

            sort.SetSort(SortField.FIELD_DOC);
            AssertMatches(full, queryX, sort, "ACEGI");
            AssertMatches(full, queryY, sort, "BDFHJ");
        }

        // test sorts where the type of field is specified
        [Test]
        public virtual void TestTypedSort()
        {
            sort.SetSort(new SortField[] { new SortField("int", SortField.INT), SortField.FIELD_DOC });
            AssertMatches(full, queryX, sort, "IGAEC");
            AssertMatches(full, queryY, sort, "DHFJB");

            sort.SetSort(new SortField[] { new SortField("float", SortField.FLOAT), SortField.FIELD_DOC });
            AssertMatches(full, queryX, sort, "GCIEA");
            AssertMatches(full, queryY, sort, "DHJFB");

            sort.SetSort(new SortField[] { new SortField("string", SortField.STRING), SortField.FIELD_DOC });
            AssertMatches(full, queryX, sort, "AIGEC");
            AssertMatches(full, queryY, sort, "DJHFB");

            sort.SetSort(new SortField[] { new SortField("double", SortField.DOUBLE), SortField.FIELD_DOC });
            AssertMatches(full, queryX, sort, "AGICE");
            AssertMatches(full, queryY, sort, "DJHBF");

            sort.SetSort(new SortField[] { new SortField("byte", SortField.BYTE), SortField.FIELD_DOC });
            AssertMatches(full, queryX, sort, "CIGAE");
            AssertMatches(full, queryY, sort, "DHFBJ");

            sort.SetSort(new SortField[] { new SortField("short", SortField.SHORT), SortField.FIELD_DOC });
            AssertMatches(full, queryX, sort, "IAGCE");
            AssertMatches(full, queryY, sort, "DFHBJ");

            sort.SetSort(new SortField[] { new SortField("string", SortField.STRING), SortField.FIELD_DOC });
            AssertMatches(full, queryX, sort, "AIGEC");
            AssertMatches(full, queryY, sort, "DJHFB");
        }

        // test sorts when there's nothing in the index
        [Test]
        public virtual void TestEmptyIndex()
        {
            Searcher empty = GetEmptyIndex();

            sort = new Sort();
            AssertMatches(empty, queryX, sort, "");

            sort.SetSort(SortField.FIELD_DOC);
            AssertMatches(empty, queryX, sort, "");

            sort.SetSort(new SortField[] { new SortField("int", SortField.INT), SortField.FIELD_DOC });
            AssertMatches(empty, queryX, sort, "");

            sort.SetSort(new SortField[] { new SortField("string", SortField.STRING, true), SortField.FIELD_DOC });
            AssertMatches(empty, queryX, sort, "");

            sort.SetSort(new SortField[] { new SortField("float", SortField.FLOAT), new SortField("string", SortField.STRING) });
            AssertMatches(empty, queryX, sort, "");
        }

        // test sorts where the type of field is determined dynamically
        [Test]
        public virtual void TestAutoSort()
        {
            sort.SetSort("int");
            AssertMatches(full, queryX, sort, "IGAEC");
            AssertMatches(full, queryY, sort, "DHFJB");

            sort.SetSort("float");
            AssertMatches(full, queryX, sort, "GCIEA");
            AssertMatches(full, queryY, sort, "DHJFB");

            sort.SetSort("string");
            AssertMatches(full, queryX, sort, "AIGEC");
            AssertMatches(full, queryY, sort, "DJHFB");
        }

        // test sorts in reverse
        [Test]
        public virtual void TestReverseSort()
        {
            sort.SetSort(new SortField[] { new SortField(null, SortField.SCORE, true), SortField.FIELD_DOC });
            AssertMatches(full, queryX, sort, "IEGCA");
            AssertMatches(full, queryY, sort, "JFHDB");

            sort.SetSort(new SortField(null, SortField.DOC, true));
            AssertMatches(full, queryX, sort, "IGECA");
            AssertMatches(full, queryY, sort, "JHFDB");

            sort.SetSort("int", true);
            AssertMatches(full, queryX, sort, "CAEGI");
            AssertMatches(full, queryY, sort, "BJFHD");

            sort.SetSort("float", true);
            AssertMatches(full, queryX, sort, "AECIG");
            AssertMatches(full, queryY, sort, "BFJHD");

            sort.SetSort("string", true);
            AssertMatches(full, queryX, sort, "CEGIA");
            AssertMatches(full, queryY, sort, "BFHJD");
        }

        // test sorting when the sort field is empty (undefined) for some of the documents
        [Test]
        public virtual void TestEmptyFieldSort()
        {
            sort.SetSort("string");
            AssertMatches(full, queryF, sort, "ZJI");

            sort.SetSort("string", true);
            AssertMatches(full, queryF, sort, "IJZ");

            sort.SetSort(new SortField("i18n", new System.Globalization.CultureInfo("en")));
            AssertMatches(full, queryF, sort, "ZJI");

            sort.SetSort(new SortField("i18n", new System.Globalization.CultureInfo("en"), true));
            AssertMatches(full, queryF, sort, "IJZ");

            sort.SetSort("int");
            AssertMatches(full, queryF, sort, "IZJ");

            sort.SetSort("int", true);
            AssertMatches(full, queryF, sort, "JZI");

            sort.SetSort("float");
            AssertMatches(full, queryF, sort, "ZJI");

            // using a nonexisting field as first sort key shouldn't make a difference:
            sort.SetSort(new SortField[] { new SortField("nosuchfield", SortField.STRING), new SortField("float") });
            AssertMatches(full, queryF, sort, "ZJI");

            sort.SetSort("float", true);
            AssertMatches(full, queryF, sort, "IJZ");

            // When a field is null for both documents, the next SortField should be used.
            AssertNullFieldsFallThrough(full);

            // Do the same for a MultiSearcher
            Searcher multiSearcher = new MultiSearcher(new Lucene.Net.Search.Searchable[] { full });
            AssertNullFieldsFallThrough(multiSearcher);
            // Don't close the multiSearcher. it would close the full searcher too!

            // Do the same for a ParallelMultiSearcher
            Searcher parallelSearcher = new ParallelMultiSearcher(new Lucene.Net.Search.Searchable[] { full });
            AssertNullFieldsFallThrough(parallelSearcher);
            // Don't close the parallelSearcher. it would close the full searcher too!
        }

        // Sorts the "g" documents by int, string, float and checks that the float key
        // decides the order in both directions.
        private void AssertNullFieldsFallThrough(Searcher searcher)
        {
            sort.SetSort(new SortField[] { new SortField("int"), new SortField("string", SortField.STRING), new SortField("float") });
            AssertMatches(searcher, queryG, sort, "ZWXY");

            // Reverse the last criterion to make sure the test didn't pass by chance
            sort.SetSort(new SortField[] { new SortField("int"), new SortField("string", SortField.STRING), new SortField("float", true) });
            AssertMatches(searcher, queryG, sort, "ZYXW");
        }

        // test sorts using a series of fields
        [Test]
        public virtual void TestSortCombos()
        {
            sort.SetSort(new System.String[] { "int", "float" });
            AssertMatches(full, queryX, sort, "IGEAC");

            sort.SetSort(new SortField[] { new SortField("int", true), new SortField(null, SortField.DOC, true) });
            AssertMatches(full, queryX, sort, "CEAGI");

            sort.SetSort(new System.String[] { "float", "string" });
            AssertMatches(full, queryX, sort, "GICEA");
        }

        // test using a Locale for sorting strings
        [Test]
        public virtual void TestLocaleSort()
        {
            sort.SetSort(new SortField[] { new SortField("string", new System.Globalization.CultureInfo("en-US")) });
            AssertMatches(full, queryX, sort, "AIGEC");
            AssertMatches(full, queryY, sort, "DJHFB");

            sort.SetSort(new SortField[] { new SortField("string", new System.Globalization.CultureInfo("en-US"), true) });
            AssertMatches(full, queryX, sort, "CEGIA");
            AssertMatches(full, queryY, sort, "BFHJD");
        }

        // test using various international locales with accented characters
        // (which sort differently depending on locale)
        [Test]
        public virtual void TestInternationalSort()
        {
            sort.SetSort(new SortField("i18n", new System.Globalization.CultureInfo("en-US")));
            AssertMatches(full, queryY, sort, "BFJHD"); // NOTE: this is "BFJDH" in Java's version

            sort.SetSort(new SortField("i18n", new System.Globalization.CultureInfo("sv-se")));
            AssertMatches(full, queryY, sort, "BJDFH");

            sort.SetSort(new SortField("i18n", new System.Globalization.CultureInfo("da-dk")));
            AssertMatches(full, queryY, sort, "BJDHF");

            sort.SetSort(new SortField("i18n", new System.Globalization.CultureInfo("en-US")));
            AssertMatches(full, queryX, sort, "ECAGI");

            sort.SetSort(new SortField("i18n", new System.Globalization.CultureInfo("fr-FR")));
            AssertMatches(full, queryX, sort, "EACGI");
        }

        // Test the MultiSearcher's ability to preserve locale-sensitive ordering
        // by wrapping it around a single searcher
        [Test]
        public virtual void TestInternationalMultiSearcherSort()
        {
            Searcher multiSearcher = new MultiSearcher(new Lucene.Net.Search.Searchable[] { full });

            sort.SetSort(new SortField("i18n", new System.Globalization.CultureInfo("sv-se")));
            AssertMatches(multiSearcher, queryY, sort, "BJDFH");

            sort.SetSort(new SortField("i18n", new System.Globalization.CultureInfo("en-US")));
            AssertMatches(multiSearcher, queryY, sort, "BFJHD"); // NOTE: this is "BFJDH" in Java's version

            sort.SetSort(new SortField("i18n", new System.Globalization.CultureInfo("da-dk")));
            AssertMatches(multiSearcher, queryY, sort, "BJDHF");
        }

        // test a custom sort function
        [Test]
        public virtual void TestCustomSorts()
        {
            RunCustomSorts(full);
        }

        // test a variety of sorts using more than one searcher
        [Test]
        public virtual void TestMultiSort()
        {
            MultiSearcher searcher = new MultiSearcher(new Lucene.Net.Search.Searchable[] { searchX, searchY });
            RunMultiSorts(searcher);
        }

        // test a variety of sorts using a parallel multisearcher
        [Test]
        public virtual void TestParallelMultiSort()
        {
            Searcher searcher = new ParallelMultiSearcher(new Lucene.Net.Search.Searchable[] { searchX, searchY });
            RunMultiSorts(searcher);
        }

        // test a variety of sorts using a remote searcher
        [Test]
        public virtual void TestRemoteSort()
        {
            Lucene.Net.Search.Searchable searcher = GetRemote();
            MultiSearcher multi = new MultiSearcher(new Lucene.Net.Search.Searchable[] { searcher });
            RunMultiSorts(multi);
        }

        // test custom search when remote
        [Test]
        public virtual void TestRemoteCustomSort()
        {
            Lucene.Net.Search.Searchable searcher = GetRemote();
            MultiSearcher multi = new MultiSearcher(new Lucene.Net.Search.Searchable[] { searcher });
            RunCustomSorts(multi);
        }

        // Sorts on the "custom" field with both the comparator source and the
        // SortComparator from SampleComparable, forward on queryX and reversed on queryY.
        private void RunCustomSorts(Searcher searcher)
        {
            sort.SetSort(new SortField("custom", SampleComparable.GetComparatorSource()));
            AssertMatches(searcher, queryX, sort, "CAIEG");

            sort.SetSort(new SortField("custom", SampleComparable.GetComparatorSource(), true));
            AssertMatches(searcher, queryY, sort, "HJDBF");

            SortComparator custom = SampleComparable.GetComparator();
            sort.SetSort(new SortField("custom", custom));
            AssertMatches(searcher, queryX, sort, "CAIEG");

            sort.SetSort(new SortField("custom", custom, true));
            AssertMatches(searcher, queryY, sort, "HJDBF");
        }

        // test that the relevancy scores are the same even if
        // hits are sorted
        [Test]
        public virtual void TestNormalizedScores()
        {
            // capture relevancy scores
            System.Collections.Hashtable scoresX = GetScores(full.Search(queryX, null, 1000).scoreDocs, full);
            System.Collections.Hashtable scoresY = GetScores(full.Search(queryY, null, 1000).scoreDocs, full);
            System.Collections.Hashtable scoresA = GetScores(full.Search(queryA, null, 1000).scoreDocs, full);

            // we'll test searching locally, remote and multi
            MultiSearcher remote = new MultiSearcher(new Lucene.Net.Search.Searchable[] { GetRemote() });
            MultiSearcher multi = new MultiSearcher(new Lucene.Net.Search.Searchable[] { searchX, searchY });

            Searcher[] searchers = new Searcher[] { full, remote, multi };
            Query[] queries = new Query[] { queryX, queryY, queryA };
            System.Collections.Hashtable[] expected = new System.Collections.Hashtable[] { scoresX, scoresY, scoresA };

            // change sorting and make sure relevancy stays the same
            sort = new Sort();
            AssertScoresPreserved(searchers, queries, expected);

            sort.SetSort(SortField.FIELD_DOC);
            AssertScoresPreserved(searchers, queries, expected);

            sort.SetSort("int");
            AssertScoresPreserved(searchers, queries, expected);

            sort.SetSort("float");
            AssertScoresPreserved(searchers, queries, expected);

            sort.SetSort("string");
            AssertScoresPreserved(searchers, queries, expected);

            sort.SetSort(new System.String[] { "int", "float" });
            AssertScoresPreserved(searchers, queries, expected);

            sort.SetSort(new SortField[] { new SortField("int", true), new SortField(null, SortField.DOC, true) });
            AssertScoresPreserved(searchers, queries, expected);

            sort.SetSort(new System.String[] { "float", "string" });
            AssertScoresPreserved(searchers, queries, expected);
        }

        // For every query (outer loop) and every searcher (inner loop), runs the query
        // with the current sort and checks the scores against expected[queryIndex].
        private void AssertScoresPreserved(Searcher[] searchers, Query[] queries, System.Collections.Hashtable[] expected)
        {
            for (int q = 0; q < queries.Length; ++q)
            {
                for (int s = 0; s < searchers.Length; ++s)
                {
                    ScoreDoc[] hits = searchers[s].Search(queries[q], null, 1000, sort).scoreDocs;
                    AssertSameValues(expected[q], GetScores(hits, searchers[s]));
                }
            }
        }

        [Test]
        public virtual void TestTopDocsScores()
        {
            // There was previously a bug in FieldSortedHitQueue.maxscore when only a single
            // doc was added.  That is what the following tests for.
            Sort relevanceSort = new Sort();
            int nDocs = 10;

            // try to pick a query that will result in an unnormalized
            // score greater than 1 to test for correct normalization
            TopDocs docs1 = full.Search(queryE, null, nDocs, relevanceSort);

            // a filter that only allows through the first hit
            Filter filt = new AnonymousClassFilter(docs1, this);

            TopDocs docs2 = full.Search(queryE, filt, nDocs, relevanceSort);

            Assert.AreEqual(docs1.scoreDocs[0].score, docs2.scoreDocs[0].score, 1e-6);
        }

        // runs a variety of sorts useful for multisearchers
        private void RunMultiSorts(Searcher multi)
        {
            sort.SetSort(SortField.FIELD_DOC);
            AssertMatchesPattern(multi, queryA, sort, "[AB]{2}[CD]{2}[EF]{2}[GH]{2}[IJ]{2}");

            sort.SetSort(new SortField("int", SortField.INT));
            AssertMatchesPattern(multi, queryA, sort, "IDHFGJ[ABE]{3}C");

            sort.SetSort(new SortField[] { new SortField("int", SortField.INT), SortField.FIELD_DOC });
            AssertMatchesPattern(multi, queryA, sort, "IDHFGJ[AB]{2}EC");

            sort.SetSort("int");
            AssertMatchesPattern(multi, queryA, sort, "IDHFGJ[AB]{2}EC");

            sort.SetSort(new SortField[] { new SortField("float", SortField.FLOAT), SortField.FIELD_DOC });
            AssertMatchesPattern(multi, queryA, sort, "GDHJ[CI]{2}EFAB");

            sort.SetSort("float");
            AssertMatchesPattern(multi, queryA, sort, "GDHJ[CI]{2}EFAB");

            sort.SetSort("string");
            AssertMatches(multi, queryA, sort, "DJAIHGFEBC");

            sort.SetSort("int", true);
            AssertMatchesPattern(multi, queryA, sort, "C[AB]{2}EJGFHDI");

            sort.SetSort("float", true);
            AssertMatchesPattern(multi, queryA, sort, "BAFE[IC]{2}JHDG");

            sort.SetSort("string", true);
            AssertMatches(multi, queryA, sort, "CBEFGHIAJD");

            sort.SetSort(new SortField[] { new SortField("string", new System.Globalization.CultureInfo("en-US")) });
            AssertMatches(multi, queryA, sort, "DJAIHGFEBC");

            sort.SetSort(new SortField[] { new SortField("string", new System.Globalization.CultureInfo("en-US"), true) });
            AssertMatches(multi, queryA, sort, "CBEFGHIAJD");

            sort.SetSort(new System.String[] { "int", "float" });
            AssertMatches(multi, queryA, sort, "IDHFGJEABC");

            sort.SetSort(new System.String[] { "float", "string" });
            AssertMatches(multi, queryA, sort, "GDHJICEFAB");

            sort.SetSort("int");
            AssertMatches(multi, queryF, sort, "IZJ");

            sort.SetSort("int", true);
            AssertMatches(multi, queryF, sort, "JZI");

            sort.SetSort("float");
            AssertMatches(multi, queryF, sort, "ZJI");

            sort.SetSort("string");
            AssertMatches(multi, queryF, sort, "ZJI");

            sort.SetSort("string", true);
            AssertMatches(multi, queryF, sort, "IJZ");
        }

        // Runs the query with the given sort (at most 1000 hits) and concatenates the
        // "tracer" values of the hits in result order.
        private System.String CollectTracers(Searcher searcher, Query query, Sort sort)
        {
            ScoreDoc[] result = searcher.Search(query, null, 1000, sort).scoreDocs;
            System.Text.StringBuilder buff = new System.Text.StringBuilder(10);
            for (int i = 0; i < result.Length; ++i)
            {
                Document doc = searcher.Doc(result[i].doc);
                System.String[] v = doc.GetValues("tracer");
                for (int j = 0; j < v.Length; ++j)
                {
                    buff.Append(v[j]);
                }
            }
            return buff.ToString();
        }

        // make sure the documents returned by the search match the expected list
        private void AssertMatches(Searcher searcher, Query query, Sort sort, System.String expectedResult)
        {
            Assert.AreEqual(expectedResult, CollectTracers(searcher, query, sort));
        }

        // make sure the documents returned by the search match the expected list pattern
        private void AssertMatchesPattern(Searcher searcher, Query query, Sort sort, System.String pattern)
        {
            System.String actual = CollectTracers(searcher, query, sort);
            // System.out.println ("matching \""+buff+"\" against pattern \""+pattern+"\"");

            // Anchor the pattern so the whole tracer string must match; an unanchored
            // Regex.Match would also succeed on a mere substring.
            Pattern p = new Pattern(@"\A(?:" + pattern + @")\z");
            Assert.IsTrue(p.Match(actual).Success);
        }

        // Maps the tracer value of every hit to its score (boxed float).
        private System.Collections.Hashtable GetScores(ScoreDoc[] hits, Searcher searcher)
        {
            System.Collections.Hashtable scoreMap = new System.Collections.Hashtable();
            int n = hits.Length;
            for (int i = 0; i < n; ++i)
            {
                Document doc = searcher.Doc(hits[i].doc);
                System.String[] v = doc.GetValues("tracer");
                Assert.AreEqual(1, v.Length);
                scoreMap[v[0]] = (float) hits[i].score;
            }
            return scoreMap;
        }

        // make sure all the values in the maps match
        private void AssertSameValues(System.Collections.Hashtable m1, System.Collections.Hashtable m2)
        {
            Assert.AreEqual(m1.Count, m2.Count);

            // Walk the keys of m1. (The previous code enumerated a brand-new empty
            // Hashtable, so no value was ever compared.)
            foreach (System.Object key in m1.Keys)
            {
                System.Object o1 = m1[key];
                System.Object o2 = m2[key];
                if (o1 is System.Single)
                {
                    // Guard the unboxing below: a key missing from m2 yields null.
                    Assert.IsNotNull(o2, "missing value for key " + key);
                    Assert.AreEqual((float) ((System.Single) o1), (float) ((System.Single) o2), 1e-6);
                }
                else
                {
                    Assert.AreEqual(o1, o2);
                }
            }
        }

        private Lucene.Net.Search.Searchable GetRemote()
        {
            return LookupRemote();
        }

        // Obtains a proxy for the "SortedSearchable" object published on the current port.
        private Lucene.Net.Search.Searchable LookupRemote()
        {
            return (Lucene.Net.Search.Searchable) Activator.GetObject(typeof(Lucene.Net.Search.Searchable), string.Format("http://localhost:{0}/SortedSearchable", port));
        }

        // Picks a random port, stores it in the port field and creates an HTTP channel on it.
        private System.Runtime.Remoting.Channels.Http.HttpChannel GetHttpChannel()
        {
            Random rnd = new Random((int) (DateTime.Now.Ticks & 0x7fffffff));
            // Start at 1024 rather than IPEndPoint.MinPort (0): port 0 would make
            // LookupRemote build a "http://localhost:0/..." URL.
            port = rnd.Next(1024, System.Net.IPEndPoint.MaxPort);
            System.Runtime.Remoting.Channels.Http.HttpChannel ch = new System.Runtime.Remoting.Channels.Http.HttpChannel(port);
            return ch;
        }

        /// <summary>
        /// Registers an HTTP remoting channel on a random port and publishes a searcher
        /// over the full index under the name "SortedSearchable".
        /// </summary>
        public void StartServer()
        {
            System.Runtime.Remoting.Channels.Http.HttpChannel httpChannel = null;

            // Keep trying random ports while the failure is "address already in use" (10048).
            while (httpChannel == null)
            {
                try
                {
                    httpChannel = GetHttpChannel();
                }
                catch (System.Net.Sockets.SocketException ex)
                {
                    if (ex.ErrorCode != 10048)
                    {
                        throw; // rethrow without resetting the stack trace
                    }
                }
            }

            try
            {
                System.Runtime.Remoting.Channels.ChannelServices.RegisterChannel(httpChannel, false);
            }
            catch (System.Net.Sockets.SocketException ex)
            {
                if (ex.ErrorCode == 10048)
                {
                    return; // EADDRINUSE?
                }
                throw; // rethrow without resetting the stack trace
            }

            // construct an index
            Searcher local = GetFullIndex();
            // local.search (queryA, new Sort());

            // publish it
            RemoteSearchable impl = new RemoteSearchable(local);
            System.Runtime.Remoting.RemotingServices.Marshal(impl, "SortedSearchable");
            serverStarted = true;
        }
    }
}