/* * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ using System; using System.Collections.Generic; using Lucene.Net.Util; using NUnit.Framework; using Analyzer = Lucene.Net.Analysis.Analyzer; using TokenStream = Lucene.Net.Analysis.TokenStream; using StandardAnalyzer = Lucene.Net.Analysis.Standard.StandardAnalyzer; using Document = Lucene.Net.Documents.Document; using Field = Lucene.Net.Documents.Field; using IndexWriter = Lucene.Net.Index.IndexWriter; using Directory = Lucene.Net.Store.Directory; using RAMDirectory = Lucene.Net.Store.RAMDirectory; using BaseTokenStreamTestCase = Lucene.Net.Test.Analysis.BaseTokenStreamTestCase; using BooleanClause = Lucene.Net.Search.BooleanClause; using IndexSearcher = Lucene.Net.Search.IndexSearcher; using Query = Lucene.Net.Search.Query; using ScoreDoc = Lucene.Net.Search.ScoreDoc; using Occur = Lucene.Net.Search.Occur; namespace Lucene.Net.QueryParsers { /// Tests QueryParser. [TestFixture] public class TestMultiFieldQueryParser : LuceneTestCase { /// test stop words arsing for both the non static form, and for the /// corresponding static form (qtxt, fields[]). /// public virtual void tesStopwordsParsing() { AssertStopQueryEquals("one", "b:one t:one"); AssertStopQueryEquals("one stop", "b:one t:one"); AssertStopQueryEquals("one (stop)", "b:one t:one"); AssertStopQueryEquals("one ((stop))", "b:one t:one"); AssertStopQueryEquals("stop", ""); AssertStopQueryEquals("(stop)", ""); AssertStopQueryEquals("((stop))", ""); } // verify parsing of query using a stopping analyzer private void AssertStopQueryEquals(string qtxt, string expectedRes) { string[] fields = new string[]{"b", "t"}; Occur[] occur = new Occur[]{Occur.SHOULD, Occur.SHOULD}; TestQueryParser.QPTestAnalyzer a = new TestQueryParser.QPTestAnalyzer(); MultiFieldQueryParser mfqp = new MultiFieldQueryParser(Util.Version.LUCENE_CURRENT, fields, a); Query q = mfqp.Parse(qtxt); Assert.AreEqual(expectedRes, q.ToString()); q = MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, qtxt, fields, occur, a); Assert.AreEqual(expectedRes, q.ToString()); } [Test] public virtual void TestSimple() { string[] fields = new string[]{"b", "t"}; MultiFieldQueryParser mfqp = new MultiFieldQueryParser(Util.Version.LUCENE_CURRENT, fields, new StandardAnalyzer(Util.Version.LUCENE_CURRENT)); Query q = mfqp.Parse("one"); Assert.AreEqual("b:one t:one", q.ToString()); q = mfqp.Parse("one two"); Assert.AreEqual("(b:one t:one) (b:two t:two)", q.ToString()); q = mfqp.Parse("+one +two"); Assert.AreEqual("+(b:one t:one) +(b:two t:two)", q.ToString()); q = mfqp.Parse("+one -two -three"); Assert.AreEqual("+(b:one t:one) -(b:two t:two) -(b:three t:three)", q.ToString()); q = mfqp.Parse("one^2 two"); Assert.AreEqual("((b:one t:one)^2.0) (b:two t:two)", q.ToString()); q = mfqp.Parse("one~ two"); Assert.AreEqual("(b:one~0.5 t:one~0.5) (b:two t:two)", q.ToString()); q = mfqp.Parse("one~0.8 two^2"); Assert.AreEqual("(b:one~0.8 t:one~0.8) ((b:two t:two)^2.0)", q.ToString()); q = mfqp.Parse("one* two*"); Assert.AreEqual("(b:one* t:one*) (b:two* t:two*)", q.ToString()); q = mfqp.Parse("[a TO c] two"); Assert.AreEqual("(b:[a TO c] t:[a TO c]) (b:two t:two)", q.ToString()); q = mfqp.Parse("w?ldcard"); Assert.AreEqual("b:w?ldcard t:w?ldcard", q.ToString()); q = mfqp.Parse("\"foo bar\""); Assert.AreEqual("b:\"foo bar\" t:\"foo bar\"", q.ToString()); q = mfqp.Parse("\"aa bb cc\" \"dd ee\""); Assert.AreEqual("(b:\"aa bb cc\" t:\"aa bb cc\") (b:\"dd ee\" t:\"dd ee\")", q.ToString()); q = mfqp.Parse("\"foo bar\"~4"); Assert.AreEqual("b:\"foo bar\"~4 t:\"foo bar\"~4", q.ToString()); // LUCENE-1213: MultiFieldQueryParser was ignoring slop when phrase had a field. q = mfqp.Parse("b:\"foo bar\"~4"); Assert.AreEqual("b:\"foo bar\"~4", q.ToString()); // make sure that terms which have a field are not touched: q = mfqp.Parse("one f:two"); Assert.AreEqual("(b:one t:one) f:two", q.ToString()); // AND mode: mfqp.DefaultOperator = QueryParser.AND_OPERATOR; q = mfqp.Parse("one two"); Assert.AreEqual("+(b:one t:one) +(b:two t:two)", q.ToString()); q = mfqp.Parse("\"aa bb cc\" \"dd ee\""); Assert.AreEqual("+(b:\"aa bb cc\" t:\"aa bb cc\") +(b:\"dd ee\" t:\"dd ee\")", q.ToString()); } [Test] public virtual void TestBoostsSimple() { IDictionary boosts = new Dictionary(); boosts["b"] = (float) 5; boosts["t"] = (float) 10; string[] fields = new string[]{"b", "t"}; MultiFieldQueryParser mfqp = new MultiFieldQueryParser(Util.Version.LUCENE_CURRENT, fields, new StandardAnalyzer(Util.Version.LUCENE_CURRENT), boosts); //Check for simple Query q = mfqp.Parse("one"); Assert.AreEqual("b:one^5.0 t:one^10.0", q.ToString()); //Check for AND q = mfqp.Parse("one AND two"); Assert.AreEqual("+(b:one^5.0 t:one^10.0) +(b:two^5.0 t:two^10.0)", q.ToString()); //Check for OR q = mfqp.Parse("one OR two"); Assert.AreEqual("(b:one^5.0 t:one^10.0) (b:two^5.0 t:two^10.0)", q.ToString()); //Check for AND and a field q = mfqp.Parse("one AND two AND foo:test"); Assert.AreEqual("+(b:one^5.0 t:one^10.0) +(b:two^5.0 t:two^10.0) +foo:test", q.ToString()); q = mfqp.Parse("one^3 AND two^4"); Assert.AreEqual("+((b:one^5.0 t:one^10.0)^3.0) +((b:two^5.0 t:two^10.0)^4.0)", q.ToString()); } [Test] public virtual void TestStaticMethod1() { var fields = new []{"b", "t"}; var queries = new [] { "one", "two" }; Query q = MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, queries, fields, new StandardAnalyzer(Util.Version.LUCENE_CURRENT)); Assert.AreEqual("b:one t:two", q.ToString()); var queries2 = new [] { "+one", "+two" }; q = MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, queries2, fields, new StandardAnalyzer(Util.Version.LUCENE_CURRENT)); Assert.AreEqual("(+b:one) (+t:two)", q.ToString()); var queries3 = new [] { "one", "+two" }; q = MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, queries3, fields, new StandardAnalyzer(Util.Version.LUCENE_CURRENT)); Assert.AreEqual("b:one (+t:two)", q.ToString()); var queries4 = new [] { "one +more", "+two" }; q = MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, queries4, fields, new StandardAnalyzer(Util.Version.LUCENE_CURRENT)); Assert.AreEqual("(b:one +b:more) (+t:two)", q.ToString()); var queries5 = new [] { "blah" }; Assert.Throws(() => MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, queries5, fields, new StandardAnalyzer(Util.Version.LUCENE_CURRENT))); // check also with stop words for this static form (qtxts[], fields[]). var stopA = new TestQueryParser.QPTestAnalyzer(); var queries6 = new [] { "((+stop))", "+((stop))" }; q = MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, queries6, fields, stopA); Assert.AreEqual("", q.ToString()); var queries7 = new [] { "one ((+stop)) +more", "+((stop)) +two" }; q = MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, queries7, fields, stopA); Assert.AreEqual("(b:one +b:more) (+t:two)", q.ToString()); } [Test] public virtual void TestStaticMethod2() { string[] fields = new []{"b", "t"}; Occur[] flags = new []{Occur.MUST, Occur.MUST_NOT}; Query q = MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, "one", fields, flags, new StandardAnalyzer(Util.Version.LUCENE_CURRENT)); Assert.AreEqual("+b:one -t:one", q.ToString()); q = MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, "one two", fields, flags, new StandardAnalyzer(Util.Version.LUCENE_CURRENT)); Assert.AreEqual("+(b:one b:two) -(t:one t:two)", q.ToString()); Occur[] flags2 = new []{Occur.MUST}; Assert.Throws( () => MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, "blah", fields, flags2, new StandardAnalyzer(Util.Version.LUCENE_CURRENT))); } [Test] public virtual void TestStaticMethod2Old() { var fields = new[] { "b", "t" }; //int[] flags = {MultiFieldQueryParser.REQUIRED_FIELD, MultiFieldQueryParser.PROHIBITED_FIELD}; var flags = new[] { Occur.MUST, Occur.MUST_NOT }; var parser = new MultiFieldQueryParser(Util.Version.LUCENE_CURRENT, fields, new StandardAnalyzer(Util.Version.LUCENE_CURRENT)); Query q = MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, "one", fields, flags, new StandardAnalyzer(Util.Version.LUCENE_CURRENT)); //, fields, flags, new StandardAnalyzer(Util.Version.LUCENE_CURRENT)); Assert.AreEqual("+b:one -t:one", q.ToString()); q = MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, "one two", fields, flags, new StandardAnalyzer(Util.Version.LUCENE_CURRENT)); Assert.AreEqual("+(b:one b:two) -(t:one t:two)", q.ToString()); var flags2 = new []{Occur.MUST}; Assert.Throws( () => MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, "blah", fields, flags2, new StandardAnalyzer(Util.Version.LUCENE_CURRENT))); } [Test] public virtual void TestStaticMethod3() { var queries = new [] { "one", "two", "three" }; var fields = new [] { "f1", "f2", "f3" }; var flags = new [] { Occur.MUST, Occur.MUST_NOT, Occur.SHOULD }; var q = MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, queries, fields, flags, new StandardAnalyzer(Util.Version.LUCENE_CURRENT)); Assert.AreEqual("+f1:one -f2:two f3:three", q.ToString()); var flags2 = new[] { Occur.MUST }; Assert.Throws( () => MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, queries, fields, flags2, new StandardAnalyzer(Util.Version.LUCENE_CURRENT))); } [Test] public virtual void TestStaticMethod3Old() { var queries = new [] { "one", "two" }; var fields = new [] { "b", "t" }; var flags = new [] { Occur.MUST, Occur.MUST_NOT }; var q = MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, queries, fields, flags, new StandardAnalyzer(Util.Version.LUCENE_CURRENT)); Assert.AreEqual("+b:one -t:two", q.ToString()); var flags2 = new []{Occur.MUST}; Assert.Throws( () => MultiFieldQueryParser.Parse(Util.Version.LUCENE_CURRENT, queries, fields, flags2, new StandardAnalyzer(Util.Version.LUCENE_CURRENT))); } [Test] public virtual void TestAnalyzerReturningNull() { var fields = new string[]{"f1", "f2", "f3"}; var parser = new MultiFieldQueryParser(Util.Version.LUCENE_CURRENT, fields, new AnalyzerReturningNull()); var q = parser.Parse("bla AND blo"); Assert.AreEqual("+(f2:bla f3:bla) +(f2:blo f3:blo)", q.ToString()); // the following queries are not affected as their terms are not analyzed anyway: q = parser.Parse("bla*"); Assert.AreEqual("f1:bla* f2:bla* f3:bla*", q.ToString()); q = parser.Parse("bla~"); Assert.AreEqual("f1:bla~0.5 f2:bla~0.5 f3:bla~0.5", q.ToString()); q = parser.Parse("[a TO c]"); Assert.AreEqual("f1:[a TO c] f2:[a TO c] f3:[a TO c]", q.ToString()); } [Test] public virtual void TestStopWordSearching() { Analyzer analyzer = new StandardAnalyzer(Util.Version.LUCENE_CURRENT); Directory ramDir = new RAMDirectory(); var iw = new IndexWriter(ramDir, analyzer, true, IndexWriter.MaxFieldLength.LIMITED); var doc = new Document(); doc.Add(new Field("body", "blah the footest blah", Field.Store.NO, Field.Index.ANALYZED)); iw.AddDocument(doc); iw.Close(); var mfqp = new MultiFieldQueryParser(Util.Version.LUCENE_CURRENT, new[] { "body" }, analyzer); mfqp.DefaultOperator = QueryParser.Operator.AND; var q = mfqp.Parse("the footest"); var is_Renamed = new IndexSearcher(ramDir, true); var hits = is_Renamed.Search(q, null, 1000).ScoreDocs; Assert.AreEqual(1, hits.Length); is_Renamed.Close(); } [Test(Description = "LUCENENET-513")] public virtual void TestParsingQueryWithoutBoosts() { var analyzer = new StandardAnalyzer(Util.Version.LUCENE_CURRENT); var fields = new[] {"f1", "f2"}; var boosts = new Dictionary { {"f1", 2} // missing f2 intentional }; var parser = new MultiFieldQueryParser(Util.Version.LUCENE_CURRENT, fields, analyzer, boosts); var query = parser.Parse("bazinga"); Assert.AreEqual("f1:bazinga^2.0 f2:bazinga", query.ToString()); } /// Return empty tokens for field "f1". private class AnalyzerReturningNull:Analyzer { internal StandardAnalyzer stdAnalyzer = new StandardAnalyzer(Util.Version.LUCENE_CURRENT); public AnalyzerReturningNull() { } public override TokenStream TokenStream(string fieldName, System.IO.TextReader reader) { if ("f1".Equals(fieldName)) { return new EmptyTokenStream(); } else { return stdAnalyzer.TokenStream(fieldName, reader); } } private class EmptyTokenStream:TokenStream { public override bool IncrementToken() { return false; } protected override void Dispose(bool disposing) { // Do nothing } } } } }