/* * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ using System; using NUnit.Framework; using Analyzer = Lucene.Net.Analysis.Analyzer; using TokenStream = Lucene.Net.Analysis.TokenStream; using TermAttribute = Lucene.Net.Analysis.Tokenattributes.TermAttribute; using Document = Lucene.Net.Documents.Document; using Field = Lucene.Net.Documents.Field; using Directory = Lucene.Net.Store.Directory; using RAMDirectory = Lucene.Net.Store.RAMDirectory; using LuceneTestCase = Lucene.Net.Util.LuceneTestCase; namespace Lucene.Net.Index { /// $Id$ /// class RepeatingTokenStream:TokenStream { public int num; internal TermAttribute termAtt; internal System.String value_Renamed; public RepeatingTokenStream(System.String val) { this.value_Renamed = val; this.termAtt = (TermAttribute) AddAttribute(typeof(TermAttribute)); } public override bool IncrementToken() { num--; if (num >= 0) { ClearAttributes(); termAtt.SetTermBuffer(value_Renamed); return true; } return false; } } public class TestTermdocPerf:LuceneTestCase { private class AnonymousClassAnalyzer:Analyzer { public AnonymousClassAnalyzer(System.Random random, float percentDocs, Lucene.Net.Index.RepeatingTokenStream ts, int maxTF, TestTermdocPerf enclosingInstance) { InitBlock(random, percentDocs, ts, maxTF, enclosingInstance); } private void InitBlock(System.Random random, float percentDocs, Lucene.Net.Index.RepeatingTokenStream ts, int maxTF, TestTermdocPerf enclosingInstance) { this.random = random; this.percentDocs = percentDocs; this.ts = ts; this.maxTF = maxTF; this.enclosingInstance = enclosingInstance; } private System.Random random; private float percentDocs; private Lucene.Net.Index.RepeatingTokenStream ts; private int maxTF; private TestTermdocPerf enclosingInstance; public TestTermdocPerf Enclosing_Instance { get { return enclosingInstance; } } public override TokenStream TokenStream(System.String fieldName, System.IO.TextReader reader) { if ((float) random.NextDouble() < percentDocs) ts.num = random.Next(maxTF) + 1; else ts.num = 0; return ts; } } internal virtual void AddDocs(Directory dir, int ndocs, System.String field, System.String val, int maxTF, float percentDocs) { System.Random random = NewRandom(); RepeatingTokenStream ts = new RepeatingTokenStream(val); Analyzer analyzer = new AnonymousClassAnalyzer(random, percentDocs, ts, maxTF, this); Document doc = new Document(); doc.Add(new Field(field, val, Field.Store.NO, Field.Index.NOT_ANALYZED_NO_NORMS)); IndexWriter writer = new IndexWriter(dir, analyzer, true, IndexWriter.MaxFieldLength.LIMITED); writer.SetMaxBufferedDocs(100); writer.SetMergeFactor(100); for (int i = 0; i < ndocs; i++) { writer.AddDocument(doc); } writer.Optimize(); writer.Close(); } public virtual int doTest(int iter, int ndocs, int maxTF, float percentDocs) { Directory dir = new RAMDirectory(); long start = (DateTime.Now.Ticks / TimeSpan.TicksPerMillisecond); AddDocs(dir, ndocs, "foo", "val", maxTF, percentDocs); long end = (DateTime.Now.Ticks / TimeSpan.TicksPerMillisecond); System.Console.Out.WriteLine("milliseconds for creation of " + ndocs + " docs = " + (end - start)); IndexReader reader = IndexReader.Open(dir); TermEnum tenum = reader.Terms(new Term("foo", "val")); TermDocs tdocs = reader.TermDocs(); start = (DateTime.Now.Ticks / TimeSpan.TicksPerMillisecond); int ret = 0; for (int i = 0; i < iter; i++) { tdocs.Seek(tenum); while (tdocs.Next()) { ret += tdocs.Doc(); } } end = (DateTime.Now.Ticks / TimeSpan.TicksPerMillisecond); System.Console.Out.WriteLine("milliseconds for " + iter + " TermDocs iteration: " + (end - start)); return ret; } [Test] public virtual void TestTermDocPerf() { // performance test for 10% of documents containing a term // doTest(100000, 10000,3,.1f); } } }