# ==================================================================== # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. # ==================================================================== import os from unittest import TestCase from time import time from datetime import timedelta from lucene import \ IndexWriter, SimpleAnalyzer, Document, Field, System, \ Term, TermQuery, IndexSearcher, FSDirectory class FieldLengthTest(TestCase): keywords = ["1", "2"] unindexed = ["Netherlands", "Italy"] unstored = ["Amsterdam has lots of bridges", "Venice has lots of canals"] text = ["Amsterdam", "Venice"] def setUp(self): indexDir = os.path.join(System.getProperty("java.io.tmpdir", "tmp"), "index-dir") self.dir = FSDirectory.getDirectory(indexDir, True) def testFieldSize(self): self.addDocuments(self.dir, 10) self.assertEqual(1, self.getHitCount("contents", "bridges")) self.addDocuments(self.dir, 1) self.assertEqual(0, self.getHitCount("contents", "bridges")) def getHitCount(self, fieldName, searchString): searcher = IndexSearcher(self.dir) t = Term(fieldName, searchString) query = TermQuery(t) hits = searcher.search(query) hitCount = hits.length() searcher.close() return hitCount def addDocuments(self, dir, maxFieldLength): writer = IndexWriter(dir, SimpleAnalyzer(), True) writer.setMaxFieldLength(maxFieldLength) for i in xrange(len(self.keywords)): doc = Document() doc.add(Field("id", self.keywords[i], Field.Store.YES, Field.Index.UN_TOKENIZED)) doc.add(Field("country", self.unindexed[i], Field.Store.YES, Field.Index.NO)) doc.add(Field("contents", self.unstored[i], Field.Store.NO, Field.Index.TOKENIZED)) doc.add(Field("city", self.text[i], Field.Store.YES, Field.Index.TOKENIZED)) writer.addDocument(doc) writer.optimize() writer.close()