/* * * Licensed to the Apache Software Foundation (ASF) under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. The ASF licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY * KIND, either express or implied. See the License for the * specific language governing permissions and limitations * under the License. * */ using System; using System.IO; using System.Text; using System.Collections; using System.Collections.Generic; using Lucene.Net.Analysis; namespace Lucene.Net.Analysis.Fr { /* ==================================================================== * The Apache Software License, Version 1.1 * * Copyright (c) 2004 The Apache Software Foundation. All rights * reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * * 1. Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * * 2. Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in * the documentation and/or other materials provided with the * distribution. * * 3. The end-user documentation included with the redistribution, * if any, must include the following acknowledgment: * "This product includes software developed by the * Apache Software Foundation (http://www.apache.org/)." 
* Alternately, this acknowledgment may appear in the software itself, * if and wherever such third-party acknowledgments normally appear. * * 4. The names "Apache" and "Apache Software Foundation" and * "Apache Lucene" must not be used to endorse or promote products * derived from this software without prior written permission. For * written permission, please contact apache@apache.org. * * 5. Products derived from this software may not be called "Apache", * "Apache Lucene", nor may "Apache" appear in their name, without * prior written permission of the Apache Software Foundation. * * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE * DISCLAIMED. IN NO EVENT SHALL THE APACHE SOFTWARE FOUNDATION OR * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF * USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF * SUCH DAMAGE. * ==================================================================== * * This software consists of voluntary contributions made by many * individuals on behalf of the Apache Software Foundation. For more * information on the Apache Software Foundation, please see * . */ /// /// A filter that stemms french words. It supports a table of words that should /// not be stemmed at all. The used stemmer can be changed at runtime after the /// filter object is created (as long as it is a FrenchStemmer). 
/// <remarks>
/// Author: Patrick Talbot (based on Gerhard Schwarz work for German).
/// Version: $Id: FrenchAnalyzer.java,v 1.2 2004/01/23 20:54:47 ehatcher Exp $
/// </remarks>
public sealed class FrenchStemFilter : TokenFilter
{
    /// <summary>
    /// Stemmer applied to every token that is not excluded. Never null:
    /// it is created in the constructor and <see cref="SetStemmer"/> ignores null.
    /// </summary>
    private FrenchStemmer stemmer = null;

    /// <summary>
    /// Terms that must be passed through unstemmed, or null when no
    /// exclusion table has been supplied.
    /// </summary>
    private ICollection<string> exclusions = null;

    /// <summary>
    /// Builds a FrenchStemFilter over the given stream using a default
    /// <c>FrenchStemmer</c> and no exclusion table.
    /// </summary>
    /// <param name="_in">The token stream to read tokens from.</param>
    public FrenchStemFilter(TokenStream _in)
        : base(_in)
    {
        stemmer = new FrenchStemmer();
    }

    /// <summary>
    /// Builds a FrenchStemFilter that uses an exclusion table.
    /// </summary>
    /// <param name="_in">The token stream to read tokens from.</param>
    /// <param name="exclusiontable">
    /// Terms that should not be stemmed; may be null to disable exclusion.
    /// </param>
    public FrenchStemFilter(TokenStream _in, ICollection<string> exclusiontable)
        : this(_in)
    {
        exclusions = exclusiontable;
    }

    /// <summary>
    /// Returns the next token in the stream, or null at EOS.
    /// </summary>
    /// <returns>
    /// The incoming token itself when it is excluded or when stemming does
    /// not change its text; otherwise a new token carrying the stemmed text
    /// together with the incoming token's offsets and type; null at EOS.
    /// </returns>
    public override Token Next()
    {
        Token token = input.Next();
        if (token == null)
        {
            return null;
        }

        string text = token.TermText();

        // Check the exclusion table: listed terms pass through untouched.
        if (exclusions != null && exclusions.Contains(text))
        {
            return token;
        }

        string stemmed = stemmer.Stem(text);

        // If not stemmed, don't waste the time creating a new token.
        if (stemmed.Equals(text))
        {
            return token;
        }

        // Carry over the incoming token's offsets instead of 0..stemmed.Length:
        // the stemmed text is usually shorter than the source span, and
        // offset consumers need the position of the original word.
        return new Token(stemmed, token.StartOffset(), token.EndOffset(), token.Type());
    }

    /// <summary>
    /// Set an alternative/custom FrenchStemmer for this filter.
    /// </summary>
    /// <param name="stemmer">
    /// The stemmer to use from now on; a null argument is ignored and the
    /// current stemmer is kept.
    /// </param>
    public void SetStemmer(FrenchStemmer stemmer)
    {
        if (stemmer != null)
        {
            this.stemmer = stemmer;
        }
    }

    /// <summary>
    /// Set an alternative exclusion list for this filter.
    /// </summary>
    /// <param name="exclusiontable">
    /// Terms that should not be stemmed; null disables the exclusion check.
    /// </param>
    public void SetExclusionTable(ICollection<string> exclusiontable)
    {
        exclusions = exclusiontable;
    }
} // class FrenchStemFilter
} // namespace Lucene.Net.Analysis.Fr