/** * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ using System.IO; using System.Collections; using Lucene.Net.Analysis; using Lucene.Net.Analysis.Tokenattributes; using Lucene.Net.Util; namespace Lucene.Net.Analysis.AR { /** * A {@link TokenFilter} that applies {@link ArabicNormalizer} to normalize the orthography. * */ public class ArabicNormalizationFilter : TokenFilter { protected ArabicNormalizer normalizer = null; private TermAttribute termAtt; public ArabicNormalizationFilter(TokenStream input) : base(input) { normalizer = new ArabicNormalizer(); termAtt = (TermAttribute)AddAttribute(typeof(TermAttribute)); } public override bool IncrementToken() { if (input.IncrementToken()) { int newlen = normalizer.Normalize(termAtt.TermBuffer(), termAtt.TermLength()); termAtt.SetTermLength(newlen); return true; } else { return false; } } } }