package org.apache.lucene.analysis.pattern; /* * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ import java.io.Reader; import java.util.Map; import java.util.regex.Pattern; import org.apache.lucene.analysis.CharFilter; import org.apache.lucene.analysis.pattern.PatternReplaceCharFilter; import org.apache.lucene.analysis.util.CharFilterFactory; /** * Factory for {@link PatternReplaceCharFilter}. * <pre class="prettyprint" > * <fieldType name="text_ptnreplace" class="solr.TextField" positionIncrementGap="100"> * <analyzer> * <charFilter class="solr.PatternReplaceCharFilterFactory" * pattern="([^a-z])" replacement=""/> * <tokenizer class="solr.KeywordTokenizerFactory"/> * </analyzer> * </fieldType></pre> * * * @since Solr 3.1 */ public class PatternReplaceCharFilterFactory extends CharFilterFactory { private Pattern p; private String replacement; private int maxBlockChars; private String blockDelimiters; @Override public void init(Map<String, String> args) { super.init( args ); p = getPattern("pattern"); replacement = args.get( "replacement" ); if( replacement == null ) replacement = ""; // TODO: warn if you set maxBlockChars or blockDelimiters ? maxBlockChars = getInt( "maxBlockChars", PatternReplaceCharFilter.DEFAULT_MAX_BLOCK_CHARS ); blockDelimiters = args.get( "blockDelimiters" ); } public CharFilter create(Reader input) { return new PatternReplaceCharFilter( p, replacement, maxBlockChars, blockDelimiters, input ); } }