/*
* Copyright (c) 2009 Andrejs Jermakovics.
*
* All rights reserved. This program and the accompanying materials
* are made available under the terms of the Eclipse Public License v1.0
* which accompanies this distribution, and is available at
* http://www.eclipse.org/legal/epl-v10.html
*
* Contributors:
* Andrejs Jermakovics - initial implementation
*/
package it.unibz.instasearch.indexing.querying;
import it.unibz.instasearch.indexing.Field;
import org.apache.lucene.index.Term;
import org.apache.lucene.search.BooleanClause;
import org.apache.lucene.search.BooleanClause.Occur;
import org.apache.lucene.search.BooleanQuery;
import org.apache.lucene.search.FuzzyQuery;
import org.apache.lucene.search.PhraseQuery;
import org.apache.lucene.search.PrefixQuery;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.TermQuery;
import org.apache.lucene.search.WildcardQuery;
/**
* Makes the query fuzzy.
* Replaces each TermQuery by Query of the form: term* OR *term* OR term~
*/
public class QueryFuzzifier extends QueryVisitor {
@Override
public Query visit(TermQuery termQuery, Field field) {
if( field != Field.CONTENTS )
return termQuery;
// turn term query into: (term* OR *term* OR term~)
Term term = termQuery.getTerm();
PrefixQuery prefixQuery = new PrefixQuery(term);
prefixQuery.setBoost( termQuery.getBoost() );
Term wildcardTerm = Field.CONTENTS.createTerm("*" + term.text() + "*");
WildcardQuery wildcardQuery = new WildcardQuery(wildcardTerm);
wildcardQuery.setBoost( termQuery.getBoost() * 0.75f );
FuzzyQuery fuzzyQuery = new FuzzyQuery( term );
fuzzyQuery.setBoost( termQuery.getBoost() * 0.5f );
BooleanQuery boolQuery = new BooleanQuery();
boolQuery.add(prefixQuery, Occur.SHOULD);
boolQuery.add(wildcardQuery, Occur.SHOULD);
boolQuery.add(fuzzyQuery, Occur.SHOULD);
boolQuery.setBoost( termQuery.getBoost() );
return boolQuery;
}
@Override
public Query visit(PhraseQuery phraseQuery) {
BooleanQuery bq = new BooleanQuery();
for(Term t: phraseQuery.getTerms()) {
Field f = Field.getByName(t.field());
if( f != Field.CONTENTS )
return phraseQuery;
bq.add(new FuzzyQuery(t), Occur.SHOULD);
}
return bq;
}
@Override
public boolean visit(BooleanClause boolClause) {
if(boolClause.getOccur() == Occur.MUST_NOT) // skip prohibited, don't fuzzify
return false;
return true;
}
}