Package it.unibz.instasearch.indexing.querying

Source Code of it.unibz.instasearch.indexing.querying.QueryFuzzifier

/*
* Copyright (c) 2009 Andrejs Jermakovics.
*
* All rights reserved. This program and the accompanying materials
* are made available under the terms of the Eclipse Public License v1.0
* which accompanies this distribution, and is available at
* http://www.eclipse.org/legal/epl-v10.html
*
* Contributors:
*     Andrejs Jermakovics - initial implementation
*/
package it.unibz.instasearch.indexing.querying;

import it.unibz.instasearch.indexing.Field;

import org.apache.lucene.index.Term;
import org.apache.lucene.search.BooleanClause;
import org.apache.lucene.search.BooleanClause.Occur;
import org.apache.lucene.search.BooleanQuery;
import org.apache.lucene.search.FuzzyQuery;
import org.apache.lucene.search.PhraseQuery;
import org.apache.lucene.search.PrefixQuery;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.TermQuery;
import org.apache.lucene.search.WildcardQuery;

/**
* Makes the query fuzzy.
* Replaces each TermQuery by Query of the form: term* OR *term* OR term~
*/
public class QueryFuzzifier extends QueryVisitor {
 
  @Override
  public Query visit(TermQuery termQuery, Field field) {
   
    if( field != Field.CONTENTS )
      return termQuery;
   
    // turn term query into: (term* OR *term* OR term~)
   
    Term term = termQuery.getTerm();
   
    PrefixQuery prefixQuery = new PrefixQuery(term);
    prefixQuery.setBoost( termQuery.getBoost() );
   
    Term wildcardTerm = Field.CONTENTS.createTerm("*" + term.text() + "*");
    WildcardQuery wildcardQuery = new WildcardQuery(wildcardTerm);
    wildcardQuery.setBoost( termQuery.getBoost() * 0.75f );
   
    FuzzyQuery fuzzyQuery = new FuzzyQuery( term );
    fuzzyQuery.setBoost( termQuery.getBoost() * 0.5f );
   
    BooleanQuery boolQuery = new BooleanQuery();
    boolQuery.add(prefixQuery,     Occur.SHOULD);
    boolQuery.add(wildcardQuery,   Occur.SHOULD);
    boolQuery.add(fuzzyQuery,     Occur.SHOULD);
    boolQuery.setBoost( termQuery.getBoost() );
   
    return boolQuery;
  }
 
  @Override
  public Query visit(PhraseQuery phraseQuery) {
    BooleanQuery bq = new BooleanQuery();
   
    for(Term t: phraseQuery.getTerms()) {
      Field f = Field.getByName(t.field());
     
      if( f != Field.CONTENTS )
        return phraseQuery;
     
      bq.add(new FuzzyQuery(t), Occur.SHOULD);
    }
   
    return bq;
  }
 
  @Override
  public boolean visit(BooleanClause boolClause) {
    if(boolClause.getOccur() == Occur.MUST_NOT) // skip prohibited, don't fuzzify
      return false;
   
    return true;
  }
 
}
TOP

Related Classes of it.unibz.instasearch.indexing.querying.QueryFuzzifier

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.