DataSearchAnalysisConfigurer.java
/*
* Copyright 2010 James Pether Sörling
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
* $Id$
* $HeadURL$
*/
package com.hack23.cia.service.data.impl;
import org.apache.lucene.analysis.core.LowerCaseFilterFactory;
import org.apache.lucene.analysis.en.PorterStemFilterFactory;
import org.apache.lucene.analysis.ngram.NGramFilterFactory;
import org.apache.lucene.analysis.standard.StandardTokenizerFactory;
import org.apache.lucene.analysis.sv.SwedishLightStemFilterFactory;
import org.hibernate.search.backend.lucene.analysis.LuceneAnalysisConfigurationContext;
import org.hibernate.search.backend.lucene.analysis.LuceneAnalysisConfigurer;
/**
 * Lucene analysis configurer that registers the three named custom analyzers
 * used by this module: {@code "ngram"}, {@code "se"} and {@code "en"}.
 *
 * <p>Every analyzer is built from {@link StandardTokenizerFactory} followed by
 * {@link LowerCaseFilterFactory}; they differ only in the final token filter.
 */
public class DataSearchAnalysisConfigurer implements LuceneAnalysisConfigurer {

    /**
     * Registers the analyzers on the supplied context, in the order
     * {@code "ngram"}, {@code "se"}, {@code "en"}.
     *
     * @param context the analysis configuration context the analyzers are defined on
     */
    @Override
    public void configure(final LuceneAnalysisConfigurationContext context) {
        defineNgramAnalyzer(context);
        defineSwedishAnalyzer(context);
        defineEnglishAnalyzer(context);
    }

    /**
     * Defines the {@code "ngram"} analyzer: standard tokenizer, lower-casing,
     * then {@link NGramFilterFactory} with {@code minGramSize} and
     * {@code maxGramSize} both set to {@code "3"}.
     *
     * @param context the analysis configuration context
     */
    private static void defineNgramAnalyzer(final LuceneAnalysisConfigurationContext context) {
        context.analyzer("ngram")
                .custom()
                .tokenizer(StandardTokenizerFactory.class)
                .tokenFilter(LowerCaseFilterFactory.class)
                .tokenFilter(NGramFilterFactory.class)
                .param("minGramSize", "3")
                .param("maxGramSize", "3");
    }

    /**
     * Defines the {@code "se"} analyzer: standard tokenizer, lower-casing,
     * then {@link SwedishLightStemFilterFactory}.
     *
     * @param context the analysis configuration context
     */
    private static void defineSwedishAnalyzer(final LuceneAnalysisConfigurationContext context) {
        context.analyzer("se")
                .custom()
                .tokenizer(StandardTokenizerFactory.class)
                .tokenFilter(LowerCaseFilterFactory.class)
                .tokenFilter(SwedishLightStemFilterFactory.class);
    }

    /**
     * Defines the {@code "en"} analyzer: standard tokenizer, lower-casing,
     * then {@link PorterStemFilterFactory}.
     *
     * @param context the analysis configuration context
     */
    private static void defineEnglishAnalyzer(final LuceneAnalysisConfigurationContext context) {
        context.analyzer("en")
                .custom()
                .tokenizer(StandardTokenizerFactory.class)
                .tokenFilter(LowerCaseFilterFactory.class)
                .tokenFilter(PorterStemFilterFactory.class);
    }
}