com.browseengine.bobo.index.BoboIndexer Maven / Gradle / Ivy
/**
* Bobo Browse Engine - High performance faceted/parametric search implementation
* that handles various types of semi-structured data. Written in Java.
*
* Copyright (C) 2005-2006 John Wang
*
* This library is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* This library is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with this library; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*
* To contact the project administrators for the bobo-browse project,
* please go to https://sourceforge.net/projects/bobo-browse/, or
* send mail to [email protected].
*/
package com.browseengine.bobo.index;
import java.io.IOException;
import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.IndexWriter.MaxFieldLength;
import org.apache.lucene.store.Directory;
import org.apache.lucene.util.Version;
import com.browseengine.bobo.index.digest.DataDigester;
public class BoboIndexer {
private Directory _index;
private DataDigester _digester;
private IndexWriter _writer;
private Analyzer _analyzer;
private static class MyDataHandler implements DataDigester.DataHandler{
private IndexWriter _writer;
MyDataHandler(IndexWriter writer){
_writer=writer;
}
public void handleDocument(Document doc) throws IOException {
_writer.addDocument(doc);
}
}
public void setAnalyzer(Analyzer analyzer){
_analyzer=analyzer;
}
private Analyzer getAnalyzer(){
return _analyzer == null ? new StandardAnalyzer(Version.LUCENE_CURRENT) : _analyzer;
}
public BoboIndexer(DataDigester digester,Directory index){
super();
_index=index;
_digester=digester;
}
public void index() throws IOException{
_writer=null;
try{
_writer=new IndexWriter(_index,getAnalyzer(),MaxFieldLength.UNLIMITED);
MyDataHandler handler=new MyDataHandler(_writer);
_digester.digest(handler);
_writer.optimize();
}
finally{
if (_writer!=null){
_writer.close();
}
}
}
}