org.apache.camel.component.lucene.LuceneIndexer Maven / Gradle / Ivy
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.camel.component.lucene;
import java.io.ByteArrayOutputStream;
import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.util.Map;
import java.util.Map.Entry;
import org.apache.camel.Exchange;
import org.apache.camel.util.IOHelper;
import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import org.apache.lucene.document.FieldType;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.IndexWriterConfig;
import org.apache.lucene.index.IndexWriterConfig.OpenMode;
import org.apache.lucene.store.NIOFSDirectory;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
/**
 * Writes documents into a Lucene index kept in an {@link NIOFSDirectory}.
 * <p>
 * Two kinds of content are indexed: the files found under an optional source directory (walked
 * once, from the constructor) and Camel {@link Exchange}s passed to {@link #index(Exchange)}.
 * Every field is written as its own single-field {@link Document}.
 * <p>
 * The {@code indexWriter} field is re-opened and closed around each unit of work and no
 * synchronization is performed here, so callers must not use one instance concurrently.
 */
public class LuceneIndexer {
    private static final Logger LOG = LoggerFactory.getLogger(LuceneIndexer.class);
    private static final FieldType TOKENIZED_FIELD_TYPE = createFieldType(true);
    private static final FieldType NON_TOKENIZED_FIELD_TYPE = createFieldType(false);

    private File sourceDirectory;
    private Analyzer analyzer;
    private NIOFSDirectory niofsDirectory;
    private IndexWriter indexWriter;
    private boolean sourceDirectoryIndexed;

    /**
     * Creates the indexer and, when a source directory is given, indexes its files immediately.
     *
     * @param sourceDirectory file or directory whose readable files are indexed right away;
     *                        may be {@code null} to skip this step
     * @param indexDirectory  directory holding the index; when {@code null} the relative path
     *                        {@code ./indexDirectory} is used
     * @param analyzer        analyzer handed to every index writer this instance opens
     * @throws Exception if the index directory cannot be opened or indexing the source
     *                   directory fails
     */
    public LuceneIndexer(File sourceDirectory, File indexDirectory, Analyzer analyzer) throws Exception {
        if (indexDirectory != null) {
            if (!indexDirectory.exists()) {
                boolean result = indexDirectory.mkdir();
                if (!result) {
                    // Only logged: the directory may have been created concurrently by someone else.
                    LOG.error("mkdir failed for {}. Maybe this folder was created externally", indexDirectory);
                }
            }
            this.setNiofsDirectory(new NIOFSDirectory(indexDirectory.toPath()));
        } else {
            this.setNiofsDirectory(new NIOFSDirectory(new File("./indexDirectory").toPath()));
        }

        this.setAnalyzer(analyzer);

        // sourceDirectoryIndexed is still false at this point; the flag records that the
        // one-off walk of the source directory has been done.
        if (sourceDirectory != null && !sourceDirectoryIndexed) {
            this.setSourceDirectory(sourceDirectory);
            add(getSourceDirectory());
            sourceDirectoryIndexed = true;
        }
    }

    /**
     * Indexes one exchange: its id under {@code exchangeId}, every inbound header under the
     * header's name (value converted to {@code String}) and the inbound body under
     * {@code contents}.
     * <p>
     * All documents are committed together. If anything fails before the commit completes, the
     * writer is rolled back so that it is closed and none of the documents of this exchange
     * are kept.
     *
     * @param exchange the exchange to index
     * @throws Exception if a header or the body cannot be converted to {@code String}, or the
     *                   index cannot be written
     */
    public void index(Exchange exchange) throws Exception {
        LOG.debug("Indexing {}", exchange);
        openIndexWriter();
        boolean committed = false;
        try {
            Map<String, Object> headers = exchange.getIn().getHeaders();
            add("exchangeId", exchange.getExchangeId(), true);
            for (Entry<String, Object> entry : headers.entrySet()) {
                String field = entry.getKey();
                String value = exchange.getContext().getTypeConverter().mandatoryConvertTo(String.class, entry.getValue());
                add(field, value, true);
            }
            add("contents", exchange.getIn().getMandatoryBody(String.class), true);
            closeIndexWriter();
            committed = true;
        } finally {
            if (!committed) {
                rollbackIndexWriter();
            }
        }
    }

    /**
     * @return the directory the index is stored in
     */
    public NIOFSDirectory getNiofsDirectory() {
        return niofsDirectory;
    }

    /**
     * @param niofsDirectory the directory the index is stored in
     */
    public void setNiofsDirectory(NIOFSDirectory niofsDirectory) {
        this.niofsDirectory = niofsDirectory;
    }

    /**
     * @return the source directory given to the constructor, or {@code null} if none was set
     */
    public File getSourceDirectory() {
        return sourceDirectory;
    }

    /**
     * Stores the source directory. Calling this setter does not trigger any indexing.
     *
     * @param sourceDirectory the source directory
     */
    public void setSourceDirectory(File sourceDirectory) {
        this.sourceDirectory = sourceDirectory;
    }

    /**
     * @return the analyzer used when opening index writers
     */
    public Analyzer getAnalyzer() {
        return analyzer;
    }

    /**
     * @param analyzer the analyzer used when opening index writers
     */
    public void setAnalyzer(Analyzer analyzer) {
        this.analyzer = analyzer;
    }

    /**
     * Adds a document consisting of a single field to the currently open index writer.
     *
     * @param field    field name
     * @param value    field value
     * @param analyzed {@code true} to use the tokenized field type, {@code false} for the
     *                 non-tokenized one
     * @throws IOException if the writer rejects the document
     */
    private void add(String field, String value, boolean analyzed) throws IOException {
        if (LOG.isTraceEnabled()) {
            LOG.trace("Adding field: {}", field);
            LOG.trace(" value: {}", value);
        }

        Document doc = new Document();
        doc.add(new Field(field, value, analyzed ? TOKENIZED_FIELD_TYPE : NON_TOKENIZED_FIELD_TYPE));
        indexWriter.addDocument(doc);
    }

    /**
     * Indexes a file, or recursively every readable file below a directory.
     * <p>
     * For each regular file a non-tokenized {@code path} document and a tokenized
     * {@code contents} document are written and committed together. Unreadable files and
     * directories are skipped with a warning.
     *
     * @param file the file or directory to index
     * @throws IOException if a file cannot be read or the index cannot be written
     */
    private void add(File file) throws IOException {
        if (!file.canRead()) {
            LOG.warn("Directory/File {} could not be read."
                     + " This directory will not be indexed. Please check permissions and rebuild indexes.",
                    file.getAbsolutePath());
            return;
        }

        if (file.isDirectory()) {
            String[] files = file.list();
            if (files != null) {
                for (String child : files) {
                    // Children are resolved against the absolute parent path, so the indexed
                    // "path" of nested files is absolute.
                    add(new File(file.getAbsolutePath(), child));
                }
            }
            return;
        }

        LOG.trace("Adding {}", file);

        // The whole file is read into memory and decoded with the JVM's default charset.
        String contents;
        try (InputStream is = new FileInputStream(file)) {
            ByteArrayOutputStream bos = new ByteArrayOutputStream();
            IOHelper.copy(IOHelper.buffered(is), bos);
            contents = bos.toString();
        }

        openIndexWriter();
        boolean committed = false;
        try {
            add("path", file.getPath(), false);
            add("contents", contents, true);
            closeIndexWriter();
            committed = true;
        } finally {
            if (!committed) {
                rollbackIndexWriter();
            }
        }
        LOG.trace("Added {} successfully", file);
    }

    /**
     * Opens a new index writer on the index directory and stores it in {@code indexWriter}.
     *
     * @throws IOException if the writer cannot be created
     */
    private void openIndexWriter() throws IOException {
        // use create or append so we can reuse existing index if already exists
        IndexWriterConfig indexWriterConfig
                = new IndexWriterConfig(getAnalyzer()).setOpenMode(OpenMode.CREATE_OR_APPEND);
        indexWriter = new IndexWriter(niofsDirectory, indexWriterConfig);
    }

    /**
     * Commits the pending documents and closes the current index writer.
     *
     * @throws IOException if committing or closing fails
     */
    private void closeIndexWriter() throws IOException {
        indexWriter.commit();
        indexWriter.close();
    }

    /**
     * Rolls back the current index writer after a failed unit of work, which discards the
     * uncommitted documents and closes the writer. Without this the writer would stay open and
     * keep holding the index write lock, making later attempts to open a writer fail.
     * <p>
     * Failures of the rollback itself are only logged so that they do not hide the exception
     * that caused the rollback.
     */
    private void rollbackIndexWriter() {
        try {
            indexWriter.rollback();
        } catch (Exception e) {
            LOG.warn("Failed to roll back index writer after an indexing failure", e);
        }
    }

    /**
     * Builds one of the two immutable field types shared by all documents.
     *
     * @param tokenized whether field values of this type are tokenized
     * @return a frozen, stored field type
     */
    private static FieldType createFieldType(boolean tokenized) {
        FieldType answer = new FieldType();
        // NOTE(review): a former setIndexed(true) call was commented out here and no index
        // options are set in its place; confirm that fields built from this type are still
        // searchable (not merely stored) with the Lucene version in use.
        answer.setStored(true);
        answer.setTokenized(tokenized);
        // freeze the answer so that it becomes immutable
        answer.freeze();
        return answer;
    }
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy