io.zulia.server.index.ShardWriteManager Maven / Gradle / Ivy
package io.zulia.server.index;
import io.zulia.ZuliaConstants;
import io.zulia.message.ZuliaBase.Metadata;
import io.zulia.server.analysis.ZuliaPerFieldAnalyzer;
import io.zulia.server.config.ServerIndexConfig;
import org.apache.lucene.document.Document;
import org.apache.lucene.facet.FacetsConfig;
import org.apache.lucene.facet.taxonomy.directory.DirectoryTaxonomyReader;
import org.apache.lucene.facet.taxonomy.directory.DirectoryTaxonomyWriter;
import org.apache.lucene.index.DirectoryReader;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.IndexWriterConfig;
import org.apache.lucene.index.KeepOnlyLastCommitDeletionPolicy;
import org.apache.lucene.index.Term;
import org.apache.lucene.store.Directory;
import org.apache.lucene.store.MMapDirectory;
import org.apache.lucene.store.NRTCachingDirectory;
import java.io.IOException;
import java.nio.file.Path;
import java.util.List;
import java.util.concurrent.atomic.AtomicLong;
import java.util.logging.Logger;
public class ShardWriteManager {
private final static Logger LOG = Logger.getLogger(ShardWriteManager.class.getSimpleName());
private final ZuliaPerFieldAnalyzer zuliaPerFieldAnalyzer;
private final FacetsConfig facetsConfig;
private final ShardDocumentIndexer shardDocumentIndexer;
private final ServerIndexConfig indexConfig;
private final int shardNumber;
private final String indexName;
private final AtomicLong counter;
private Long lastCommit;
private Long lastChange;
private IndexWriter indexWriter;
private DirectoryTaxonomyWriter taxoWriter;
public ShardWriteManager(int shardNumber, Path pathToIndex, Path pathToTaxoIndex, FacetsConfig facetsConfig, ServerIndexConfig indexConfig,
ZuliaPerFieldAnalyzer zuliaPerFieldAnalyzer) throws IOException {
this.shardNumber = shardNumber;
this.zuliaPerFieldAnalyzer = zuliaPerFieldAnalyzer;
this.facetsConfig = facetsConfig;
this.indexConfig = indexConfig;
this.indexName = indexConfig.getIndexName();
this.shardDocumentIndexer = new ShardDocumentIndexer(indexConfig);
this.counter = new AtomicLong();
this.lastCommit = null;
this.lastChange = null;
openIndexWriter(pathToIndex);
openTaxoWriter(pathToTaxoIndex);
updateIndexSettings();
}
public int getShardNumber() {
return shardNumber;
}
public ServerIndexConfig getIndexConfig() {
return indexConfig;
}
private void openIndexWriter(Path pathToIndex) throws IOException {
Directory d = MMapDirectory.open(pathToIndex);
IndexWriterConfig config = new IndexWriterConfig(zuliaPerFieldAnalyzer);
config.setIndexDeletionPolicy(new KeepOnlyLastCommitDeletionPolicy());
config.setMaxBufferedDocs(Integer.MAX_VALUE);
config.setRAMBufferSizeMB(128); // should be overwritten by ZuliaShard.updateIndexSettings()
config.setUseCompoundFile(false);
NRTCachingDirectory nrtCachingDirectory = new NRTCachingDirectory(d, 50, 150);
this.indexWriter = new IndexWriter(nrtCachingDirectory, config);
}
private void openTaxoWriter(Path pathToTaxo) throws IOException {
Directory d = MMapDirectory.open(pathToTaxo);
NRTCachingDirectory nrtCachingDirectory = new NRTCachingDirectory(d, 5, 15);
this.taxoWriter = new DirectoryTaxonomyWriter(nrtCachingDirectory);
}
public void close() throws IOException {
if (indexWriter != null) {
Directory directory = indexWriter.getDirectory();
indexWriter.close();
indexWriter = null;
directory.close();
}
if (taxoWriter != null) {
Directory directory = taxoWriter.getDirectory();
taxoWriter.close();
taxoWriter = null;
directory.close();
}
}
public ShardReader createShardReader() throws IOException {
DirectoryReader indexReader = DirectoryReader.open(indexWriter);
DirectoryTaxonomyReader taxoReader = new DirectoryTaxonomyReader(taxoWriter);
taxoReader.setCacheSize(128000);
return new ShardReader(shardNumber, indexReader, taxoReader, facetsConfig, indexConfig, zuliaPerFieldAnalyzer);
}
public void commit() throws IOException {
LOG.info("Committing shard <" + shardNumber + "> for index <" + indexName + ">");
long currentTime = System.currentTimeMillis();
indexWriter.commit();
taxoWriter.commit();
lastCommit = currentTime;
}
public boolean needsIdleCommit() {
long currentTime = System.currentTimeMillis();
Long lastCh = lastChange;
// if changes since started
if (lastCh != null) {
if ((currentTime - lastCh) > (indexConfig.getIndexSettings().getIdleTimeWithoutCommit() * 1000)) {
if ((lastCommit == null) || (lastCh > lastCommit)) {
return true;
}
}
}
return false;
}
public boolean markedChangedCheckIfCommitNeeded() {
lastChange = System.currentTimeMillis();
long count = counter.incrementAndGet();
return (count % indexConfig.getIndexSettings().getShardCommitInterval()) == 0;
}
public void updateIndexSettings() {
int ramBufferMB = indexConfig.getRAMBufferMB() != 0 ? indexConfig.getRAMBufferMB() : 128;
indexWriter.getConfig().setRAMBufferSizeMB(ramBufferMB);
}
public void deleteDocuments(String uniqueId) throws IOException {
Term term = new Term(ZuliaConstants.ID_FIELD, uniqueId);
indexWriter.deleteDocuments(term);
}
public void forceMerge(int maxNumberSegments) throws IOException {
indexWriter.forceMerge(maxNumberSegments);
}
public void deleteAll() throws IOException {
indexWriter.deleteAll();
}
public FacetsConfig getFacetsConfig() {
return facetsConfig;
}
public void indexDocument(String uniqueId, long timestamp, org.bson.Document mongoDocument, List metadataList) throws Exception {
Document luceneDocument = shardDocumentIndexer.getIndexDocument(uniqueId, timestamp, mongoDocument, metadataList);
luceneDocument = facetsConfig.build(taxoWriter, luceneDocument);
Term updateQuery = new Term(ZuliaConstants.ID_FIELD, uniqueId);
indexWriter.updateDocument(updateQuery, luceneDocument);
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy