com.palantir.atlasdb.table.description.render.StreamStoreRenderer Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of atlasdb-client Show documentation
Show all versions of atlasdb-client Show documentation
Palantir open source project
/*
* (c) Copyright 2018 Palantir Technologies Inc. All rights reserved.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.palantir.atlasdb.table.description.render;
import com.google.common.base.Functions;
import com.google.common.base.Preconditions;
import com.google.common.collect.ArrayListMultimap;
import com.google.common.collect.Collections2;
import com.google.common.collect.HashMultimap;
import com.google.common.collect.ImmutableMap;
import com.google.common.collect.ImmutableSet;
import com.google.common.collect.Lists;
import com.google.common.collect.Maps;
import com.google.common.collect.Multimap;
import com.google.common.collect.Multimaps;
import com.google.common.collect.Sets;
import com.google.common.io.ByteStreams;
import com.google.common.io.CountingInputStream;
import com.google.common.primitives.Ints;
import com.google.protobuf.ByteString;
import com.palantir.atlasdb.keyvalue.api.Cell;
import com.palantir.atlasdb.protos.generated.StreamPersistence.Status;
import com.palantir.atlasdb.protos.generated.StreamPersistence.StreamMetadata;
import com.palantir.atlasdb.stream.AbstractPersistentStreamStore;
import com.palantir.atlasdb.stream.BlockConsumingInputStream;
import com.palantir.atlasdb.stream.BlockGetter;
import com.palantir.atlasdb.stream.BlockLoader;
import com.palantir.atlasdb.stream.PersistentStreamStore;
import com.palantir.atlasdb.stream.StreamCleanedException;
import com.palantir.atlasdb.stream.StreamStorePersistenceConfiguration;
import com.palantir.atlasdb.table.description.ValueType;
import com.palantir.atlasdb.transaction.api.Transaction;
import com.palantir.atlasdb.transaction.api.TransactionFailedRetriableException;
import com.palantir.atlasdb.transaction.api.TransactionManager;
import com.palantir.atlasdb.transaction.api.TransactionTask;
import com.palantir.atlasdb.transaction.impl.TxTask;
import com.palantir.common.base.Throwables;
import com.palantir.common.compression.StreamCompression;
import com.palantir.common.io.ConcatenatedInputStream;
import com.palantir.logsafe.SafeArg;
import com.palantir.logsafe.logger.SafeLogger;
import com.palantir.logsafe.logger.SafeLoggerFactory;
import com.palantir.util.AssertUtils;
import com.palantir.util.ByteArrayIOStream;
import com.palantir.util.Pair;
import com.palantir.util.crypto.Sha256Hash;
import com.palantir.util.file.DeleteOnCloseFileInputStream;
import com.palantir.util.file.TempFileUtils;
import java.io.BufferedInputStream;
import java.io.ByteArrayInputStream;
import java.io.File;
import java.io.FileNotFoundException;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.security.DigestInputStream;
import java.security.MessageDigest;
import java.util.Arrays;
import java.util.Collection;
import java.util.HashMap;
import java.util.HashSet;
import java.util.List;
import java.util.Map;
import java.util.Optional;
import java.util.Set;
import java.util.concurrent.TimeUnit;
import java.util.function.BiConsumer;
import java.util.function.Supplier;
import javax.annotation.CheckForNull;
import javax.annotation.Generated;
@SuppressWarnings("checkstyle:all") // too many warnings to fix
public class StreamStoreRenderer {
private final String name;
private final ValueType streamIdType;
private final String packageName;
private final String schemaName;
private final int inMemoryThreshold;
private final StreamCompression streamCompression;
public StreamStoreRenderer(
String name,
ValueType streamIdType,
String packageName,
String schemaName,
int inMemoryThreshold,
StreamCompression streamCompression) {
this.name = name;
this.streamIdType = streamIdType;
this.packageName = packageName;
this.schemaName = schemaName;
this.inMemoryThreshold = inMemoryThreshold;
this.streamCompression = streamCompression;
}
public String getPackageName() {
return packageName;
}
public String getStreamStoreClassName() {
return name + "StreamStore";
}
public String getIndexCleanupTaskClassName() {
return name + "IndexCleanupTask";
}
public String getMetadataCleanupTaskClassName() {
return name + "MetadataCleanupTask";
}
public String renderStreamStore() {
final String StreamStore = name + "StreamStore";
final String StreamValueTable = name + "StreamValueTable";
final String StreamValueRow = StreamValueTable + "." + name + "StreamValueRow";
final String StreamMetadataTable = name + "StreamMetadataTable";
final String StreamMetadataRow = StreamMetadataTable + "." + name + "StreamMetadataRow";
final String StreamHashAidxTable = name + "StreamHashAidxTable";
final String StreamHashAidxRow = StreamHashAidxTable + "." + name + "StreamHashAidxRow";
final String StreamHashAidxColumn = StreamHashAidxTable + "." + name + "StreamHashAidxColumn";
final String StreamHashAidxColumnValue = StreamHashAidxTable + "." + name + "StreamHashAidxColumnValue";
final String StreamIdxTable = name + "StreamIdxTable";
final String StreamIdxRow = StreamIdxTable + "." + name + "StreamIdxRow";
final String StreamIdxColumn = StreamIdxTable + "." + name + "StreamIdxColumn";
final String StreamIdxColumnValue = StreamIdxTable + "." + name + "StreamIdxColumnValue";
final String TableFactory = schemaName + "TableFactory";
final String StreamId = streamIdType.getJavaObjectClassName();
return new Renderer() {
@Override
protected void run() {
ImportRenderer importRenderer = new ImportRenderer(this, Arrays.asList(IMPORTS));
line("package ", packageName, ";");
line();
importRenderer.renderImports();
line("@Generated(\"", StreamStoreRenderer.class.getName(), "\")");
line("@SuppressWarnings({\"all\", \"deprecation\"})");
line("public final class ", StreamStore, " extends AbstractPersistentStreamStore", " {");
{
fields();
line();
constructors();
line();
getInMemoryThreshold();
line();
storeBlock();
line();
touchMetadataWhileStoringForConflicts();
line();
putMetadataAndHashIndexTask();
line();
getNumberOfBlocksFromMetadata();
line();
createTempFile();
line();
loadSingleBlockToOutputStream();
line();
getBlock();
line();
getMetadata();
line();
lookupStreamIdsByHash();
line();
getHashIndexRowsForHashes();
line();
getMetadataRowsForIds();
line();
putHashIndexTask();
line();
deleteStreams();
line();
markStreamsAsUsedInternal();
line();
unmarkStreamsAsUsed();
line();
touchMetadataWhileMarkingUsedForConflicts();
line();
importRenderer.renderImportJavaDoc();
line("static final int dummy = 0;");
}
line("}");
}
private void fields() {
line("public static final int BLOCK_SIZE_IN_BYTES = 1000000; // 1MB. DO NOT CHANGE THIS WITHOUT AN"
+ " UPGRADE TASK");
line(
"public static final int IN_MEMORY_THRESHOLD = ",
String.valueOf(inMemoryThreshold),
"; // streams under this size are kept in memory when loaded");
line("public static final String STREAM_FILE_PREFIX = \"", name, "_stream_\";");
line("public static final String STREAM_FILE_SUFFIX = \".tmp\";");
line();
line("private static final SafeLogger log = SafeLoggerFactory.get(", StreamStore, ".class);");
line();
line("private final ", TableFactory, " tables;");
}
private void constructors() {
line("private ", StreamStore, "(TransactionManager txManager, ", TableFactory, " tables) {");
{
line("this(txManager, tables, () -> StreamStorePersistenceConfiguration.DEFAULT_CONFIG);");
}
line("}");
line();
line(
"private ",
StreamStore,
"(TransactionManager txManager, ",
TableFactory,
" tables, ",
"Supplier persistenceConfiguration) {");
{
line(
"super(txManager, ",
streamCompression.getDeclaringClass().getSimpleName() + "." + streamCompression,
", persistenceConfiguration);");
line("this.tables = tables;");
}
line("}");
line();
line("public static ", StreamStore, " of(TransactionManager txManager, ", TableFactory, " tables) {");
{
line("return new ", StreamStore, "(txManager, tables);");
}
line("}");
line();
line(
"public static ",
StreamStore,
" of(TransactionManager txManager, ",
TableFactory,
" tables, ",
" Supplier persistenceConfiguration) {");
{
line("return new ", StreamStore, "(txManager, tables, persistenceConfiguration);");
}
line("}");
line();
line("/**");
line(" * This should only be used by test code or as a performance optimization.");
line(" */");
line("static ", StreamStore, " of(", TableFactory, " tables) {");
{
line("return new ", StreamStore, "(null, tables);");
}
line("}");
}
private void storeBlock() {
line("@Override");
line("protected void storeBlock(Transaction t, long id, long blockNumber, final byte[] block) {");
{
line("Preconditions.checkArgument(block.length <= BLOCK_SIZE_IN_BYTES, \"Block to store in DB"
+ " must be less than BLOCK_SIZE_IN_BYTES\");");
line("final ", StreamValueRow, " row = ", StreamValueRow, ".of(id, blockNumber);");
line("try {");
{
line("// Do a touch operation on this table to ensure we get a conflict if someone cleans"
+ " it up.");
line("touchMetadataWhileStoringForConflicts(t, row.getId(), row.getBlockId());");
line("tables.get", StreamValueTable, "(t).putValue(row, block);");
}
line("} catch (RuntimeException e) {");
{
line("log.error(");
line(" \"Error storing block {} for stream id {}\",");
line(" SafeArg.of(\"blockId\", row.getBlockId()),");
line(" SafeArg.of(\"id\", row.getId()),");
line(" e);");
line("throw e;");
}
line("}");
}
line("}");
}
private void touchMetadataWhileStoringForConflicts() {
line(
"private void touchMetadataWhileStoringForConflicts(Transaction t, ",
StreamId,
" id, long blockNumber) {");
{
line(StreamMetadataTable, " metaTable = tables.get", StreamMetadataTable, "(t);");
line(StreamMetadataRow, " row = ", StreamMetadataRow, ".of(id);");
line("StreamMetadata metadata ="
+ " metaTable.getMetadatas(ImmutableSet.of(row)).values().iterator().next();");
line("Preconditions.checkState(metadata.getStatus() == Status.STORING, \"This stream is being"
+ " cleaned up while storing blocks: %s\", id);");
line("StreamMetadata.Builder builder = StreamMetadata.newBuilder(metadata);");
line("builder.setLength(blockNumber * BLOCK_SIZE_IN_BYTES + 1);");
line("metaTable.putMetadata(row, builder.build());");
}
line("}");
}
private void putMetadataAndHashIndexTask() {
line("@Override");
line(
"protected void putMetadataAndHashIndexTask(Transaction t, Map<",
StreamId,
", StreamMetadata> streamIdsToMetadata) {");
{
line(StreamMetadataTable, " mdTable = tables.get", StreamMetadataTable, "(t);");
line(
"Map<",
StreamId,
", StreamMetadata> prevMetadatas = getMetadata(t, streamIdsToMetadata.keySet());");
line();
line("Map<", StreamMetadataRow, ", StreamMetadata> rowsToStoredMetadata = new HashMap<>();");
line("Map<", StreamMetadataRow, ", StreamMetadata> rowsToUnstoredMetadata = new HashMap<>();");
line("for (Entry<", StreamId, ", StreamMetadata> e : streamIdsToMetadata.entrySet()) {");
{
line("long streamId = e.getKey();");
line("StreamMetadata metadata = e.getValue();");
line("StreamMetadata prevMetadata = prevMetadatas.get(streamId);");
line("if (metadata.getStatus() == Status.STORED) {");
{
line("if (prevMetadata == null || prevMetadata.getStatus() != Status.STORING) {");
{
line("// This can happen if we cleanup old streams.");
line("throw new TransactionFailedRetriableException(\"Cannot mark a stream as"
+ " stored that isn't currently storing: \" + prevMetadata);");
}
line("}");
line("rowsToStoredMetadata.put(", StreamMetadataRow, ".of(streamId), metadata);");
}
line("} else if (metadata.getStatus() == Status.STORING) {");
{
line("// This will prevent two users trying to store the same id.");
line("if (prevMetadata != null) {");
{
line("throw new TransactionFailedRetriableException(\"Cannot reuse the same stream"
+ " id: \" + streamId);");
}
line("}");
line("rowsToUnstoredMetadata.put(", StreamMetadataRow, ".of(streamId), metadata);");
}
line("}");
}
line("}");
line("putHashIndexTask(t, rowsToStoredMetadata);");
line();
line("Map<", StreamMetadataRow, ", StreamMetadata> rowsToMetadata = new HashMap<>();");
line("rowsToMetadata.putAll(rowsToStoredMetadata);");
line("rowsToMetadata.putAll(rowsToUnstoredMetadata);");
line("mdTable.putMetadata(rowsToMetadata);");
}
line("}");
}
private void getNumberOfBlocksFromMetadata() {
line("private long getNumberOfBlocksFromMetadata(StreamMetadata metadata) {");
{
line("return (metadata.getLength() + BLOCK_SIZE_IN_BYTES - 1) / BLOCK_SIZE_IN_BYTES;");
}
line("}");
}
private void getInMemoryThreshold() {
line("@Override");
line("protected long getInMemoryThreshold() {");
{
line("return IN_MEMORY_THRESHOLD;");
}
line("}");
}
private void createTempFile() {
line("@Override");
line("protected File createTempFile(", StreamId, " id) throws IOException {");
{
line("File file = TempFileUtils.createTempFile(STREAM_FILE_PREFIX + id, STREAM_FILE_SUFFIX);");
line("file.deleteOnExit();");
line("return file;");
}
line("}");
}
private void loadSingleBlockToOutputStream() {
line("@Override");
line(
"protected void loadSingleBlockToOutputStream(Transaction t, ",
StreamId,
" streamId, long blockId, OutputStream os) {");
{
line(StreamValueRow, " row = ", StreamValueRow, ".of(streamId, blockId);");
line("try {");
{
line("os.write(getBlock(t, row));");
}
line("} catch (RuntimeException e) {");
{
line("log.error(");
line(" \"Error storing block {} for stream id {}\",");
line(" SafeArg.of(\"blockId\", row.getBlockId()),");
line(" SafeArg.of(\"id\", row.getId()),");
line(" e);");
line("throw e;");
}
line("} catch (IOException e) {");
{
line("log.error(");
line(" \"Error writing block {} to file when getting stream id {}\",");
line(" SafeArg.of(\"blockId\", row.getBlockId()),");
line(" SafeArg.of(\"id\", row.getId()),");
line(" e);");
line("throw Throwables.rewrapAndThrowUncheckedException(\"Error writing blocks to file when"
+ " creating stream.\", e);");
}
line("}");
}
line("}");
}
private void getBlock() {
line("private byte[] getBlock(Transaction t, ", StreamValueRow, " row) {");
{
line(StreamValueTable, " valueTable = tables.get", StreamValueTable, "(t);");
line("return valueTable.getValues(ImmutableSet.of(row)).get(row);");
}
line("}");
}
private void getMetadata() {
line("@Override");
line(
"protected Map<",
StreamId,
", StreamMetadata> getMetadata(Transaction t, Set<",
StreamId,
"> streamIds) {");
{
line("if (streamIds.isEmpty()) {");
{
line("return ImmutableMap.of();");
}
line("}");
line(StreamMetadataTable, " table = tables.get", StreamMetadataTable, "(t);");
line(
"Map<",
StreamMetadataRow,
", StreamMetadata> metadatas = table.getMetadatas(getMetadataRowsForIds(streamIds));");
line("Map<", StreamId, ", StreamMetadata> ret = new HashMap<>();");
line("for (Map.Entry<", StreamMetadataRow, ", StreamMetadata> e : metadatas.entrySet()) {");
{
line("ret.put(e.getKey().getId(), e.getValue());");
}
line("}");
line("return ret;");
}
line("}");
}
private void lookupStreamIdsByHash() {
line("@Override");
line(
"public Map lookupStreamIdsByHash(Transaction t, final Set hashes) {");
{
line("if (hashes.isEmpty()) {");
{
line("return ImmutableMap.of();");
}
line("}");
line(StreamHashAidxTable, " idx = tables.get", StreamHashAidxTable, "(t);");
line("Set<", StreamHashAidxRow, "> rows = getHashIndexRowsForHashes(hashes);");
line();
line(
"Multimap<",
StreamHashAidxRow,
", ",
StreamHashAidxColumnValue,
"> m = idx.getRowsMultimap(rows);");
line("Map<", StreamId, ", Sha256Hash> hashForStreams = new HashMap<>();");
line("for (", StreamHashAidxRow, " r : m.keySet()) {");
{
line("for (", StreamHashAidxColumnValue, " v : m.get(r)) {");
{
line(StreamId, " streamId = v.getColumnName().getStreamId();");
line("Sha256Hash hash = r.getHash();");
line("if (hashForStreams.containsKey(streamId)) {");
{
line("AssertUtils.assertAndLog(log, hashForStreams.get(streamId).equals(hash),"
+ " \"(BUG) Stream ID has 2 different hashes: \" + streamId);");
}
line("}");
line("hashForStreams.put(streamId, hash);");
}
line("}");
}
line("}");
line("Map<", StreamId, ", StreamMetadata> metadata = getMetadata(t, hashForStreams.keySet());");
line();
line("Map ret = new HashMap<>();");
line("for (Map.Entry<", StreamId, ", StreamMetadata> e : metadata.entrySet()) {");
{
line("if (e.getValue().getStatus() != Status.STORED) {");
{
line("continue;");
}
line("}");
line("Sha256Hash hash = hashForStreams.get(e.getKey());");
line("ret.put(hash, e.getKey());");
}
line("}");
line();
line("return ret;");
}
line("}");
}
private void getHashIndexRowsForHashes() {
line("private Set<", StreamHashAidxRow, "> getHashIndexRowsForHashes(final Set hashes) {");
{
line("Set<", StreamHashAidxRow, "> rows = new HashSet<>();");
line("for (Sha256Hash h : hashes) {");
{
line("rows.add(", StreamHashAidxRow, ".of(h));");
}
line("}");
line("return rows;");
}
line("}");
}
private void getMetadataRowsForIds() {
line(
"private Set<",
StreamMetadataRow,
"> getMetadataRowsForIds(final Iterable<",
StreamId,
"> ids) {");
{
line("Set<", StreamMetadataRow, "> rows = new HashSet<>();");
line("for (", StreamId, " id : ids) {");
{
line("rows.add(", StreamMetadataRow, ".of(id));");
}
line("}");
line("return rows;");
}
line("}");
}
private void putHashIndexTask() {
line(
"private void putHashIndexTask(Transaction t, Map<",
StreamMetadataRow,
", StreamMetadata> rowsToMetadata) {");
{
line(
"Multimap<",
StreamHashAidxRow,
", ",
StreamHashAidxColumnValue,
"> indexMap = HashMultimap.create();");
line("for (Entry<", StreamMetadataRow, ", StreamMetadata> e : rowsToMetadata.entrySet()) {");
{
line(StreamMetadataRow, " row = e.getKey();");
line("StreamMetadata metadata = e.getValue();");
line("Preconditions.checkArgument(");
line(" metadata.getStatus() == Status.STORED,");
line(" \"Should only index successfully stored streams.\");");
line();
line("Sha256Hash hash = Sha256Hash.EMPTY;");
line("if (!ByteString.EMPTY.equals(metadata.getHash())) {");
{
line("hash = new Sha256Hash(metadata.getHash().toByteArray());");
}
line("}");
line(StreamHashAidxRow, " hashRow = ", StreamHashAidxRow, ".of(hash);");
line(StreamHashAidxColumn, " column = ", StreamHashAidxColumn, ".of(row.getId());");
line(
StreamHashAidxColumnValue,
" columnValue = ",
StreamHashAidxColumnValue,
".of(column, 0L);");
line("indexMap.put(hashRow, columnValue);");
}
line("}");
line(StreamHashAidxTable, " hiTable = tables.get", StreamHashAidxTable, "(t);");
line("hiTable.put(indexMap);");
}
line("}");
}
private void deleteStreams() {
line("/**");
line(" * This should only be used from the cleanup tasks.");
line(" */");
line("void deleteStreams(Transaction t, final Set<", StreamId, "> streamIds) {");
{
line("if (streamIds.isEmpty()) {");
{
line("return;");
}
line("}");
line("Set<", StreamMetadataRow, "> smRows = new HashSet<>();");
line(
"Multimap<",
StreamHashAidxRow,
", ",
StreamHashAidxColumn,
"> shToDelete = HashMultimap.create();");
line("for (", StreamId, " streamId : streamIds) {");
{
line("smRows.add(", StreamMetadataRow, ".of(streamId));");
}
line("}");
line(StreamMetadataTable, " table = tables.get", StreamMetadataTable, "(t);");
line("Map<", StreamMetadataRow, ", StreamMetadata> metadatas = table.getMetadatas(smRows);");
line("Set<", StreamValueRow, "> streamValueToDelete = new HashSet<>();");
line("for (Entry<", StreamMetadataRow, ", StreamMetadata> e : metadatas.entrySet()) {");
{
line(StreamId, " streamId = e.getKey().getId();");
line("long blocks = getNumberOfBlocksFromMetadata(e.getValue());");
line("for (long i = 0; i < blocks; i++) {");
{
line("streamValueToDelete.add(", StreamValueRow, ".of(streamId, i));");
}
line("}");
line("ByteString streamHash = e.getValue().getHash();");
line("Sha256Hash hash = Sha256Hash.EMPTY;");
line("if (!ByteString.EMPTY.equals(streamHash)) {");
{
line("hash = new Sha256Hash(streamHash.toByteArray());");
}
line("} else {");
{
line("log.error(");
line(" \"Empty hash for stream {}\",");
line(" SafeArg.of(\"id\", streamId));");
}
line("}");
line(StreamHashAidxRow, " hashRow = ", StreamHashAidxRow, ".of(hash);");
line(StreamHashAidxColumn, " column = ", StreamHashAidxColumn, ".of(streamId);");
line("shToDelete.put(hashRow, column);");
}
line("}");
line("tables.get", StreamHashAidxTable, "(t).delete(shToDelete);");
line("tables.get", StreamValueTable, "(t).delete(streamValueToDelete);");
line("table.delete(smRows);");
}
line("}");
}
private void touchMetadataWhileMarkingUsedForConflicts() {
line("@Override");
line(
"protected void touchMetadataWhileMarkingUsedForConflicts(Transaction t, Iterable<",
StreamId,
"> ids) {");
{
line(StreamMetadataTable, " metaTable = tables.get", StreamMetadataTable, "(t);");
line("Set<", StreamMetadataRow, "> rows = new HashSet<>();");
line("for (", StreamId, " id : ids) {");
{
line("rows.add(", StreamMetadataRow, ".of(id));");
}
line("}");
line("Map<", StreamMetadataRow, ", StreamMetadata> metadatas = metaTable.getMetadatas(rows);");
line("for (Map.Entry<", StreamMetadataRow, ", StreamMetadata> e : metadatas.entrySet()) {");
{
line("StreamMetadata metadata = e.getValue();");
line("Preconditions.checkState(metadata.getStatus() == Status.STORED,");
line("\"Stream: %s has status: %s\", e.getKey().getId(), metadata.getStatus());");
line("metaTable.putMetadata(e.getKey(), metadata);");
}
line("}");
line("SetView<", StreamMetadataRow, "> missingRows = Sets.difference(rows, metadatas.keySet());");
line("if (!missingRows.isEmpty()) {");
{
line("throw new IllegalStateException(\"Missing metadata rows for:\" + missingRows");
line("+ \" rows: \" + rows + \" metadata: \" + metadatas + \" txn timestamp: \" +"
+ " t.getTimestamp());");
}
line("}");
}
line("}");
}
private void markStreamsAsUsedInternal() {
line("@Override");
line(
"protected void markStreamsAsUsedInternal(Transaction t, final Map<",
StreamId,
", byte[]> streamIdsToReference) {");
{
line("if (streamIdsToReference.isEmpty()) {");
{
line("return;");
}
line("}");
line(StreamIdxTable, " index = tables.get", StreamIdxTable, "(t);");
line(
"Multimap<",
StreamIdxRow,
", ",
StreamIdxColumnValue,
"> rowsToValues = HashMultimap.create();");
line("for (Map.Entry<", StreamId, ", byte[]> entry : streamIdsToReference.entrySet()) {");
{
line(StreamId, " streamId = entry.getKey();");
line("byte[] reference = entry.getValue();");
line(StreamIdxColumn, " col = ", StreamIdxColumn, ".of(reference);");
line(StreamIdxColumnValue, " value = ", StreamIdxColumnValue, ".of(col, 0L);");
line("rowsToValues.put(", StreamIdxRow, ".of(streamId), value);");
}
line("}");
line("index.put(rowsToValues);");
}
line("}");
}
private void unmarkStreamsAsUsed() {
line("@Override");
line(
"public void unmarkStreamsAsUsed(Transaction t, final Map<",
StreamId,
", byte[]> streamIdsToReference) {");
{
line("if (streamIdsToReference.isEmpty()) {");
{
line("return;");
}
line("}");
line(StreamIdxTable, " index = tables.get", StreamIdxTable, "(t);");
line(
"Multimap<",
StreamIdxRow,
", ",
StreamIdxColumn,
"> toDelete = ArrayListMultimap.create(streamIdsToReference.size(), 1);");
line("for (Map.Entry<", StreamId, ", byte[]> entry : streamIdsToReference.entrySet()) {");
{
line(StreamId, " streamId = entry.getKey();");
line("byte[] reference = entry.getValue();");
line(StreamIdxColumn, " col = ", StreamIdxColumn, ".of(reference);");
line("toDelete.put(", StreamIdxRow, ".of(streamId), col);");
}
line("}");
line("index.delete(toDelete);");
}
line("}");
}
}.render();
}
public String renderIndexCleanupTask() {
final String StreamStore = name + "StreamStore";
final String StreamIdxTable = name + "StreamIdxTable";
final String StreamIdxRow = StreamIdxTable + "." + name + "StreamIdxRow";
final String StreamIdxColumnValue = StreamIdxTable + "." + name + "StreamIdxColumnValue";
final String TableFactory = schemaName + "TableFactory";
final String IndexCleanupTask = getIndexCleanupTaskClassName();
final String StreamId = streamIdType.getJavaObjectClassName();
return new Renderer() {
@Override
protected void run() {
packageAndImports();
line();
line("public class ", IndexCleanupTask, " implements OnCleanupTask {");
{
line();
line("private final ", TableFactory, " tables;");
line();
line("public ", IndexCleanupTask, "(Namespace namespace) {");
{
line("tables = ", TableFactory, ".of(namespace);");
}
line("}");
line();
cellsCleanedUp();
}
line("}");
}
private void packageAndImports() {
line("package ", packageName, ";");
line();
line("import java.util.Map;");
line("import java.util.Set;");
line();
line("import com.google.common.collect.Sets;");
line("import com.palantir.atlasdb.cleaner.api.OnCleanupTask;");
line("import com.palantir.atlasdb.encoding.PtBytes;");
line("import com.palantir.atlasdb.keyvalue.api.BatchColumnRangeSelection;");
line("import com.palantir.atlasdb.keyvalue.api.Cell;");
line("import com.palantir.atlasdb.keyvalue.api.Namespace;");
line("import com.palantir.atlasdb.transaction.api.Transaction;");
line("import com.palantir.common.base.BatchingVisitable;");
if (streamIdType == ValueType.SHA256HASH) {
line("import com.palantir.util.crypto.Sha256Hash;");
}
}
private void cellsCleanedUp() {
line("@Override");
line("public boolean cellsCleanedUp(Transaction t, Set cells) {");
{
line(StreamIdxTable, " usersIndex = tables.get", StreamIdxTable, "(t);");
line("Set<", StreamIdxRow, "> rows = Sets.newHashSetWithExpectedSize(cells.size());");
line("for (Cell cell : cells) {");
{
line("rows.add(", StreamIdxRow, ".BYTES_HYDRATOR.hydrateFromBytes(cell.getRowName()));");
}
line("}");
line("BatchColumnRangeSelection oneColumn = BatchColumnRangeSelection.create(");
line(" PtBytes.EMPTY_BYTE_ARRAY, PtBytes.EMPTY_BYTE_ARRAY, 1);");
line("Map<", StreamIdxRow, ", BatchingVisitable<", StreamIdxColumnValue, ">> existentRows");
line(" = usersIndex.getRowsColumnRange(rows, oneColumn);");
line("Set<", StreamIdxRow, "> rowsInDb = Sets.newHashSetWithExpectedSize(cells.size());");
line(
"for (Map.Entry<",
StreamIdxRow,
", BatchingVisitable<",
StreamIdxColumnValue,
">> rowVisitable");
line(" : existentRows.entrySet()) {");
{
line("rowVisitable.getValue().batchAccept(1, columnValues -> {");
{
line("if (!columnValues.isEmpty()) {");
{
line("rowsInDb.add(rowVisitable.getKey());");
}
line("}");
line("return false;");
}
line("});");
}
line("}");
line(
"Set<",
StreamId,
"> toDelete = Sets.newHashSetWithExpectedSize(rows.size() - rowsInDb.size());");
line("for (", StreamIdxRow, " rowToDelete : Sets.difference(rows, rowsInDb)) {");
{
line("toDelete.add(rowToDelete.getId());");
}
line("}");
line(StreamStore, ".of(tables).deleteStreams(t, toDelete);");
line("return false;");
}
line("}");
}
}.render();
}
public String renderMetadataCleanupTask() {
final String StreamStore = name + "StreamStore";
final String StreamMetadataTable = name + "StreamMetadataTable";
final String StreamMetadataRow = StreamMetadataTable + "." + name + "StreamMetadataRow";
final String StreamIndexTable = name + "StreamIdxTable";
final String StreamIndexRow = StreamIndexTable + "." + name + "StreamIdxRow";
final String StreamIndexColumnValue = StreamIndexTable + "." + name + "StreamIdxColumnValue";
final String TableFactory = schemaName + "TableFactory";
final String MetadataCleanupTask = getMetadataCleanupTaskClassName();
final String StreamId = streamIdType.getJavaObjectClassName();
return new Renderer() {
@Override
protected void run() {
packageAndImports();
line();
line("public class ", MetadataCleanupTask, " implements OnCleanupTask {");
{
line();
line("private final ", TableFactory, " tables;");
line();
line("public ", MetadataCleanupTask, "(Namespace namespace) {");
{
line("tables = ", TableFactory, ".of(namespace);");
}
line("}");
line();
cellsCleanedUp();
line();
unreferencedStreamsByIterator();
}
line("}");
}
private void packageAndImports() {
line("package ", packageName, ";");
line();
line("import java.util.Iterator;");
line("import java.util.Map;");
line("import java.util.HashSet;");
line("import java.util.Set;");
line("import java.util.stream.Collectors;");
line();
line("import com.google.common.collect.Sets;");
line("import com.palantir.atlasdb.cleaner.api.OnCleanupTask;");
line("import com.palantir.atlasdb.encoding.PtBytes;");
line("import com.palantir.atlasdb.keyvalue.api.BatchColumnRangeSelection;");
line("import com.palantir.atlasdb.keyvalue.api.Cell;");
line("import com.palantir.atlasdb.keyvalue.api.Namespace;");
line("import com.palantir.atlasdb.protos.generated.StreamPersistence.Status;");
line("import com.palantir.atlasdb.protos.generated.StreamPersistence.StreamMetadata;");
line("import com.palantir.atlasdb.transaction.api.Transaction;");
if (streamIdType == ValueType.SHA256HASH) {
line("import com.palantir.util.crypto.Sha256Hash;");
}
}
private void cellsCleanedUp() {
line("@Override");
line("public boolean cellsCleanedUp(Transaction t, Set cells) {");
{
line(StreamMetadataTable, " metaTable = tables.get", StreamMetadataTable, "(t);");
line("Set<", StreamMetadataRow, "> rows = Sets.newHashSetWithExpectedSize(cells.size());");
line("for (Cell cell : cells) {");
{
line("rows.add(", StreamMetadataRow, ".BYTES_HYDRATOR.hydrateFromBytes(cell.getRowName()));");
}
line("}");
line(StreamIndexTable, " indexTable = tables.get", StreamIndexTable, "(t);");
line("Set<", StreamMetadataRow, "> rowsWithNoIndexEntries =");
line(" getUnreferencedStreamsByIterator(indexTable, rows);");
line("Set<", StreamId, "> toDelete = new HashSet<>();");
line("Map<", StreamMetadataRow, ", StreamMetadata> currentMetadata =");
line(" metaTable.getMetadatas(rows);");
line("for (Map.Entry<", StreamMetadataRow, ", StreamMetadata> e : currentMetadata.entrySet()) {");
{
line("if (e.getValue().getStatus() != Status.STORED ||"
+ " rowsWithNoIndexEntries.contains(e.getKey())) {");
{
line("toDelete.add(e.getKey().getId());");
}
line("}");
}
line("}");
line(StreamStore, ".of(tables).deleteStreams(t, toDelete);");
line("return false;");
}
line("}");
}
private void unreferencedStreamsByIterator() {
line(
"private static Set<",
StreamMetadataRow,
"> getUnreferencedStreamsByIterator(",
StreamIndexTable,
" indexTable, Set<",
StreamMetadataRow,
"> metadataRows) {");
{
line("Set<", StreamIndexRow, "> indexRows = metadataRows.stream()");
line(" .map(", StreamMetadataRow, "::getId)");
line(" .map(", StreamIndexRow, "::of)");
line(" .collect(Collectors.toSet());");
line("Map<", StreamIndexRow, ", Iterator<", StreamIndexColumnValue, ">> referenceIteratorByStream");
line(" = indexTable.getRowsColumnRangeIterator(indexRows,");
line(" BatchColumnRangeSelection.create(PtBytes.EMPTY_BYTE_ARRAY,"
+ " PtBytes.EMPTY_BYTE_ARRAY, 1));");
line("return referenceIteratorByStream.entrySet().stream()");
line(" .filter(entry -> !entry.getValue().hasNext())");
line(" .map(Map.Entry::getKey)");
line(" .map(", StreamIndexRow, "::getId)");
line(" .map(", StreamMetadataRow, "::of)");
line(" .collect(Collectors.toSet());");
}
line("}");
}
}.render();
}
private static final Class>[] IMPORTS = new Class>[] {
BufferedInputStream.class,
ByteArrayInputStream.class,
File.class,
FileNotFoundException.class,
FileOutputStream.class,
IOException.class,
InputStream.class,
OutputStream.class,
DigestInputStream.class,
MessageDigest.class,
Collection.class,
Optional.class,
HashMap.class,
HashSet.class,
Map.class,
Map.Entry.class,
Set.class,
TimeUnit.class,
BiConsumer.class,
SafeArg.class,
SafeLogger.class,
SafeLoggerFactory.class,
Preconditions.class,
Arrays.class,
ArrayListMultimap.class,
Collections2.class,
HashMultimap.class,
ImmutableMap.class,
ImmutableSet.class,
Lists.class,
Maps.class,
Multimap.class,
Multimaps.class,
Sets.class,
Sets.SetView.class,
CountingInputStream.class,
Ints.class,
ByteString.class,
Status.class,
StreamMetadata.class,
Throwables.class,
ConcatenatedInputStream.class,
Cell.class,
PersistentStreamStore.class,
Transaction.class,
TransactionManager.class,
TransactionTask.class,
TxTask.class,
AssertUtils.class,
ByteArrayIOStream.class,
Sha256Hash.class,
DeleteOnCloseFileInputStream.class,
TempFileUtils.class,
TransactionFailedRetriableException.class,
StreamCleanedException.class,
AbstractPersistentStreamStore.class,
BlockConsumingInputStream.class,
BlockGetter.class,
BlockLoader.class,
List.class,
CheckForNull.class,
Generated.class,
StreamCompression.class,
Pair.class,
Functions.class,
ByteStreams.class,
Supplier.class,
StreamStorePersistenceConfiguration.class,
};
}
| |
© 2015 - 2025 Weber Informatics LLC | Privacy Policy