All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.palantir.atlasdb.stream.AbstractPersistentStreamStore Maven / Gradle / Ivy

There is a newer version: 0.1193.0
Show newest version
/*
 * (c) Copyright 2018 Palantir Technologies Inc. All rights reserved.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package com.palantir.atlasdb.stream;

import com.google.common.base.Preconditions;
import com.google.common.collect.ImmutableMap;
import com.google.common.collect.Iterables;
import com.google.common.collect.Sets;
import com.google.common.io.ByteStreams;
import com.google.common.io.CountingInputStream;
import com.google.protobuf.ByteString;
import com.palantir.atlasdb.encoding.PtBytes;
import com.palantir.atlasdb.protos.generated.StreamPersistence.Status;
import com.palantir.atlasdb.protos.generated.StreamPersistence.StreamMetadata;
import com.palantir.atlasdb.transaction.api.Transaction;
import com.palantir.atlasdb.transaction.api.TransactionManager;
import com.palantir.atlasdb.transaction.api.TransactionTask;
import com.palantir.atlasdb.transaction.impl.TxTask;
import com.palantir.common.base.Throwables;
import com.palantir.common.compression.StreamCompression;
import com.palantir.common.streams.KeyedStream;
import com.palantir.logsafe.SafeArg;
import com.palantir.util.Pair;
import com.palantir.util.crypto.Sha256Hash;
import java.io.IOException;
import java.io.InputStream;
import java.security.DigestInputStream;
import java.security.MessageDigest;
import java.util.Map;
import java.util.function.Supplier;
import javax.annotation.Nullable;

public abstract class AbstractPersistentStreamStore extends AbstractGenericStreamStore
        implements PersistentStreamStore {
    private final StreamStoreBackoffStrategy backoffStrategy;
    private final StreamCompression compression;

    protected AbstractPersistentStreamStore(TransactionManager txManager, StreamCompression compression) {
        this(txManager, compression, () -> StreamStorePersistenceConfigurations.DEFAULT_CONFIG);
    }

    protected AbstractPersistentStreamStore(
            TransactionManager txManager,
            StreamCompression compression,
            Supplier persistenceConfiguration) {
        super(txManager, compression);
        this.compression = compression;
        this.backoffStrategy = StandardPeriodicBackoffStrategy.create(persistenceConfiguration);
    }

    protected final void storeMetadataAndIndex(final long streamId, final StreamMetadata metadata) {
        com.palantir.logsafe.Preconditions.checkNotNull(txnMgr, "Transaction manager must not be null");
        txnMgr.runTaskThrowOnConflict((TxTask) tx -> {
            putMetadataAndHashIndexTask(tx, streamId, metadata);
            return null;
        });
    }

    private Long lookupStreamIdByHash(Transaction tx, Sha256Hash hash) {
        Map hashToId = lookupStreamIdsByHash(tx, Sets.newHashSet(hash));
        if (hashToId.isEmpty()) {
            return null;
        }
        return Iterables.getOnlyElement(hashToId.entrySet()).getValue();
    }

    @Override
    public final long getByHashOrStoreStreamAndMarkAsUsed(
            Transaction tx, Sha256Hash hash, InputStream stream, byte[] reference) {
        Long streamId = lookupStreamIdByHash(tx, hash);
        if (streamId != null) {
            markStreamsAsUsed(
                    tx,
                    ImmutableMap.builder()
                            .put(streamId, reference)
                            .build());
            return streamId;
        }
        Pair pair = storeStream(stream);
        Preconditions.checkArgument(
                hash.equals(pair.rhSide), "passed hash: %s does not equal stream hash: %s", hash, pair.rhSide);
        markStreamsAsUsedInternal(
                tx,
                ImmutableMap.builder().put(pair.lhSide, reference).build());
        return pair.lhSide;
    }

    @Override
    public void unmarkStreamAsUsed(Transaction tx, long streamId, byte[] reference) {
        unmarkStreamsAsUsed(
                tx,
                ImmutableMap.builder().put(streamId, reference).build());
    }

    @Override
    public void markStreamAsUsed(Transaction tx, long streamId, byte[] reference) {
        markStreamsAsUsed(
                tx,
                ImmutableMap.builder().put(streamId, reference).build());
    }

    @Override
    public void markStreamsAsUsed(Transaction tx, Map streamIdsToReference) {
        touchMetadataWhileMarkingUsedForConflicts(tx, streamIdsToReference.keySet());
        markStreamsAsUsedInternal(tx, streamIdsToReference);
    }

    protected long storeEmptyMetadata() {
        com.palantir.logsafe.Preconditions.checkNotNull(txnMgr, "Transaction manager must not be null");
        return txnMgr.runTaskThrowOnConflict(tx -> {
            putMetadataAndHashIndexTask(tx, tx.getTimestamp(), getEmptyMetadata());
            return tx.getTimestamp();
        });
    }

    @Override
    public Pair storeStream(InputStream stream) {
        // Store empty metadata before doing anything
        long id = storeEmptyMetadata();

        StreamMetadata metadata = storeBlocksAndGetFinalMetadata(null, id, stream);
        storeMetadataAndIndex(id, metadata);
        return Pair.create(id, new Sha256Hash(metadata.getHash().toByteArray()));
    }

    @Override
    public Map storeStreams(final Transaction tx, final Map streams) {
        if (streams.isEmpty()) {
            return ImmutableMap.of();
        }

        Map idsToEmptyMetadata =
                KeyedStream.stream(streams).map($ -> getEmptyMetadata()).collectToMap();
        putMetadataAndHashIndexTask(tx, idsToEmptyMetadata);

        Map idsToMetadata = KeyedStream.stream(streams)
                .map((id, stream) -> storeBlocksAndGetFinalMetadata(tx, id, stream))
                .collectToMap();
        putMetadataAndHashIndexTask(tx, idsToMetadata);

        return KeyedStream.stream(idsToMetadata)
                .map(metadata -> new Sha256Hash(metadata.getHash().toByteArray()))
                .collectToMap();
    }

    // This method is overridden in generated code. Changes to this method may have unintended consequences.
    protected StreamMetadata storeBlocksAndGetFinalMetadata(@Nullable Transaction tx, long id, InputStream stream) {
        MessageDigest digest = Sha256Hash.getMessageDigest();
        try (InputStream hashingStream = new DigestInputStream(stream, digest);
                InputStream compressingStream = compression.compress(hashingStream)) {
            StreamMetadata metadata = storeBlocksAndGetHashlessMetadata(tx, id, compressingStream);
            return StreamMetadata.newBuilder(metadata)
                    .setHash(ByteString.copyFrom(digest.digest()))
                    .build();
        } catch (IOException e) {
            throw new RuntimeException(e);
        }
    }

    protected final StreamMetadata storeBlocksAndGetHashlessMetadata(
            @Nullable Transaction tx, long id, InputStream stream) {
        CountingInputStream countingStream = new CountingInputStream(stream);

        // Try to store the bytes in the stream and get length
        try {
            storeBlocksFromStream(tx, id, countingStream);
        } catch (IOException e) {
            long length = countingStream.getCount();
            StreamMetadata metadata = StreamMetadata.newBuilder()
                    .setStatus(Status.FAILED)
                    .setLength(length)
                    .setHash(ByteString.EMPTY)
                    .build();
            storeMetadataAndIndex(id, metadata);
            log.error(
                    "Could not store stream {}. Failed after {} bytes.",
                    SafeArg.of("stream", id),
                    SafeArg.of("length", length),
                    e);
            throw Throwables.rewrapAndThrowUncheckedException("Failed to store stream.", e);
        }

        long length = countingStream.getCount();
        return StreamMetadata.newBuilder()
                .setStatus(Status.STORED)
                .setLength(length)
                .setHash(ByteString.EMPTY)
                .build();
    }

    private void storeBlocksFromStream(@Nullable Transaction tx, long id, InputStream stream) throws IOException {
        long blockNumber = 0;

        while (true) {
            byte[] bytesToStore = new byte[BLOCK_SIZE_IN_BYTES];
            int length = ByteStreams.read(stream, bytesToStore, 0, BLOCK_SIZE_IN_BYTES);
            // Store only relevant data if it only filled a partial block
            if (length == 0) {
                break;
            }
            if (length < BLOCK_SIZE_IN_BYTES) {
                // This is the last block.
                storeBlockWithNonNullTransaction(tx, id, blockNumber, PtBytes.head(bytesToStore, length));
                break;
            } else {
                // Store a full block.
                storeBlockWithNonNullTransaction(tx, id, blockNumber, bytesToStore);
            }
            blockNumber++;
            if (!streamOperationIsTransactional(tx)) {
                backoffStrategy.accept(blockNumber);
            }
        }
    }

    private boolean streamOperationIsTransactional(@Nullable Transaction tx) {
        // TODO (jkong): I'm using tx == null as a proxy for whether the entire operation should be done
        // transactionally or not (null implies nontransactional).
        // This is not ideal, but was done in the interest of time.
        return tx != null;
    }

    protected void storeBlockWithNonNullTransaction(
            @Nullable Transaction tx, final long id, final long blockNumber, final byte[] bytesToStore) {
        if (tx != null) {
            storeBlock(tx, id, blockNumber, bytesToStore);
        } else {
            com.palantir.logsafe.Preconditions.checkNotNull(txnMgr, "Transaction manager must not be null");
            txnMgr.runTaskThrowOnConflict((TransactionTask) t1 -> {
                storeBlock(t1, id, blockNumber, bytesToStore);
                return null;
            });
        }
    }

    private void putMetadataAndHashIndexTask(Transaction tx, Long streamId, StreamMetadata metadata) {
        putMetadataAndHashIndexTask(
                tx,
                ImmutableMap.builder()
                        .put(streamId, metadata)
                        .build());
    }

    protected abstract void putMetadataAndHashIndexTask(Transaction tx, Map streamIdsToMetadata);

    protected abstract void storeBlock(Transaction tx, long id, long blockNumber, byte[] block);

    protected abstract void touchMetadataWhileMarkingUsedForConflicts(Transaction tx, Iterable ids)
            throws StreamCleanedException;

    protected abstract void markStreamsAsUsedInternal(Transaction tx, Map streamIdsToReference);
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy