All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.palantir.atlasdb.schema.stream.StreamStoreDefinitionBuilder Maven / Gradle / Ivy

/*
 * (c) Copyright 2018 Palantir Technologies Inc. All rights reserved.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package com.palantir.atlasdb.schema.stream;

import com.google.common.base.Preconditions;
import com.google.common.collect.Maps;
import com.palantir.atlasdb.AtlasDbConstants;
import com.palantir.atlasdb.protos.generated.TableMetadataPersistence;
import com.palantir.atlasdb.table.description.TableDefinition;
import com.palantir.atlasdb.table.description.ValueType;
import com.palantir.common.compression.StreamCompression;
import java.util.Map;
import java.util.stream.Collectors;

public class StreamStoreDefinitionBuilder {
    private final ValueType valueType;
    private final String shortName;
    private final String longName;
    private Map streamTables =
            Maps.newHashMapWithExpectedSize(StreamTableType.values().length);
    private int inMemoryThreshold = AtlasDbConstants.DEFAULT_STREAM_IN_MEMORY_THRESHOLD;
    private StreamCompression compressStreamType;
    private int numberOfRowComponentsHashed = 0;

    /**
     * @param shortName The prefix of the table names in the DB.
     * @param longName The prefix of the generated Java class names.
     * @param valueType The type of the column that will store the stream ID internally. Usually a VAR_LONG.
     */
    public StreamStoreDefinitionBuilder(String shortName, String longName, ValueType valueType) {
        for (StreamTableType tableType : StreamTableType.values()) {
            streamTables.put(
                    tableType.getTableName(shortName),
                    new StreamTableDefinitionBuilder(tableType, longName, valueType));
        }
        this.valueType = valueType;
        this.shortName = shortName;
        this.longName = longName;
        this.compressStreamType = StreamCompression.NONE;
    }

    /**
     * We recommend using hashRowComponents() instead as it has the additional benefit of preventing hotspotting
     * within a stream. However, do not change this flag for an existing store schema as we currently do not support
     * StreamStore migrations.
     */
    public StreamStoreDefinitionBuilder hashFirstRowComponent() {
        return hashFirstNRowComponents(1);
    }

    /**
     * We recommend that this flag is set in order to prevent hotspotting in the underlying table which stores
     * the data blocks. The effect of this method is that row keys will be prefixed by the hashed
     * concatenation of the stream id and block id. AtlasDB does not have support for StreamStore migrations,
     * so if you are adding this flag for an existing StreamStore you will have to implement the migration as well.
     */
    public StreamStoreDefinitionBuilder hashRowComponents() {
        return hashFirstNRowComponents(2);
    }

    private StreamStoreDefinitionBuilder hashFirstNRowComponents(int numberOfComponentsHashed) {
        com.palantir.logsafe.Preconditions.checkArgument(
                numberOfComponentsHashed <= 2,
                "The number of components specified must be less than two as "
                        + "StreamStore internal tables use at most two row components.");
        streamTables.forEach((tableName, streamTableBuilder) ->
                streamTableBuilder.hashFirstNRowComponents(numberOfComponentsHashed));
        numberOfRowComponentsHashed = numberOfComponentsHashed;
        return this;
    }

    public StreamStoreDefinitionBuilder tableNameLogSafety(TableMetadataPersistence.LogSafety logSafety) {
        streamTables.forEach((tableName, streamTableBuilder) -> streamTableBuilder.tableNameLogSafety(logSafety));
        return this;
    }

    public StreamStoreDefinitionBuilder isAppendHeavyAndReadLight() {
        streamTables.forEach((tableName, streamTableBuilder) -> streamTableBuilder.appendHeavyAndReadLight());
        return this;
    }

    /**
     * @deprecated use {@link #compressStreamInClient()} instead, because that will compress before sending the data
     * over the network to Cassandra.
     */
    @Deprecated
    public StreamStoreDefinitionBuilder compressBlocksInDb() {
        streamTables.forEach((tableName, streamTableBuilder) -> streamTableBuilder.compressBlocksInDb());
        return this;
    }

    public StreamStoreDefinitionBuilder compressStreamInClient() {
        return compressStreamInClient(StreamCompression.LZ4);
    }

    public StreamStoreDefinitionBuilder compressStreamInClient(StreamCompression compressionType) {
        compressStreamType = compressionType;
        return this;
    }

    public StreamStoreDefinitionBuilder inMemoryThreshold(int inMemoryThreshold) {
        this.inMemoryThreshold = inMemoryThreshold;
        return this;
    }

    public StreamStoreDefinition build() {
        Map tablesToCreate = streamTables.entrySet().stream()
                .collect(Collectors.toMap(
                        Map.Entry::getKey, entry -> entry.getValue().build()));

        com.palantir.logsafe.Preconditions.checkArgument(
                valueType.getJavaClassName().equals("long"), "Stream ids must be a long");
        Preconditions.checkArgument(
                inMemoryThreshold <= StreamStoreDefinition.MAX_IN_MEMORY_THRESHOLD,
                "inMemoryThreshold cannot be greater than %s",
                StreamStoreDefinition.MAX_IN_MEMORY_THRESHOLD);

        return new StreamStoreDefinition(
                tablesToCreate,
                shortName,
                longName,
                valueType,
                inMemoryThreshold,
                compressStreamType,
                numberOfRowComponentsHashed);
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy