All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.palantir.atlasdb.keyvalue.cassandra.thrift.ThriftObjectSizeUtils Maven / Gradle / Ivy

The newest version!
/*
 * (c) Copyright 2018 Palantir Technologies Inc. All rights reserved.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package com.palantir.atlasdb.keyvalue.cassandra.thrift;

import com.google.common.collect.Maps;
import java.nio.ByteBuffer;
import java.util.Collection;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.RandomAccess;
import java.util.function.Function;
import java.util.function.ToLongFunction;
import java.util.stream.Collectors;
import javax.annotation.Nullable;
import org.apache.cassandra.thrift.Column;
import org.apache.cassandra.thrift.ColumnOrSuperColumn;
import org.apache.cassandra.thrift.CounterColumn;
import org.apache.cassandra.thrift.CounterSuperColumn;
import org.apache.cassandra.thrift.CqlMetadata;
import org.apache.cassandra.thrift.CqlResult;
import org.apache.cassandra.thrift.CqlRow;
import org.apache.cassandra.thrift.Deletion;
import org.apache.cassandra.thrift.KeySlice;
import org.apache.cassandra.thrift.Mutation;
import org.apache.cassandra.thrift.SlicePredicate;
import org.apache.cassandra.thrift.SliceRange;
import org.apache.cassandra.thrift.SuperColumn;

public final class ThriftObjectSizeUtils {

    private static final long ONE_BYTE = 1;

    private ThriftObjectSizeUtils() {
        // utility class
    }

    public static long getApproximateSizeOfMutationMap(Map>> batchMutateMap) {
        long approxBytesForKeys = getCollectionSize(batchMutateMap.keySet(), ThriftObjectSizeUtils::getByteBufferSize);
        long approxBytesForValues = getCollectionSize(
                batchMutateMap.values(),
                currentMap -> getCollectionSize(currentMap.keySet(), ThriftObjectSizeUtils::getStringSize)
                        + getCollectionSize(
                                currentMap.values(),
                                mutations -> getListSize(mutations, ThriftObjectSizeUtils::getMutationSize)));
        return approxBytesForKeys + approxBytesForValues;
    }

    public static Map getSizeOfMutationPerTable(
            Map>> batchMutateMap) {
        Map tableToSize = new HashMap<>();

        batchMutateMap.forEach((key, tableToMutations) -> {
            long keySize = ThriftObjectSizeUtils.getByteBufferSize(key);

            tableToMutations.forEach((table, mutations) -> {
                long size = tableToSize.getOrDefault(table, 0L);
                size += keySize;
                size += getListSize(mutations, ThriftObjectSizeUtils::getMutationSize);

                tableToSize.put(table, size);
            });
        });

        return tableToSize;
    }

    public static long getApproximateSizeOfColsByKey(Map> result) {
        return getCollectionSize(
                result.entrySet(),
                rowResult -> ThriftObjectSizeUtils.getByteBufferSize(rowResult.getKey())
                        + getListSize(rowResult.getValue(), ThriftObjectSizeUtils::getColumnOrSuperColumnSize));
    }

    public static long getApproximateSizeOfColListsByKey(Map>> result) {
        Map> flattenedColumnListMap = Maps.transformValues(
                result, lists -> lists.stream().flatMap(List::stream).collect(Collectors.toList()));
        return getApproximateSizeOfColsByKey(flattenedColumnListMap);
    }

    public static long getApproximateSizeOfKeySlices(List slices) {
        return getListSize(slices, ThriftObjectSizeUtils::getKeySliceSize);
    }

    public static long getCasByteCount(List updates) {
        // TODO(nziebart): CAS actually writes more bytes than this, because the associated Paxos negotiations must
        // be persisted
        return getListSize(updates, ThriftObjectSizeUtils::getColumnSize);
    }

    public static long getColumnOrSuperColumnSize(ColumnOrSuperColumn columnOrSuperColumn) {
        if (columnOrSuperColumn == null) {
            return getNullSize();
        }
        return getColumnSize(columnOrSuperColumn.getColumn())
                + getSuperColumnSize(columnOrSuperColumn.getSuper_column())
                + getCounterColumnSize(columnOrSuperColumn.getCounter_column())
                + getCounterSuperColumnSize(columnOrSuperColumn.getCounter_super_column());
    }

    public static long getByteBufferSize(ByteBuffer byteBuffer) {
        if (byteBuffer == null) {
            return getNullSize();
        }
        return byteBuffer.remaining();
    }

    public static long getMutationSize(Mutation mutation) {
        if (mutation == null) {
            return getNullSize();
        }
        return getColumnOrSuperColumnSize(mutation.getColumn_or_supercolumn())
                + getDeletionSize(mutation.getDeletion());
    }

    public static long getCqlResultSize(CqlResult cqlResult) {
        if (cqlResult == null) {
            return getNullSize();
        }
        return getThriftEnumSize()
                + getListSize(cqlResult.getRows(), ThriftObjectSizeUtils::getCqlRowSize)
                + Integer.BYTES
                + getCqlMetadataSize(cqlResult.getSchema());
    }

    public static long getKeySliceSize(KeySlice keySlice) {
        if (keySlice == null) {
            return getNullSize();
        }
        return getBytesSize(keySlice, KeySlice::bufferForKey, KeySlice::getKey)
                + getListSize(keySlice.getColumns(), ThriftObjectSizeUtils::getColumnOrSuperColumnSize);
    }

    public static long getStringSize(String string) {
        if (string == null) {
            return getNullSize();
        }
        return string.length();
    }

    public static long getColumnSize(Column column) {
        if (column == null) {
            return getNullSize();
        }
        return getBytesSize(column, Column::bufferForName, Column::getName)
                + getBytesSize(column, Column::bufferForValue, Column::getValue)
                + getTtlSize()
                + getTimestampSize();
    }

    private static long getCounterSuperColumnSize(CounterSuperColumn counterSuperColumn) {
        if (counterSuperColumn == null) {
            return getNullSize();
        }
        return getBytesSize(counterSuperColumn, CounterSuperColumn::bufferForName, CounterSuperColumn::getName)
                + getListSize(counterSuperColumn.getColumns(), ThriftObjectSizeUtils::getCounterColumnSize);
    }

    private static long getCounterColumnSize(CounterColumn counterColumn) {
        if (counterColumn == null) {
            return getNullSize();
        }
        return getBytesSize(counterColumn, CounterColumn::bufferForName, CounterColumn::getName)
                + getCounterValueSize();
    }

    private static long getSuperColumnSize(SuperColumn superColumn) {
        if (superColumn == null) {
            return getNullSize();
        }
        return getBytesSize(superColumn, SuperColumn::bufferForName, SuperColumn::getName)
                + getListSize(superColumn.getColumns(), ThriftObjectSizeUtils::getColumnSize);
    }

    private static long getDeletionSize(Deletion deletion) {
        if (deletion == null) {
            return getNullSize();
        }
        return getTimestampSize()
                + getBytesSize(deletion, Deletion::bufferForSuper_column, Deletion::getSuper_column)
                + getSlicePredicateSize(deletion.getPredicate());
    }

    private static long getSlicePredicateSize(SlicePredicate predicate) {
        if (predicate == null) {
            return getNullSize();
        }

        return getListSize(predicate.getColumn_names(), ThriftObjectSizeUtils::getByteBufferSize)
                + getSliceRangeSize(predicate.getSlice_range());
    }

    private static long getSliceRangeSize(SliceRange sliceRange) {
        if (sliceRange == null) {
            return getNullSize();
        }
        return getBytesSize(sliceRange, SliceRange::bufferForStart, SliceRange::getStart)
                + getBytesSize(sliceRange, SliceRange::bufferForFinish, SliceRange::getFinish)
                + getReversedBooleanSize()
                + getSliceRangeCountSize();
    }

    private static long getCqlMetadataSize(CqlMetadata schema) {
        if (schema == null) {
            return getNullSize();
        }

        return getByteBufferStringMapSize(schema.getName_types())
                + getByteBufferStringMapSize(schema.getValue_types())
                + getStringSize(schema.getDefault_name_type())
                + getStringSize(schema.getDefault_value_type());
    }

    private static long getByteBufferStringMapSize(Map nameTypes) {
        return getCollectionSize(
                nameTypes.entrySet(),
                entry -> ThriftObjectSizeUtils.getByteBufferSize(entry.getKey())
                        + ThriftObjectSizeUtils.getStringSize(entry.getValue()));
    }

    private static long getCqlRowSize(CqlRow cqlRow) {
        if (cqlRow == null) {
            return getNullSize();
        }
        return getBytesSize(cqlRow, CqlRow::bufferForKey, CqlRow::getKey)
                + getListSize(cqlRow.getColumns(), ThriftObjectSizeUtils::getColumnSize);
    }

    private static long getThriftEnumSize() {
        return Integer.BYTES;
    }

    private static long getByteArraySize(byte[] byteArray) {
        if (byteArray == null) {
            return getNullSize();
        }
        return byteArray.length;
    }

    private static long getTimestampSize() {
        return Long.BYTES;
    }

    private static long getTtlSize() {
        return Integer.BYTES;
    }

    private static long getCounterValueSize() {
        return Long.BYTES;
    }

    private static long getReversedBooleanSize() {
        return ONE_BYTE;
    }

    private static long getSliceRangeCountSize() {
        return Integer.BYTES;
    }

    private static long getNullSize() {
        return Integer.BYTES;
    }

    private static  long getBytesSize(T data, Function toByteBuffer, Function toBytes) {
        // determine the size of bytes for the given slice of data,
        // ideally without having to copy that data into an array.
        ByteBuffer byteBuffer = toByteBuffer.apply(data);
        if (byteBuffer == null) {
            // fallback to slow path that potentially copies array and creates ByteBuffer
            byte[] bytes = toBytes.apply(data);
            return getByteArraySize(bytes);
        }
        // fast-path where no copies are needed
        return byteBuffer.remaining();
    }

    public static  long getCollectionSize(@Nullable Collection collection, ToLongFunction sizeFunction) {
        if (collection == null) {
            return getNullSize();
        }
        if (collection instanceof List) {
            return getListSize((List) collection, sizeFunction);
        }
        return sumSizes(collection, sizeFunction);
    }

    private static  long getListSize(@Nullable List list, ToLongFunction sizeFunction) {
        if (list == null) {
            return getNullSize();
        }

        // random access lists can be more efficiently accessed via List::get(int)
        // as this avoids allocating iterator
        if (list instanceof RandomAccess) {
            long sum = 0L;
            //noinspection ForLoopReplaceableByForEach -- performance sensitive
            for (int i = 0; i < list.size(); i++) {
                sum += sizeFunction.applyAsLong(list.get(i));
            }
            return sum;
        }

        return sumSizes(list, sizeFunction);
    }

    private static  long sumSizes(Collection collection, ToLongFunction sizeFunction) {
        long sum = 0L;
        //noinspection ForLoopReplaceableByStream -- performance sensitive, avoiding stream allocations
        for (T t : collection) {
            sum += sizeFunction.applyAsLong(t);
        }
        return sum;
    }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy