All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.bazaarvoice.emodb.sor.db.astyanax.DefaultChangeEncoder Maven / Gradle / Ivy

There is a newer version: 6.5.190
Show newest version
package com.bazaarvoice.emodb.sor.db.astyanax;

import com.bazaarvoice.emodb.common.cassandra.nio.BufferUtils;
import com.bazaarvoice.emodb.common.json.JsonHelper;
import com.bazaarvoice.emodb.common.json.deferred.LazyJsonMap;
import com.bazaarvoice.emodb.sor.api.Change;
import com.bazaarvoice.emodb.sor.api.ChangeBuilder;
import com.bazaarvoice.emodb.sor.api.Compaction;
import com.bazaarvoice.emodb.sor.api.History;
import com.bazaarvoice.emodb.sor.db.LazyDelta;
import com.bazaarvoice.emodb.sor.delta.Deltas;
import com.bazaarvoice.emodb.sor.delta.deser.JsonTokener;
import com.google.common.base.Charsets;
import com.google.common.base.Functions;
import com.google.common.collect.FluentIterable;
import org.apache.cassandra.utils.ByteBufferUtil;

import javax.annotation.Nonnull;
import javax.annotation.Nullable;
import java.nio.ByteBuffer;
import java.util.EnumSet;
import java.util.Set;
import java.util.UUID;

import static com.google.common.base.Preconditions.checkArgument;

class DefaultChangeEncoder implements ChangeEncoder {

    private enum Encoding {
        D1,  // delta (version 1 encoding)
        D2,  // delta (version 2 encoding includes tags)
        D3,  // delta (version 3 encoding, adds change flags to D2
        C1,  // compaction (version 1 encoding)
        H1,  // historical deltas (version 1 encoding)
    }

    private final Encoding _deltaEncoding;

    public DefaultChangeEncoder() {
        // Default constructor uses the latest version.
        this(3);
    }

    public DefaultChangeEncoder(int deltaEncodingVersion) {
        // To support a rolling upgrade between delta encodings the caller can specify which of the two most recent
        // delta encoding versions to use.  When upgrading the version should be deployed as the old version so that
        // old instances can read deltas written by the new instances.  Once all old instances have been terminated
        // the encoding version can be flipped to the new version.

        checkArgument(deltaEncodingVersion == 2 || deltaEncodingVersion == 3, "Only delta encoding versions 2 and 3 are permitted");
        _deltaEncoding = deltaEncodingVersion == 2 ? Encoding.D2 : Encoding.D3;
    }

    @Override
    public StringBuilder encodeDelta(String deltaString, @Nullable EnumSet changeFlags, @Nonnull Set tags, StringBuilder changeBody) {
        // Encoding will be either the legacy D2 or the current D3
        // Spec for D2 is :
        // Spec for D3 is ::

        changeBody.append(_deltaEncoding)
                .append(":")
                .append(tags.isEmpty() ? "[]" : JsonHelper.asJson(tags));

        if (_deltaEncoding == Encoding.D3) {
            changeBody.append(":");
            if (changeFlags != null) {
                for (ChangeFlag changeFlag : changeFlags) {
                    changeBody.append(changeFlag.serialize());
                }
            }
        }

        changeBody.append(":")
                .append(deltaString);


        return changeBody;
    }

    @Override
    public StringBuilder encodeCompaction(Compaction compaction, StringBuilder prefix) {
        return encodeChange(Encoding.C1, JsonHelper.asJson(compaction), prefix);
    }

    @Override
    public String encodeHistory(History history) {
        return encodeChange(Encoding.H1, JsonHelper.asJson(history), new StringBuilder()).toString();
    }

    private StringBuilder encodeChange(Encoding encoding, String bodyString, StringBuilder prefix) {
        return prefix.append(encoding).append(":").append(bodyString);
    }

    /**
     * Decodes a change encoded by {@link #encodeChange}.
     */
    @Override
    public Change decodeChange(UUID changeId, ByteBuffer buf) {
        int sep = getSeparatorIndex(buf);
        Encoding encoding = getEncoding(buf, sep);
        String body = getBody(buf, sep);
        JsonTokener tokener;
        Set tags;

        ChangeBuilder builder = new ChangeBuilder(changeId);
        switch (encoding) {
            case D1:
                builder.with(Deltas.fromString(body));
                break;
            case D2:
                // Spec for D2 is as follows:
                // D2::
                tokener = new JsonTokener(body);
                tags = FluentIterable.from(tokener.nextArray()).transform(Functions.toStringFunction()).toSet();
                tokener.next(':');
                builder.with(Deltas.fromString(tokener)).with(tags);
                break;
            case D3:
                // Spec for D3 is as follows:
                // D3:::
                tokener = new JsonTokener(body);
                tags = FluentIterable.from(tokener.nextArray()).transform(Functions.toStringFunction()).toSet();
                tokener.next(':');
                boolean isConstant = false;
                boolean isMapDelta = false;
                char changeFlag = tokener.next();
                while (changeFlag != ':' && changeFlag != 0) {
                    // In the future there may be more change flags, though for now we're only interested in
                    // those provided below
                    switch (ChangeFlag.deserialize(changeFlag)) {
                        case CONSTANT_DELTA:
                            isConstant = true;
                            break;
                        case MAP_DELTA:
                            isMapDelta = true;
                            break;
                    }
                    changeFlag = tokener.next();
                }

                // There are numerous circumstances where the expense of parsing a literal map delta is wasted.  For
                // example, with two consecutive literal deltas for the same record the elder is immediately replaced
                // by the latter, so resources spent parsing and instantiating the elder are unnecessary.  Return a lazy
                // map literal instead to defer instantiation until necessary.
                if (isConstant && isMapDelta) {
                    builder.with(Deltas.literal(new LazyJsonMap(body.substring(tokener.pos())))).with(tags);
                } else {
                    // Even if the delta is not a literal map delta there are still benefits to evaluating it lazily.
                    // For example, if a delta is behind a compaction record but has not yet been deleted it won't
                    // be used.
                    builder.with(new LazyDelta(tokener, isConstant)).with(tags);
                }
                break;
            case C1:
                builder.with(JsonHelper.fromJson(body, Compaction.class));
                break;
            case H1:
                builder.with(JsonHelper.fromJson(body, History.class));
                break;
            default:
                throw new UnsupportedOperationException(encoding.name());
        }
        return builder.build();
    }

    @Override
    public Compaction decodeCompaction(ByteBuffer buf) {
        // Used in the first pass of the resolver, doesn't bother decoding deltas since they're not relevant in pass 1.
        int sep = getSeparatorIndex(buf);
        if (getEncoding(buf, sep) != Encoding.C1) {
            return null;  // Not a compaction record
        }
        return JsonHelper.fromJson(getBody(buf, sep), Compaction.class);
    }

    /** Returns the index of the colon that separates the encoding prefix from the body suffix. */
    private int getSeparatorIndex(ByteBuffer buf) {
        int colon = BufferUtils.indexOf(buf, (byte) ':');
        if (colon == -1) {
            throw new IllegalStateException("Unknown encoding format: " + ByteBufferUtil.bytesToHex(buf));
        }
        return colon;
    }

    private Encoding getEncoding(ByteBuffer buf, int sep) {
        // This method gets called frequently enough that it's worth avoiding string building & memory allocation.
        int position = buf.position();

        if (sep == 2) {
            switch (buf.get(position) | (buf.get(position + 1) << 8)) {
                case 'D' | ('1' << 8):
                    return Encoding.D1;
                case 'D' | ('2' << 8):
                    return Encoding.D2;
                case 'D' | ('3' << 8):
                    return Encoding.D3;
                case 'C' | ('1' << 8):
                    return Encoding.C1;
                case 'H' | ('1' << 8):
                    return Encoding.H1;
            }
        }
        throw new IllegalArgumentException("Unknown encoding: " + BufferUtils.getString(buf, position, sep, Charsets.US_ASCII));
    }

    private String getBody(ByteBuffer buf, int sep) {
        return BufferUtils.getString(buf, sep + 1, buf.remaining() - (sep + 1), Charsets.UTF_8);
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy