All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.bazaarvoice.emodb.sor.db.DeltaIterator Maven / Gradle / Ivy

There is a newer version: 6.5.190
Show newest version
package com.bazaarvoice.emodb.sor.db;


import com.google.common.collect.AbstractIterator;
import com.google.common.collect.Lists;

import java.nio.ByteBuffer;
import java.util.Collections;
import java.util.Iterator;
import java.util.List;
import java.util.UUID;


/**
 *  Iterator abstraction that stitches blocked deltas together
 */
abstract public class DeltaIterator extends AbstractIterator {

    private List _list;

    private final Iterator _iterator;
    private R _next;
    private R _oldDelta;
    private final boolean _reverse;
    private final int _prefixLength;
    private boolean _firstIteration;
    private String _rowKey;

    public DeltaIterator(Iterator iterator, boolean reverse, int prefixLength, String rowKey) {
        _iterator = iterator;
        _reverse = reverse;
        _prefixLength = prefixLength;
        _firstIteration = true;
        _rowKey = rowKey;
    }

    // stitch delta together in reverse
    private BlockedDelta reverseCompute() {
        int contentSize = getValue(_next).remaining();
        UUID correctChangeId = getChangeId(_next);
        int numBlocks = 1;

        if (_list == null) {
            _list = Lists.newArrayListWithCapacity(3);
        }

        _list.add(_next);


        _oldDelta = _next;

        while (_iterator.hasNext() && getChangeId(_next = _iterator.next()).equals(correctChangeId)) {
            numBlocks++;
            _list.add(_next);
            contentSize += getValue(_next).remaining();
            _next = null;
        }

        Collections.reverse(_list);

        // delta is fragmented if the first block is not zero. In this case, we skip it.
        if (getBlock(_list.get(0)) != 0) {
            // We must also clear the list of the fragmented delta blocks to avoid them being stitched in with
            // the next delta, which will cause a buffer overflow
            _list.clear();
            return null;
        }

        int expectedBlocks = getNumBlocks(_list.get(0));

        while (expectedBlocks != _list.size()) {
            contentSize -= getValue(_list.remove(_list.size() - 1)).remaining();
        }

        return new BlockedDelta(numBlocks, stitchContent(contentSize));

    }

    // stitch delta together and return it as one bytebuffer
    private BlockedDelta compute(int numBlocks) {

        int contentSize = getValue(_next).remaining();
        _oldDelta = _next;
        UUID changeId = getChangeId(_next);

        if (_list == null) {
            _list = Lists.newArrayListWithCapacity(numBlocks);
        }

        _list.add(_next);

        for (int i = 1; i < numBlocks; i++) {
            if (_iterator.hasNext()) {
                _next = _iterator.next();
                if (getChangeId(_next).equals(changeId)) {
                    _list.add(_next);
                    contentSize += getValue(_next).remaining();
                } else {
                    // fragmented delta encountered, we must skip over it

                    // We must also clear the list of the fragmented delta blocks to avoid them being stitched in with
                    // the next delta, which will cause a buffer overflow
                    _list.clear();
                    return null;
                }
            } else {
                // fragmented delta and no other deltas to skip to
                throw new DeltaStitchingException(_rowKey, getChangeId(_next).toString(), numBlocks, i - 1);
            }
        }

        numBlocks += skipForward();

        return new BlockedDelta(numBlocks, stitchContent(contentSize));
    }

    @Override
    protected T computeNext() {

        if (_firstIteration) {
            if (_iterator.hasNext()) {
                _next = _iterator.next();
                _firstIteration = false;
            }
        }

        while(true) {

            if (_next == null) {
                return endOfData();
            }

            BlockedDelta blockedDelta;

            if (!_reverse) {

                // Ensure that the block we are looking at is truly the first block in the sequence. It not,
                // we should skip over it.
                // TODO: add a metric here so that we know if this is happening. The only case where this should be
                // permissable is when a delta is overwritten by another with the same changeid. Ideally, we will rid
                // ourselves of this possiblility entirely, and fail the request if the condition below is ever satisfied
                if (getBlock(_next) != 0) {
                    skipForward();
                }

                int numBlocks = getNumBlocks(_next);

                if (numBlocks == 1) {
                    R delta = _next;
                    numBlocks += skipForward();
                    return convertDelta(delta, new BlockedDelta(numBlocks, getValue(delta)));
                }

                blockedDelta = compute(numBlocks);

            } else {
                if (getBlock(_next) == 0) {
                    if (getNumBlocks(_next) != 1) {
                        continue;
                    }
                    T ret = convertDelta(_next, new BlockedDelta(1, getValue(_next)));
                    _next = _iterator.hasNext() ? _iterator.next() : null;
                    return ret;
                }

                blockedDelta = reverseCompute();
            }

            if (blockedDelta != null) {
                return convertDelta(_oldDelta, blockedDelta);
            }

        }
    }

    // This handles the edge case in which a client has explicity specified a changeId when writing and overwrote an exisiting delta.
    private int skipForward() {
        int numSkips = 0;
        _next = null;
        while (_iterator.hasNext() && getBlock(_next = _iterator.next()) != 0) {
            numSkips++;
            _next = null;
        }
        return numSkips;
    }

    // converts utf-8 encoded hex to int by building it digit by digit.
    private int getNumBlocks(R delta) {
        ByteBuffer content = getValue(delta);
        int numBlocks = 0;

        // build numBlocks by adding together each hex digit
        for (int i = 0; i < _prefixLength; i++) {
            byte b = content.get(i);
            numBlocks = numBlocks << 4 | (b <= '9' ? b - '0' : b - 'A' + 10);
        }

        return numBlocks;
    }

    private ByteBuffer stitchContent(int contentSize) {
        ByteBuffer content = ByteBuffer.allocate(contentSize);
        for (R delta : _list) {
            content.put(getValue(delta).duplicate());
        }
        content.position(0);
        _list.clear();
        return content;
    }

    protected static class BlockedDelta {
        private final int _numBlocks;
        private final ByteBuffer _content;

        public BlockedDelta(int numBlocks, ByteBuffer content) {
            _numBlocks = numBlocks;
            _content = content;
        }

        public int getNumBlocks() {
            return _numBlocks;
        }

        public ByteBuffer getContent() {
            return _content;
        }
    }

    // transforms delta from the provided type to the return type, while also changing content to be the parameter provided
    abstract protected T convertDelta(R delta, BlockedDelta blockedDelta);

    // get block number from delta
    abstract protected int getBlock(R delta);

    // get change UUID from delta
    abstract protected UUID getChangeId(R delta);

    // get delta content from delta
    abstract protected ByteBuffer getValue(R delta);

}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy