All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.hadoop.hdfs.util.Diff Maven / Gradle / Ivy

There is a newer version: 3.4.1
Show newest version
/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.hadoop.hdfs.util;

import java.util.ArrayList;
import java.util.Collections;
import java.util.Iterator;
import java.util.List;

import com.google.common.base.Preconditions;

/**
 * The difference between the current state and a previous state of a list.
 * 
 * Given a previous state of a set and a sequence of create, delete and modify
 * operations such that the current state of the set can be obtained by applying
 * the operations on the previous state, the following algorithm construct the
 * difference between the current state and the previous state of the set.
 * 
 * 
 * Two lists are maintained in the algorithm:
 * - c-list for newly created elements
 * - d-list for the deleted elements
 *
 * Denote the state of an element by the following
 *   (0, 0): neither in c-list nor d-list
 *   (c, 0): in c-list but not in d-list
 *   (0, d): in d-list but not in c-list
 *   (c, d): in both c-list and d-list
 *
 * For each case below, ( , ) at the end shows the result state of the element.
 *
 * Case 1. Suppose the element i is NOT in the previous state.           (0, 0)
 *   1.1. create i in current: add it to c-list                          (c, 0)
 *   1.1.1. create i in current and then create: impossible
 *   1.1.2. create i in current and then delete: remove it from c-list   (0, 0)
 *   1.1.3. create i in current and then modify: replace it in c-list    (c', 0)
 *
 *   1.2. delete i from current: impossible
 *
 *   1.3. modify i in current: impossible
 *
 * Case 2. Suppose the element i is ALREADY in the previous state.       (0, 0)
 *   2.1. create i in current: impossible
 *
 *   2.2. delete i from current: add it to d-list                        (0, d)
 *   2.2.1. delete i from current and then create: add it to c-list      (c, d)
 *   2.2.2. delete i from current and then delete: impossible
 *   2.2.2. delete i from current and then modify: impossible
 *
 *   2.3. modify i in current: put it in both c-list and d-list          (c, d)
 *   2.3.1. modify i in current and then create: impossible
 *   2.3.2. modify i in current and then delete: remove it from c-list   (0, d)
 *   2.3.3. modify i in current and then modify: replace it in c-list    (c', d)
 * 
* * @param The key type. * @param The element type, which must implement {@link Element} interface. */ public class Diff> { public static enum ListType { CREATED, DELETED } /** An interface for the elements in a {@link Diff}. */ public static interface Element extends Comparable { /** @return the key of this object. */ public K getKey(); } /** An interface for passing a method in order to process elements. */ public static interface Processor { /** Process the given element. */ public void process(E element); } /** Containing exactly one element. */ public static class Container { private final E element; private Container(E element) { this.element = element; } /** @return the element. */ public E getElement() { return element; } } /** * Undo information for some operations such as delete(E) * and {@link Diff#modify(Element, Element)}. */ public static class UndoInfo { private final int createdInsertionPoint; private final E trashed; private final Integer deletedInsertionPoint; private UndoInfo(final int createdInsertionPoint, final E trashed, final Integer deletedInsertionPoint) { this.createdInsertionPoint = createdInsertionPoint; this.trashed = trashed; this.deletedInsertionPoint = deletedInsertionPoint; } public E getTrashedElement() { return trashed; } } private static final int DEFAULT_ARRAY_INITIAL_CAPACITY = 4; /** * Search the element from the list. * @return -1 if the list is null; otherwise, return the insertion point * defined in {@link Collections#binarySearch(List, Object)}. * Note that, when the list is null, -1 is the correct insertion point. */ protected static > int search( final List elements, final K name) { return elements == null? -1: Collections.binarySearch(elements, name); } private static void remove(final List elements, final int i, final E expected) { final E removed = elements.remove(-i - 1); Preconditions.checkState(removed == expected, "removed != expected=%s, removed=%s.", expected, removed); } /** c-list: element(s) created in current. */ private List created; /** d-list: element(s) deleted from current. */ private List deleted; protected Diff() {} protected Diff(final List created, final List deleted) { this.created = created; this.deleted = deleted; } /** @return the created list, which is never null. */ public List getList(final ListType type) { final List list = type == ListType.CREATED ? created : deleted; return list == null ? Collections.emptyList() : list; } public List getCreatedUnmodifiable() { return created != null? Collections.unmodifiableList(created) : Collections.emptyList(); } public E setCreated(int index, E element) { final E old = created.set(index, element); if (old.compareTo(element.getKey()) != 0) { throw new AssertionError("Element mismatched: element=" + element + " but old=" + old); } return old; } public boolean removeCreated(final E element) { if (created != null) { final int i = search(created, element.getKey()); if (i >= 0 && created.get(i) == element) { created.remove(i); return true; } } return false; } public void clearCreated() { if (created != null) { created.clear(); } } public List getDeletedUnmodifiable() { return deleted != null? Collections.unmodifiableList(deleted) : Collections.emptyList(); } public boolean containsDeleted(final K key) { if (deleted != null) { return search(deleted, key) >= 0; } return false; } public int searchIndex(final ListType type, final K name) { return search(getList(type), name); } /** * @return null if the element is not found; * otherwise, return the element in the created/deleted list. */ public E search(final ListType type, final K name) { final List list = getList(type); final int c = search(list, name); return c < 0 ? null : list.get(c); } /** @return true if no changes contained in the diff */ public boolean isEmpty() { return (created == null || created.isEmpty()) && (deleted == null || deleted.isEmpty()); } /** * Insert the given element to the created/deleted list. * @param i the insertion point defined * in {@link Collections#binarySearch(List, Object)} */ private void insert(final ListType type, final E element, final int i) { List list = type == ListType.CREATED? created: deleted; if (i >= 0) { throw new AssertionError("Element already exists: element=" + element + ", " + type + "=" + list); } if (list == null) { list = new ArrayList(DEFAULT_ARRAY_INITIAL_CAPACITY); if (type == ListType.CREATED) { created = list; } else if (type == ListType.DELETED){ deleted = list; } } list.add(-i - 1, element); } /** * Create an element in current state. * @return the c-list insertion point for undo. */ public int create(final E element) { final int c = search(created, element.getKey()); insert(ListType.CREATED, element, c); return c; } /** * Undo the previous create(E) operation. Note that the behavior is * undefined if the previous operation is not create(E). */ public void undoCreate(final E element, final int insertionPoint) { remove(created, insertionPoint, element); } /** * Delete an element from current state. * @return the undo information. */ public UndoInfo delete(final E element) { final int c = search(created, element.getKey()); E previous = null; Integer d = null; if (c >= 0) { // remove a newly created element previous = created.remove(c); } else { // not in c-list, it must be in previous d = search(deleted, element.getKey()); insert(ListType.DELETED, element, d); } return new UndoInfo(c, previous, d); } /** * Undo the previous delete(E) operation. Note that the behavior is * undefined if the previous operation is not delete(E). */ public void undoDelete(final E element, final UndoInfo undoInfo) { final int c = undoInfo.createdInsertionPoint; if (c >= 0) { created.add(c, undoInfo.trashed); } else { remove(deleted, undoInfo.deletedInsertionPoint, element); } } /** * Modify an element in current state. * @return the undo information. */ public UndoInfo modify(final E oldElement, final E newElement) { Preconditions.checkArgument(oldElement != newElement, "They are the same object: oldElement == newElement = %s", newElement); Preconditions.checkArgument(oldElement.compareTo(newElement.getKey()) == 0, "The names do not match: oldElement=%s, newElement=%s", oldElement, newElement); final int c = search(created, newElement.getKey()); E previous = null; Integer d = null; if (c >= 0) { // Case 1.1.3 and 2.3.3: element is already in c-list, previous = created.set(c, newElement); // For previous != oldElement, set it to oldElement previous = oldElement; } else { d = search(deleted, oldElement.getKey()); if (d < 0) { // Case 2.3: neither in c-list nor d-list insert(ListType.CREATED, newElement, c); insert(ListType.DELETED, oldElement, d); } } return new UndoInfo(c, previous, d); } /** * Undo the previous modify(E, E) operation. Note that the behavior * is undefined if the previous operation is not modify(E, E). */ public void undoModify(final E oldElement, final E newElement, final UndoInfo undoInfo) { final int c = undoInfo.createdInsertionPoint; if (c >= 0) { created.set(c, undoInfo.trashed); } else { final int d = undoInfo.deletedInsertionPoint; if (d < 0) { remove(created, c, newElement); remove(deleted, d, oldElement); } } } /** * Find an element in the previous state. * * @return null if the element cannot be determined in the previous state * since no change is recorded and it should be determined in the * current state; otherwise, return a {@link Container} containing the * element in the previous state. Note that the element can possibly * be null which means that the element is not found in the previous * state. */ public Container accessPrevious(final K name) { return accessPrevious(name, created, deleted); } private static > Container accessPrevious( final K name, final List clist, final List dlist) { final int d = search(dlist, name); if (d >= 0) { // the element was in previous and was once deleted in current. return new Container(dlist.get(d)); } else { final int c = search(clist, name); // When c >= 0, the element in current is a newly created element. return c < 0? null: new Container(null); } } /** * Find an element in the current state. * * @return null if the element cannot be determined in the current state since * no change is recorded and it should be determined in the previous * state; otherwise, return a {@link Container} containing the element in * the current state. Note that the element can possibly be null which * means that the element is not found in the current state. */ public Container accessCurrent(K name) { return accessPrevious(name, deleted, created); } /** * Apply this diff to previous state in order to obtain current state. * @return the current state of the list. */ public List apply2Previous(final List previous) { return apply2Previous(previous, getList(ListType.CREATED), getList(ListType.DELETED)); } private static > List apply2Previous( final List previous, final List clist, final List dlist) { // Assumptions: // (A1) All lists are sorted. // (A2) All elements in dlist must be in previous. // (A3) All elements in clist must be not in tmp = previous - dlist. final List tmp = new ArrayList(previous.size() - dlist.size()); { // tmp = previous - dlist final Iterator i = previous.iterator(); for(E deleted : dlist) { E e = i.next(); //since dlist is non-empty, e must exist by (A2). int cmp = 0; for(; (cmp = e.compareTo(deleted.getKey())) < 0; e = i.next()) { tmp.add(e); } Preconditions.checkState(cmp == 0); // check (A2) } for(; i.hasNext(); ) { tmp.add(i.next()); } } final List current = new ArrayList(tmp.size() + clist.size()); { // current = tmp + clist final Iterator tmpIterator = tmp.iterator(); final Iterator cIterator = clist.iterator(); E t = tmpIterator.hasNext()? tmpIterator.next(): null; E c = cIterator.hasNext()? cIterator.next(): null; for(; t != null || c != null; ) { final int cmp = c == null? 1 : t == null? -1 : c.compareTo(t.getKey()); if (cmp < 0) { current.add(c); c = cIterator.hasNext()? cIterator.next(): null; } else if (cmp > 0) { current.add(t); t = tmpIterator.hasNext()? tmpIterator.next(): null; } else { throw new AssertionError("Violated assumption (A3)."); } } } return current; } /** * Apply the reverse of this diff to current state in order * to obtain the previous state. * @return the previous state of the list. */ public List apply2Current(final List current) { return apply2Previous(current, getList(ListType.DELETED), getList(ListType.CREATED)); } /** * Combine this diff with a posterior diff. We have the following cases: * *
   * 1. For (c, 0) in the posterior diff, check the element in this diff:
   * 1.1 (c', 0)  in this diff: impossible
   * 1.2 (0, d')  in this diff: put in c-list --> (c, d')
   * 1.3 (c', d') in this diff: impossible
   * 1.4 (0, 0)   in this diff: put in c-list --> (c, 0)
   * This is the same logic as create(E).
   * 
   * 2. For (0, d) in the posterior diff,
   * 2.1 (c', 0)  in this diff: remove from c-list --> (0, 0)
   * 2.2 (0, d')  in this diff: impossible
   * 2.3 (c', d') in this diff: remove from c-list --> (0, d')
   * 2.4 (0, 0)   in this diff: put in d-list --> (0, d)
   * This is the same logic as delete(E).
   * 
   * 3. For (c, d) in the posterior diff,
   * 3.1 (c', 0)  in this diff: replace the element in c-list --> (c, 0)
   * 3.2 (0, d')  in this diff: impossible
   * 3.3 (c', d') in this diff: replace the element in c-list --> (c, d')
   * 3.4 (0, 0)   in this diff: put in c-list and d-list --> (c, d)
   * This is the same logic as modify(E, E).
   * 
* * @param posterior The posterior diff to combine with. * @param deletedProcesser * process the deleted/overwritten elements in case 2.1, 2.3, 3.1 and 3.3. */ public void combinePosterior(final Diff posterior, final Processor deletedProcesser) { final Iterator createdIterator = posterior.getList(ListType.CREATED).iterator(); final Iterator deletedIterator = posterior.getList(ListType.DELETED).iterator(); E c = createdIterator.hasNext()? createdIterator.next(): null; E d = deletedIterator.hasNext()? deletedIterator.next(): null; for(; c != null || d != null; ) { final int cmp = c == null? 1 : d == null? -1 : c.compareTo(d.getKey()); if (cmp < 0) { // case 1: only in c-list create(c); c = createdIterator.hasNext()? createdIterator.next(): null; } else if (cmp > 0) { // case 2: only in d-list final UndoInfo ui = delete(d); if (deletedProcesser != null) { deletedProcesser.process(ui.trashed); } d = deletedIterator.hasNext()? deletedIterator.next(): null; } else { // case 3: in both c-list and d-list final UndoInfo ui = modify(d, c); if (deletedProcesser != null) { deletedProcesser.process(ui.trashed); } c = createdIterator.hasNext()? createdIterator.next(): null; d = deletedIterator.hasNext()? deletedIterator.next(): null; } } } @Override public String toString() { return getClass().getSimpleName() + "{created=" + getList(ListType.CREATED) + ", deleted=" + getList(ListType.DELETED) + "}"; } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy