All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.hadoop.hbase.wal.WALEdit Maven / Gradle / Ivy

There is a newer version: 3.0.0-beta-1
Show newest version
/**
 *
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.hadoop.hbase.wal;

import java.io.IOException;
import java.util.ArrayList;
import java.util.List;
import java.util.Map;
import java.util.Set;
import java.util.TreeSet;

import org.apache.hadoop.hbase.Cell;
import org.apache.hadoop.hbase.CellUtil;
import org.apache.hadoop.hbase.HBaseInterfaceAudience;
import org.apache.hadoop.hbase.PrivateCellUtil;
import org.apache.hadoop.hbase.KeyValue;
import org.apache.hadoop.hbase.client.RegionInfo;
import org.apache.hadoop.hbase.codec.Codec;
import org.apache.hadoop.hbase.io.HeapSize;
import org.apache.hadoop.hbase.util.Bytes;
import org.apache.hadoop.hbase.util.ClassSize;
import org.apache.hadoop.hbase.util.EnvironmentEdgeManager;
import org.apache.yetus.audience.InterfaceAudience;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.apache.hbase.thirdparty.com.google.common.annotations.VisibleForTesting;
import org.apache.hadoop.hbase.shaded.protobuf.generated.WALProtos;
import org.apache.hadoop.hbase.shaded.protobuf.generated.WALProtos.CompactionDescriptor;
import org.apache.hadoop.hbase.shaded.protobuf.generated.WALProtos.FlushDescriptor;
import org.apache.hadoop.hbase.shaded.protobuf.generated.WALProtos.RegionEventDescriptor;


/**
 * Used in HBase's transaction log (WAL) to represent a collection of edits (Cell/KeyValue objects)
 * that came in as a single transaction. All the edits for a given transaction are written out as a
 * single record, in PB format, followed (optionally) by Cells written via the WALCellEncoder.
 * 

This class is LimitedPrivate for CPs to read-only. The {@link #add} methods are * classified as private methods, not for use by CPs.

*

WALEdit will accumulate a Set of all column family names referenced by the Cells * {@link #add(Cell)}'d. This is an optimization. Usually when loading a WALEdit, we have the * column family name to-hand.. just shove it into the WALEdit if available. Doing this, we can * save on a parse of each Cell to figure column family down the line when we go to add the * WALEdit to the WAL file. See the hand-off in FSWALEntry Constructor. */ // TODO: Do not expose this class to Coprocessors. It has set methods. A CP might meddle. @InterfaceAudience.LimitedPrivate({ HBaseInterfaceAudience.REPLICATION, HBaseInterfaceAudience.COPROC }) public class WALEdit implements HeapSize { private static final Logger LOG = LoggerFactory.getLogger(WALEdit.class); // TODO: Get rid of this; see HBASE-8457 public static final byte [] METAFAMILY = Bytes.toBytes("METAFAMILY"); @VisibleForTesting public static final byte [] METAROW = Bytes.toBytes("METAROW"); @VisibleForTesting public static final byte[] COMPACTION = Bytes.toBytes("HBASE::COMPACTION"); @VisibleForTesting public static final byte [] FLUSH = Bytes.toBytes("HBASE::FLUSH"); @VisibleForTesting public static final byte [] REGION_EVENT = Bytes.toBytes("HBASE::REGION_EVENT"); @VisibleForTesting public static final byte [] BULK_LOAD = Bytes.toBytes("HBASE::BULK_LOAD"); private final boolean replay; private ArrayList cells = null; /** * All the Cell families in cells. Updated by {@link #add(Cell)} and * {@link #add(Map)}. This Set is passed to the FSWALEntry so it does not have * to recalculate the Set of families in a transaction; makes for a bunch of CPU savings. * An optimization that saves on CPU-expensive Cell-parsing. */ private Set families = null; public WALEdit() { this(false); } /** * @deprecated Since 2.0.1. Use {@link #WALEdit(int, boolean)} instead. */ @Deprecated public WALEdit(boolean isReplay) { this(1, isReplay); } /** * @deprecated Since 2.0.1. Use {@link #WALEdit(int, boolean)} instead. */ @Deprecated public WALEdit(int cellCount) { this(cellCount, false); } /** * @param cellCount Pass so can pre-size the WALEdit. Optimization. */ public WALEdit(int cellCount, boolean isReplay) { this.replay = isReplay; cells = new ArrayList<>(cellCount); } private Set getOrCreateFamilies() { if (this.families == null) { this.families = new TreeSet(Bytes.BYTES_COMPARATOR); } return this.families; } /** * For use by FSWALEntry ONLY. An optimization. * @return All families in {@link #getCells()}; may be null. */ public Set getFamilies() { return this.families; } /** * @return True is f is {@link #METAFAMILY} */ public static boolean isMetaEditFamily(final byte [] f) { return Bytes.equals(METAFAMILY, f); } public static boolean isMetaEditFamily(Cell cell) { return CellUtil.matchingFamily(cell, METAFAMILY); } public boolean isMetaEdit() { for (Cell cell: cells) { if (!isMetaEditFamily(cell)) { return false; } } return true; } /** * @return True when current WALEdit is created by log replay. Replication skips WALEdits from * replay. */ public boolean isReplay() { return this.replay; } @InterfaceAudience.Private public WALEdit add(Cell cell, byte [] family) { getOrCreateFamilies().add(family); return addCell(cell); } @InterfaceAudience.Private public WALEdit add(Cell cell) { // We clone Family each time we add a Cell. Expensive but safe. For CPU savings, use // add(Map) or add(Cell, family). return add(cell, CellUtil.cloneFamily(cell)); } public boolean isEmpty() { return cells.isEmpty(); } public int size() { return cells.size(); } public ArrayList getCells() { return cells; } /** * This is not thread safe. * This will change the WALEdit and shouldn't be used unless you are sure that nothing * else depends on the contents being immutable. * * @param cells the list of cells that this WALEdit now contains. */ @InterfaceAudience.Private // Used by replay. public void setCells(ArrayList cells) { this.cells = cells; this.families = null; } /** * Reads WALEdit from cells. * @param cellDecoder Cell decoder. * @param expectedCount Expected cell count. * @return Number of KVs read. */ public int readFromCells(Codec.Decoder cellDecoder, int expectedCount) throws IOException { cells.clear(); cells.ensureCapacity(expectedCount); while (cells.size() < expectedCount && cellDecoder.advance()) { cells.add(cellDecoder.current()); } return cells.size(); } @Override public long heapSize() { long ret = ClassSize.ARRAYLIST; for (Cell cell : cells) { ret += PrivateCellUtil.estimatedSizeOfCell(cell); } return ret; } public long estimatedSerializedSizeOf() { long ret = 0; for (Cell cell: cells) { ret += PrivateCellUtil.estimatedSerializedSizeOf(cell); } return ret; } @Override public String toString() { StringBuilder sb = new StringBuilder(); sb.append("[#edits: " + cells.size() + " = <"); for (Cell cell : cells) { sb.append(cell); sb.append("; "); } sb.append(">]"); return sb.toString(); } public static WALEdit createFlushWALEdit(RegionInfo hri, FlushDescriptor f) { KeyValue kv = new KeyValue(getRowForRegion(hri), METAFAMILY, FLUSH, EnvironmentEdgeManager.currentTime(), f.toByteArray()); return new WALEdit().add(kv, METAFAMILY); } public static FlushDescriptor getFlushDescriptor(Cell cell) throws IOException { if (CellUtil.matchingColumn(cell, METAFAMILY, FLUSH)) { return FlushDescriptor.parseFrom(CellUtil.cloneValue(cell)); } return null; } public static WALEdit createRegionEventWALEdit(RegionInfo hri, RegionEventDescriptor regionEventDesc) { KeyValue kv = new KeyValue(getRowForRegion(hri), METAFAMILY, REGION_EVENT, EnvironmentEdgeManager.currentTime(), regionEventDesc.toByteArray()); return new WALEdit().add(kv, METAFAMILY); } public static RegionEventDescriptor getRegionEventDescriptor(Cell cell) throws IOException { if (CellUtil.matchingColumn(cell, METAFAMILY, REGION_EVENT)) { return RegionEventDescriptor.parseFrom(CellUtil.cloneValue(cell)); } return null; } /** * Create a compaction WALEdit * @param c * @return A WALEdit that has c serialized as its value */ public static WALEdit createCompaction(final RegionInfo hri, final CompactionDescriptor c) { byte [] pbbytes = c.toByteArray(); KeyValue kv = new KeyValue(getRowForRegion(hri), METAFAMILY, COMPACTION, EnvironmentEdgeManager.currentTime(), pbbytes); return new WALEdit().add(kv, METAFAMILY); //replication scope null so this won't be replicated } public static byte[] getRowForRegion(RegionInfo hri) { byte[] startKey = hri.getStartKey(); if (startKey.length == 0) { // empty row key is not allowed in mutations because it is both the start key and the end key // we return the smallest byte[] that is bigger (in lex comparison) than byte[0]. return new byte[] {0}; } return startKey; } /** * Deserialized and returns a CompactionDescriptor is the KeyValue contains one. * @param kv the key value * @return deserialized CompactionDescriptor or null. */ public static CompactionDescriptor getCompaction(Cell kv) throws IOException { if (isCompactionMarker(kv)) { return CompactionDescriptor.parseFrom(CellUtil.cloneValue(kv)); } return null; } /** * Returns true if the given cell is a serialized {@link CompactionDescriptor} * * @see #getCompaction(Cell) */ public static boolean isCompactionMarker(Cell cell) { return CellUtil.matchingColumn(cell, METAFAMILY, COMPACTION); } /** * Create a bulk loader WALEdit * * @param hri The RegionInfo for the region in which we are bulk loading * @param bulkLoadDescriptor The descriptor for the Bulk Loader * @return The WALEdit for the BulkLoad */ public static WALEdit createBulkLoadEvent(RegionInfo hri, WALProtos.BulkLoadDescriptor bulkLoadDescriptor) { KeyValue kv = new KeyValue(getRowForRegion(hri), METAFAMILY, BULK_LOAD, EnvironmentEdgeManager.currentTime(), bulkLoadDescriptor.toByteArray()); return new WALEdit().add(kv, METAFAMILY); } /** * Deserialized and returns a BulkLoadDescriptor from the passed in Cell * @param cell the key value * @return deserialized BulkLoadDescriptor or null. */ public static WALProtos.BulkLoadDescriptor getBulkLoadDescriptor(Cell cell) throws IOException { if (CellUtil.matchingColumn(cell, METAFAMILY, BULK_LOAD)) { return WALProtos.BulkLoadDescriptor.parseFrom(CellUtil.cloneValue(cell)); } return null; } /** * Append the given map of family->edits to a WALEdit data structure. * This does not write to the WAL itself. * Note that as an optimization, we will stamp the Set of column families into the WALEdit * to save on our having to calculate it subsequently way down in the actual WAL writing. * * @param familyMap map of family->edits */ public void add(Map> familyMap) { for (Map.Entry> e: familyMap.entrySet()) { // 'foreach' loop NOT used. See HBASE-12023 "...creates too many iterator objects." int listSize = e.getValue().size(); // Add all Cells first and then at end, add the family rather than call {@link #add(Cell)} // and have it clone family each time. Optimization! for (int i = 0; i < listSize; i++) { addCell(e.getValue().get(i)); } addFamily(e.getKey()); } } private void addFamily(byte [] family) { getOrCreateFamilies().add(family); } private WALEdit addCell(Cell cell) { this.cells.add(cell); return this; } }





© 2015 - 2024 Weber Informatics LLC | Privacy Policy