org.apache.hadoop.hbase.mapreduce.BigtableTableHashAccessor Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of bigtable-hbase-1.x-mapreduce Show documentation
Show all versions of bigtable-hbase-1.x-mapreduce Show documentation
This project contains tweaks to the hbase 1.* map reduce jobs that work for
bigtable.
Specifically, HBase's Import M/R job has ZooKeeper referrence which needed
to be removed
in order to work with Bigtable.
/*
* Copyright 2022 Google LLC
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.hadoop.hbase.mapreduce;
import com.google.bigtable.repackaged.com.google.api.core.InternalApi;
import com.google.common.collect.ImmutableList;
import java.io.IOException;
import org.apache.hadoop.hbase.client.Result;
import org.apache.hadoop.hbase.client.Scan;
import org.apache.hadoop.hbase.io.ImmutableBytesWritable;
import org.apache.hadoop.hbase.mapreduce.HashTable.ResultHasher;
import org.apache.hadoop.hbase.mapreduce.HashTable.TableHash;
/** A helper class to access package private fields of HashTable.TableHash. */
@InternalApi
public class BigtableTableHashAccessor {
// Restrict object creation. This class should only be used to access state from TableHash.
private BigtableTableHashAccessor() {}
public static int getNumHashFiles(TableHash hash) {
return hash.numHashFiles;
}
public static ImmutableList getPartitions(TableHash hash) {
return ImmutableList.copyOf(hash.partitions);
}
public static ImmutableBytesWritable getStartRow(TableHash hash) {
return new ImmutableBytesWritable(hash.startRow);
}
public static ImmutableBytesWritable getStopRow(TableHash hash) {
return new ImmutableBytesWritable(hash.stopRow);
}
public static Scan getScan(TableHash hash) throws IOException {
return hash.initScan();
}
public static String getTableName(TableHash hash) {
return hash.tableName;
}
public static long getBatchSize(TableHash hash) {
return hash.batchSize;
}
public static String getHashDataDir() {
return HashTable.HASH_DATA_DIR;
}
public static String getHashOutputDataFilePrefix() {
return HashTable.OUTPUT_DATA_FILE_PREFIX;
}
public static boolean isTableEndRow(byte[] row) {
return HashTable.isTableEndRow(row);
}
// Wrapper to access package private class ResultHasher. Delegates all the calls to underlying
// TableHash.ResultHasher, helps in mocking for unit tests.
public static class BigtableResultHasher {
private final ResultHasher hasher;
public BigtableResultHasher() {
hasher = new ResultHasher();
}
public void startBatch(ImmutableBytesWritable batchStartKey) {
hasher.startBatch(batchStartKey);
}
public void finishBatch() {
hasher.finishBatch();
}
public ImmutableBytesWritable getBatchHash() {
return hasher.getBatchHash();
}
public void hashResult(Result result) {
hasher.hashResult(result);
}
public boolean isBatchStarted() {
return hasher.isBatchStarted();
}
public long getBatchSize() {
return hasher.getBatchSize();
}
public ImmutableBytesWritable getBatchStartKey() {
return hasher.getBatchStartKey();
}
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy