All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.hadoop.hbase.mapreduce.BigtableTableHashAccessor Maven / Gradle / Ivy

Go to download

This project contains tweaks to the hbase 1.* map reduce jobs that work for bigtable. Specifically, HBase's Import M/R job has ZooKeeper referrence which needed to be removed in order to work with Bigtable.

There is a newer version: 2.14.8
Show newest version
/*
 * Copyright 2022 Google LLC
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.hadoop.hbase.mapreduce;

import com.google.bigtable.repackaged.com.google.api.core.InternalApi;
import com.google.common.collect.ImmutableList;
import java.io.IOException;
import org.apache.hadoop.hbase.client.Result;
import org.apache.hadoop.hbase.client.Scan;
import org.apache.hadoop.hbase.io.ImmutableBytesWritable;
import org.apache.hadoop.hbase.mapreduce.HashTable.ResultHasher;
import org.apache.hadoop.hbase.mapreduce.HashTable.TableHash;

/** A helper class to access package private fields of HashTable.TableHash. */
@InternalApi
public class BigtableTableHashAccessor {

  // Restrict object creation. This class should only be used to access state from TableHash.
  private BigtableTableHashAccessor() {}

  public static int getNumHashFiles(TableHash hash) {
    return hash.numHashFiles;
  }

  public static ImmutableList getPartitions(TableHash hash) {
    return ImmutableList.copyOf(hash.partitions);
  }

  public static ImmutableBytesWritable getStartRow(TableHash hash) {
    return new ImmutableBytesWritable(hash.startRow);
  }

  public static ImmutableBytesWritable getStopRow(TableHash hash) {
    return new ImmutableBytesWritable(hash.stopRow);
  }

  public static Scan getScan(TableHash hash) throws IOException {
    return hash.initScan();
  }

  public static String getTableName(TableHash hash) {
    return hash.tableName;
  }

  public static long getBatchSize(TableHash hash) {
    return hash.batchSize;
  }

  public static String getHashDataDir() {
    return HashTable.HASH_DATA_DIR;
  }

  public static String getHashOutputDataFilePrefix() {
    return HashTable.OUTPUT_DATA_FILE_PREFIX;
  }

  public static boolean isTableEndRow(byte[] row) {
    return HashTable.isTableEndRow(row);
  }

  // Wrapper to access package private class ResultHasher. Delegates all the calls to underlying
  // TableHash.ResultHasher, helps in mocking for unit tests.
  public static class BigtableResultHasher {
    private final ResultHasher hasher;

    public BigtableResultHasher() {
      hasher = new ResultHasher();
    }

    public void startBatch(ImmutableBytesWritable batchStartKey) {
      hasher.startBatch(batchStartKey);
    }

    public void finishBatch() {
      hasher.finishBatch();
    }

    public ImmutableBytesWritable getBatchHash() {
      return hasher.getBatchHash();
    }

    public void hashResult(Result result) {
      hasher.hashResult(result);
    }

    public boolean isBatchStarted() {
      return hasher.isBatchStarted();
    }

    public long getBatchSize() {
      return hasher.getBatchSize();
    }

    public ImmutableBytesWritable getBatchStartKey() {
      return hasher.getBatchStartKey();
    }
  }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy