/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.phoenix.mapreduce.util;

import java.io.IOException;
import java.util.UUID;

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.lib.db.DBWritable;
import org.apache.phoenix.mapreduce.PhoenixInputFormat;
import org.apache.phoenix.mapreduce.PhoenixOutputFormat;
import org.apache.phoenix.mapreduce.util.PhoenixConfigurationUtil.SchemaType;

/**
 * Utility class for setting Configuration parameters for the MapReduce job.
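 * <p>
 * A minimal usage sketch; {@code StockWritable} and the table/column names below are
 * hypothetical placeholders, not part of this API:
 * <pre>{@code
 * Configuration conf = HBaseConfiguration.create();
 * Job job = Job.getInstance(conf, "phoenix-stock-stats");
 *
 * // Read STOCK_NAME and RECORDING_YEAR from the STOCK table into StockWritable,
 * // a user-supplied DBWritable implementation.
 * PhoenixMapReduceUtil.setInput(job, StockWritable.class, "STOCK", null,
 *     "STOCK_NAME", "RECORDING_YEAR");
 *
 * // Upsert the job's results into the STOCK_STATS table.
 * PhoenixMapReduceUtil.setOutput(job, "STOCK_STATS", "STOCK_NAME,MAX_RECORDING");
 * }</pre>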
 */
public final class PhoenixMapReduceUtil {
    private PhoenixMapReduceUtil() {
    }

    /**
     * Sets the table to read from and, optionally, the conditions and columns of the generated
     * SELECT query.
     *
     * @param job MapReduce job
     * @param inputClass DBWritable class
     * @param tableName Input table name
     * @param conditions Condition clause to be added to the WHERE clause. Can be null if there are no conditions.
     * @param fieldNames fields being projected for the SELECT query.
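     *
     * <p>A short sketch; the table, column names and condition are hypothetical:
     * <pre>{@code
     * PhoenixMapReduceUtil.setInput(job, StockWritable.class, "STOCK",
     *     "RECORDING_YEAR > 2000", "STOCK_NAME", "RECORDING_YEAR");
     * }</pre>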
     */
    public static void setInput(final Job job, final Class<? extends DBWritable> inputClass,
            final String tableName, final String conditions, final String... fieldNames) {
        final Configuration configuration = setInput(job, inputClass, tableName);
        if (conditions != null) {
            PhoenixConfigurationUtil.setInputTableConditions(configuration, conditions);
        }
        PhoenixConfigurationUtil.setSelectColumnNames(configuration, fieldNames);
    }

    /**
     * Sets a free-form SELECT query as the input for the job.
     *
     * @param job MapReduce job
     * @param inputClass DBWritable class
     * @param tableName Input table name
     * @param inputQuery Select query.
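     *
     * <p>A short sketch; the table and query are hypothetical:
     * <pre>{@code
     * PhoenixMapReduceUtil.setInput(job, StockWritable.class, "STOCK",
     *     "SELECT STOCK_NAME, RECORDING_YEAR FROM STOCK WHERE RECORDING_YEAR > 2000");
     * }</pre>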
     */
    public static void setInput(final Job job, final Class<? extends DBWritable> inputClass,
            final String tableName, final String inputQuery) {
        final Configuration configuration = setInput(job, inputClass, tableName);
        PhoenixConfigurationUtil.setInputQuery(configuration, inputQuery);
        PhoenixConfigurationUtil.setSchemaType(configuration, SchemaType.QUERY);
    }

    /**
     * Sets the job to read from a table snapshot rather than the live table, optionally
     * restricting the conditions and columns of the generated SELECT query.
     *
     * @param job MapReduce job
     * @param inputClass DBWritable class
     * @param snapshotName The name of a snapshot (of a table) to read from
     * @param tableName Input table name
     * @param restoreDir a temporary dir to copy the snapshot files into
     * @param conditions Condition clause to be added to the WHERE clause. Can be null if there are no conditions.
     * @param fieldNames fields being projected for the SELECT query.
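     *
     * <p>A short sketch; the snapshot, restore path and column names are hypothetical:
     * <pre>{@code
     * PhoenixMapReduceUtil.setInput(job, StockWritable.class, "STOCK_SNAPSHOT", "STOCK",
     *     new Path("/tmp/snapshot-restore"), null, "STOCK_NAME", "RECORDING_YEAR");
     * }</pre>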
     */
    public static void setInput(final Job job, final Class<? extends DBWritable> inputClass,
            final String snapshotName, String tableName, Path restoreDir, final String conditions,
            final String... fieldNames) throws IOException {
        final Configuration configuration =
                setSnapshotInput(job, inputClass, snapshotName, tableName, restoreDir);
        if (conditions != null) {
            PhoenixConfigurationUtil.setInputTableConditions(configuration, conditions);
        }
        PhoenixConfigurationUtil.setSelectColumnNames(configuration, fieldNames);
    }

    /**
     * Sets the job to read the results of a SELECT query from a table snapshot rather than the
     * live table.
     *
     * @param job MapReduce job
     * @param inputClass DBWritable class
     * @param snapshotName The name of a snapshot (of a table) to read from
     * @param tableName Input table name
     * @param restoreDir a temporary dir to copy the snapshot files into
     * @param inputQuery The select query
     */
    public static void setInput(final Job job, final Class<? extends DBWritable> inputClass,
            final String snapshotName, String tableName, Path restoreDir, String inputQuery)
            throws IOException {
        final Configuration configuration =
                setSnapshotInput(job, inputClass, snapshotName, tableName, restoreDir);
        if (inputQuery != null) {
            PhoenixConfigurationUtil.setInputQuery(configuration, inputQuery);
        }
    }

    /**
     * Configures the job for snapshot-based input and returns its Configuration.
     *
     * @param job MapReduce job
     * @param inputClass DBWritable class
     * @param snapshotName The name of a snapshot (of a table) to read from
     * @param tableName Input table name
     * @param restoreDir a temporary dir to copy the snapshot files into
     */
    private static Configuration setSnapshotInput(Job job, Class<? extends DBWritable> inputClass,
            String snapshotName, String tableName, Path restoreDir) {
        job.setInputFormatClass(PhoenixInputFormat.class);
        final Configuration configuration = job.getConfiguration();
        PhoenixConfigurationUtil.setInputClass(configuration, inputClass);
        PhoenixConfigurationUtil.setSnapshotNameKey(configuration, snapshotName);
        PhoenixConfigurationUtil.setInputTableName(configuration, tableName);
        // Restore the snapshot into a unique subdirectory of restoreDir.
        PhoenixConfigurationUtil.setRestoreDirKey(configuration,
                new Path(restoreDir, UUID.randomUUID().toString()).toString());
        PhoenixConfigurationUtil.setSchemaType(configuration, SchemaType.QUERY);
        return configuration;
    }

    private static Configuration setInput(final Job job,
            final Class<? extends DBWritable> inputClass, final String tableName) {
        job.setInputFormatClass(PhoenixInputFormat.class);
        final Configuration configuration = job.getConfiguration();
        PhoenixConfigurationUtil.setInputTableName(configuration, tableName);
        PhoenixConfigurationUtil.setInputClass(configuration, inputClass);
        return configuration;
    }

    /**
     * Overrides which HBase cluster {@link PhoenixInputFormat} reads from.
     *
     * @param job MapReduce Job
     * @param quorum an HBase cluster's ZooKeeper quorum
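     *
     * <p>A short sketch; the hosts and port are hypothetical:
     * <pre>{@code
     * PhoenixMapReduceUtil.setInputCluster(job, "zk1.example.com,zk2.example.com:2181");
     * }</pre>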
     */
    public static void setInputCluster(final Job job, final String quorum) {
        final Configuration configuration = job.getConfiguration();
        PhoenixConfigurationUtil.setInputCluster(configuration, quorum);
    }

    /**
     * Sets the output table and the columns to upsert, given as a comma-separated list.
     *
     * @param job MapReduce job
     * @param tableName Output table
     * @param columns Comma-separated list of columns being upserted
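     *
     * <p>A short sketch; the table and column names are hypothetical:
     * <pre>{@code
     * PhoenixMapReduceUtil.setOutput(job, "STOCK_STATS", "STOCK_NAME,MAX_RECORDING");
     * }</pre>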
     */
    public static void setOutput(final Job job, final String tableName, final String columns) {
        job.setOutputFormatClass(PhoenixOutputFormat.class);
        final Configuration configuration = job.getConfiguration();
        PhoenixConfigurationUtil.setOutputTableName(configuration, tableName);
        PhoenixConfigurationUtil.setUpsertColumnNames(configuration, columns.split(","));
    }

    /**
     * Sets the output table and the columns to upsert, given as individual field names.
     *
     * @param job MapReduce job
     * @param tableName Output table
     * @param fieldNames fields being upserted
     */
    public static void setOutput(final Job job, final String tableName,
            final String... fieldNames) {
        job.setOutputFormatClass(PhoenixOutputFormat.class);
        final Configuration configuration = job.getConfiguration();
        PhoenixConfigurationUtil.setOutputTableName(configuration, tableName);
        PhoenixConfigurationUtil.setUpsertColumnNames(configuration, fieldNames);
    }

    /**
     * Overrides which HBase cluster {@link PhoenixOutputFormat} writes to.
     *
     * @param job MapReduce Job
     * @param quorum an HBase cluster's ZooKeeper quorum
     */
    public static void setOutputCluster(final Job job, final String quorum) {
        final Configuration configuration = job.getConfiguration();
        PhoenixConfigurationUtil.setOutputCluster(configuration, quorum);
    }

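    /**
     * Sets the tenant id used by the job's Phoenix connections when reading from or writing to
     * a multi-tenant table.
     *
     * @param job MapReduce job
     * @param tenantId tenant id of the multi-tenant table
     */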
    public static void setTenantId(final Job job, final String tenantId) {
        PhoenixConfigurationUtil.setTenantId(job.getConfiguration(), tenantId);
    }
}