All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.hadoop.hive.ql.lockmgr.HiveTxnManager Maven / Gradle / Ivy

There is a newer version: 4.0.0
Show newest version
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.hadoop.hive.ql.lockmgr;

import org.apache.hadoop.hive.common.ValidTxnList;
import org.apache.hadoop.hive.common.ValidTxnWriteIdList;
import org.apache.hadoop.hive.metastore.api.CommitTxnRequest;
import org.apache.hadoop.hive.metastore.api.GetOpenTxnsResponse;
import org.apache.hadoop.hive.metastore.api.LockResponse;
import org.apache.hadoop.hive.metastore.api.TxnToWriteId;
import org.apache.hadoop.hive.metastore.api.TxnType;
import org.apache.hadoop.hive.ql.Context;
import org.apache.hadoop.hive.ql.DriverState;
import org.apache.hadoop.hive.ql.ddl.database.lock.LockDatabaseDesc;
import org.apache.hadoop.hive.ql.ddl.database.unlock.UnlockDatabaseDesc;
import org.apache.hadoop.hive.ql.ddl.table.lock.LockTableDesc;
import org.apache.hadoop.hive.ql.ddl.table.lock.UnlockTableDesc;
import org.apache.hadoop.hive.ql.QueryPlan;
import org.apache.hadoop.hive.ql.metadata.Hive;
import org.apache.hadoop.hive.ql.metadata.HiveException;

import java.util.List;

/**
 * An interface that allows Hive to manage transactions.  All classes
 * implementing this should extend {@link HiveTxnManagerImpl} rather than
 * implementing this directly.
 */
public interface HiveTxnManager {

  /**
   * Open a new transaction.
   * @param ctx Context for this query
   * @param user Hive user who is opening this transaction.
   * @return The new transaction id
   * @throws LockException if a transaction is already open.
   */
  long openTxn(Context ctx, String user) throws LockException;

 /**
  * Open a new transaction.
  * @param ctx Context for this query
  * @param user Hive user who is opening this transaction.
  * @param txnType transaction type.
  * @return The new transaction id
  * @throws LockException if a transaction is already open.
  */
  long openTxn(Context ctx, String user, TxnType txnType) throws LockException;

  /**
   * Open a new transaction in target cluster.
   * @param replPolicy Replication policy to uniquely identify the source cluster.
   * @param srcTxnIds The ids of the transaction at the source cluster
   * @param user The user who has fired the repl load command
   * @return The new transaction id.
   * @throws LockException in case of failure to start the transaction.
   */
  List replOpenTxn(String replPolicy, List srcTxnIds, String user) throws LockException;

  /**
   * Commit the transaction in target cluster.
   *
   * @param rqst Commit transaction request having information related to commit txn and write events.
   * @throws LockException in case of failure to commit the transaction.
   */
  void replCommitTxn(CommitTxnRequest rqst) throws LockException;

 /**
   * Abort the transaction in target cluster.
   * @param replPolicy Replication policy to uniquely identify the source cluster.
   * @param srcTxnId The id of the transaction at the source cluster
   * @throws LockException in case of failure to abort the transaction.
   */
  void replRollbackTxn(String replPolicy, long srcTxnId) throws LockException;

 /**
  * Replicate Table Write Ids state to mark aborted write ids and writeid high water mark.
  * @param validWriteIdList Snapshot of writeid list when the table/partition is dumped.
  * @param dbName Database name
  * @param tableName Table which is written.
  * @param partNames List of partitions being written.
  * @throws LockException in case of failure.
  */
  void replTableWriteIdState(String validWriteIdList, String dbName, String tableName, List partNames)
          throws LockException;

  /**
   * Get the lock manager.  This must be used rather than instantiating an
   * instance of the lock manager directly as the transaction manager will
   * choose which lock manager to instantiate.
   * @return the instance of the lock manager
   * @throws LockException if there is an issue obtaining the lock manager.
   */
  HiveLockManager getLockManager() throws LockException;

  /**
   * Acquire all of the locks needed by a query.  If used with a query that
   * requires transactions, this should be called after {@link #openTxn(Context, String)}.
   * A list of acquired locks will be stored in the
   * {@link org.apache.hadoop.hive.ql.Context} object and can be retrieved
   * via {@link org.apache.hadoop.hive.ql.Context#getHiveLocks}.
   *
   * @param plan query plan
   * @param ctx Context for this query
   * @param username name of the user for this query
   * @throws LockException if there is an error getting the locks.  Use {@link LockException#getCanonicalErrorMsg()}
   * to get more info on how to handle the exception.
   */
  void acquireLocks(QueryPlan plan, Context ctx, String username) throws LockException;

  /**
   * Acquire all of the locks needed by a query.  If used with a query that
   * requires transactions, this should be called after {@link #openTxn(Context, String)}.
   * A list of acquired locks will be stored in the
   * {@link org.apache.hadoop.hive.ql.Context} object and can be retrieved
   * via {@link org.apache.hadoop.hive.ql.Context#getHiveLocks}.
   * @param plan query plan
   * @param ctx Context for this query
   * @param username name of the user for this query
   * @param driverState the state to inform if the query cancelled or not
   * @throws LockException if there is an error getting the locks
   */
   void acquireLocks(QueryPlan plan, Context ctx, String username, DriverState driverState) throws LockException;

  /**
   * Release specified locks.
   * Transaction aware TxnManagers, which has {@code supportsAcid() == true},
   * will track locks internally and ignore this parameter
   * @param hiveLocks The list of locks to be released.
   */
  void releaseLocks(List hiveLocks) throws LockException;

  /**
   * Commit the current transaction.  This will release all locks obtained in
   * {@link #acquireLocks(org.apache.hadoop.hive.ql.QueryPlan,
   * org.apache.hadoop.hive.ql.Context, java.lang.String)}.
   * @throws LockException if there is no current transaction or the
   * transaction has already been committed or aborted.
   */
  void commitTxn() throws LockException;

  /**
   * Abort the current transaction.  This will release all locks obtained in
   * {@link #acquireLocks(org.apache.hadoop.hive.ql.QueryPlan,
   * org.apache.hadoop.hive.ql.Context, java.lang.String)}.
   * @throws LockException if there is no current transaction or the
   * transaction has already been committed or aborted.
   */
  void rollbackTxn() throws LockException;

  /**
   * Send a heartbeat to the transaction management storage so other Hive
   * clients know that the transaction and locks held by this client are
   * still valid.  For implementations that do not require heartbeats this
   * can be a no-op.
   * @throws LockException If current transaction exists or the transaction
   * has already been committed or aborted.
   */
  void heartbeat() throws LockException;

  GetOpenTxnsResponse getOpenTxns() throws LockException;

  /**
   * Get the transactions that are currently valid.  The resulting
   * {@link ValidTxnList} object can be passed as string to the processing
   * tasks for use in the reading the data.  This call should be made once up
   * front by the planner and should never be called on the backend,
   * as this will violate the isolation level semantics.
   * @return list of valid transactions.
   * @throws LockException
   */
  ValidTxnList getValidTxns() throws LockException;

 /**
  * Get the transactions that are currently valid.  The resulting
  * {@link ValidTxnList} object can be passed as string to the processing
  * tasks for use in the reading the data.  This call should be made once up
  * front by the planner and should never be called on the backend,
  * as this will violate the isolation level semantics.
  * @return list of valid transactions.
  * @param  excludeTxnTypes list of transaction types that should be excluded.
  * @throws LockException
  */
  ValidTxnList getValidTxns(List excludeTxnTypes) throws LockException;

  /**
   * Get the table write Ids that are valid for the current transaction.  The resulting
   * {@link ValidTxnWriteIdList} object can be passed as string to the processing
   * tasks for use in the reading the data.  This call will return same results as long as validTxnString
   * passed is same.
   * @param tableList list of tables (<db_name>.<table_name>) read/written by current transaction.
   * @param validTxnList snapshot of valid txns for the current txn
   * @return list of valid table write Ids.
   * @throws LockException
   */
  ValidTxnWriteIdList getValidWriteIds(List tableList, String validTxnList) throws LockException;

  /**
   * Get the name for currently installed transaction manager.
   * @return transaction manager name
   */
  String getTxnManagerName();

  /**
   * This call closes down the transaction manager.  All open transactions
   * are aborted.  If no transactions are open but locks are held those locks
   * are released.  This method should be called if processing of a session
   * is being halted in an abnormal way.  It avoids locks and transactions
   * timing out.
   */
  void closeTxnManager();

  /**
   * Indicate whether this lock manager supports the use of lock
   * database or lock table.
   * @return
   */
  boolean supportsExplicitLock();

  /**
   * This function is called to lock the table when explicit lock command is
   * issued on a table.
   * @param hiveDB    an object to communicate with the metastore
   * @param lockTbl   table locking info, such as table name, locking mode
   * @return 0 if the locking succeeds, 1 otherwise.
   * @throws HiveException
   */
  int lockTable(Hive hiveDB, LockTableDesc lockTbl) throws HiveException;

  /**
   * This function is called to unlock the table when explicit unlock command is
   * issued on a table.
   * @param hiveDB    an object to communicate with the metastore
   * @param unlockTbl table unlocking info, such as table name
   * @return 0 if the locking succeeds, 1 otherwise.
   * @throws HiveException
   */
  int unlockTable(Hive hiveDB, UnlockTableDesc unlockTbl) throws HiveException;

  /**
   * This function is called to lock the database when explicit lock command is
   * issued on a database.
   * @param hiveDB    an object to communicate with the metastore
   * @param lockDb    database locking info, such as database name, locking mode
   * @return 0 if the locking succeeds, 1 otherwise.
   * @throws HiveException
   */
  int lockDatabase(Hive hiveDB, LockDatabaseDesc lockDb) throws HiveException;

  /**
   * This function is called to unlock the database when explicit unlock command
   * is issued on a database.
   * @param hiveDB    an object to communicate with the metastore
   * @param unlockDb  database unlocking info, such as database name
   * @return 0 if the locking succeeds, 1 otherwise.
   * @throws HiveException
   */
  int unlockDatabase(Hive hiveDB, UnlockDatabaseDesc unlockDb) throws HiveException;

  /**
   * Indicate whether this transaction manager returns information about locks in the new format
   * for show locks or the old one.
   * @return true if the new format should be used.
   */
  boolean useNewShowLocksFormat();

  /**
   * Indicate whether this transaction manager supports ACID operations.
   * @return true if this transaction manager does ACID
   */
  boolean supportsAcid();

  /**
   * For resources that support MVCC, the state of the DB must be recorded for the duration of the
   * operation/transaction.  Returns {@code true} if current statement needs to do this.
   */
  boolean recordSnapshot(QueryPlan queryPlan);

  @Deprecated
  boolean isImplicitTransactionOpen();

  boolean isImplicitTransactionOpen(Context ctx);

  boolean isTxnOpen();
  /**
   * if {@code isTxnOpen()}, returns the currently active transaction ID.
   */
  long getCurrentTxnId();

 /**
  * if {@code writeId > 0}, sets it in the tableWriteId cache, otherwise, calls {@link #getTableWriteId(String, String)}.
  * @param dbName
  * @param tableName
  * @throws LockException
  */
 void setTableWriteId(String dbName, String tableName, long writeId) throws LockException;

 /**
   * if {@code isTxnOpen()}, returns the table write ID associated with current active transaction.
   */
  long getTableWriteId(String dbName, String tableName) throws LockException;

 /**
  * if {@code isTxnOpen()}, returns the already allocated table write ID of the table with
  * the given "dbName.tableName" for the current active transaction.
  * If not allocated, then returns 0.
  * @param dbName
  * @param tableName
  * @return 0 if not yet allocated
  * @throws LockException
  */
 long getAllocatedTableWriteId(String dbName, String tableName) throws LockException;

 /**
   * Allocates write id for each transaction in the list.
   * @param dbName database name
   * @param tableName the name of the table to allocate the write id
   * @param replPolicy used by replication task to identify the source cluster
   * @param srcTxnToWriteIdList List of txn id to write id Map
   * @throws LockException
   */
  void replAllocateTableWriteIdsBatch(String dbName, String tableName, String replPolicy,
                                      List srcTxnToWriteIdList) throws LockException;

  /**
   * Should be though of more as a unique write operation ID in a given txn (at QueryPlan level).
   * Each statement writing data within a multi statement txn should have a unique WriteId.
   * Even a single statement, (e.g. Merge, multi-insert may generates several writes).
   */
  int getStmtIdAndIncrement();

  // Can be used by operation to set the stmt id when allocation is done somewhere else.
  int getCurrentStmtId();

  /**
   * Reset locally cached information.
   * This is called before re-compilation after aquiring lock if the transaction is not
   * outdated. The intent is to clear any cached information such as WriteIds (but not
   * reseting/rolling back the overall transaction).
   */
   void clearCaches();

  /**
   * Acquire the materialization rebuild lock for a given view. We need to specify the fully
   * qualified name of the materialized view and the open transaction ID so we can identify
   * uniquely the lock.
   * @return the response from the metastore, where the lock id is equal to the txn id and
   * the status can be either ACQUIRED or NOT ACQUIRED
   */
  LockResponse acquireMaterializationRebuildLock(String dbName, String tableName, long txnId)
      throws LockException;

 /**
  * Checks if there is a conflicting transaction
  * @return latest txnId in conflict
  */ 
 long getLatestTxnIdInConflict() throws LockException;

 /**
  * Return the queryId this txnManager is handling
  * @return
  */
 String getQueryid();

 /**
  * Persists txnWriteId hwm list into a backend DB to identify obsolete directories eligible for cleanup
  */
 void addWriteIdsToMinHistory(QueryPlan plan, ValidTxnWriteIdList txnWriteIds);
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy