All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.phoenix.hbase.index.covered.IndexCodec Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more contributor license agreements. See the NOTICE
 * file distributed with this work for additional information regarding copyright ownership. The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the
 * License. You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by
 * applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language
 * governing permissions and limitations under the License.
 */
package org.apache.phoenix.hbase.index.covered;

import java.io.IOException;

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.hbase.client.Mutation;
import org.apache.hadoop.hbase.client.Put;
import org.apache.phoenix.hbase.index.BaseIndexCodec;

/**
 * Codec for creating index updates from the current state of a table.
 * 

* Generally, you should extend {@link BaseIndexCodec} instead, so help maintain compatibility as features need to be * added to the codec, as well as potentially not haivng to implement some methods. */ public interface IndexCodec { /** * Get the index cleanup entries. Currently, this must return just single row deletes (where just the row-key is * specified and no columns are returned) mapped to the table name. For instance, to you have an index 'myIndex' * with row : * *

     * v1,v2,v3 | CF:CQ0  | rowkey
     *          | CF:CQ1  | rowkey
     * 
* * To then cleanup this entry, you would just return 'v1,v2,v3', 'myIndex'. * * @param state * the current state of the table that needs to be cleaned up. Generally, you only care about the latest * column values, for each column you are indexing for each index table. * @param context TODO * @param regionStartKey TODO * @param regionEndKey TODO * @return the pairs of (deletes, index table name) that should be applied. * @throws IOException */ public Iterable getIndexDeletes(TableState state, IndexMetaData context, byte[] regionStartKey, byte[] regionEndKey) throws IOException; // table state has the pending update already applied, before calling // get the new index entries /** * Get the index updates for the primary table state, for each index table. The returned {@link Put}s need to be * fully specified (including timestamp) to minimize passes over the same key-values multiple times. *

* You must specify the same timestamps on the Put as {@link TableState#getCurrentTimestamp()} so the index entries * match the primary table row. This could be managed at a higher level, but would require iterating all the kvs in * the Put again - very inefficient when compared to the current interface where you must provide a timestamp * anyways (so you might as well provide the right one). * * @param state * the current state of the table that needs to an index update Generally, you only care about the latest * column values, for each column you are indexing for each index table. * @param context TODO * @param regionStartKey TODO * @param regionEndKey TODO * @return the pairs of (updates,index table name) that should be applied. * @throws IOException */ public Iterable getIndexUpserts(TableState state, IndexMetaData context, byte[] regionStartKey, byte[] regionEndKey, boolean verified) throws IOException; /** * This allows the codec to dynamically change whether or not indexing should take place for a table. If it doesn't * take place, we can save a lot of time on the regular Put patch. By making it dynamic, we can save offlining and * then onlining a table just to turn indexing on. *

* We can also be smart about even indexing a given update here too - if the update doesn't contain any columns that * we care about indexing, we can save the effort of analyzing the put and further. * * @param m * mutation that should be indexed. * @return true if indexing is enabled for the given table. This should be on a per-table basis, as each * codec is instantiated per-region. */ public boolean isEnabled(Mutation m); public void initialize(Configuration conf, byte[] tableName); }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy