com.bigdata.btree.keys.IKeyBuilder Maven / Gradle / Ivy

Go to download
/*

Copyright (C) SYSTAP, LLC DBA Blazegraph 2006-2016.  All rights reserved.

Contact:
     SYSTAP, LLC DBA Blazegraph
     2501 Calvert ST NW #106
     Washington, DC 20008
     [email protected]

This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; version 2 of the License.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA

*/
/*
 * Created on Apr 30, 2007
 */

package com.bigdata.btree.keys;

import java.math.BigDecimal;
import java.math.BigInteger;
import java.util.Locale;
import java.util.Properties;
import java.util.UUID;

import com.bigdata.btree.keys.KeyBuilder.Options;
import com.bigdata.io.IManagedByteArray;
import com.bigdata.util.BytesUtil;

/**
 * 
 * Interface for building up variable length unsigned byte[] keys from
 * one or more primitive data type values and/or Unicode strings. An instance
 * of this interface may be {@link #reset()} and reused to encode a series of
 * keys.
 * 
 * 
 * A sort key is an unsigned byte[] that preserves the total order of the
 * original data. Sort keys may potentially be formed from multiple fields but
 * field markers do not appear within the resulting sort key. While the original
 * values can be extracted from sort keys (this is true of all the fixed length
 * fields, such as int, long, float, or double) they can not be extracted from
 * Unicode variable length fields (the collation ordering for a Unicode string
 * depends on the {@link Locale}, the collation strength, and the decomposition
 * mode and is a non-reversible operation).
 * 
 * <h2>Unicode</h2>
 * 
 * Factory methods are defined by {@link KeyBuilder} for obtaining instances of
 * this interface that optionally support Unicode. Instances may be created for
 * a given {@link Locale}, collation strength, decomposition mode, etc.
 * 
 * 
 * The ICU library supports generation of compressed Unicode sort keys and is
 * used by default when available. The JDK {@link java.text} package also
 * supports the generation of Unicode sort keys, but it does NOT produce
 * compressed sort keys. The resulting sort keys are therefore (a) incompatible
 * with those produced by the ICU library and (b) much larger than those
 * produced by the ICU library.
 * 
 * 
 * Support for Unicode MAY be disabled using {@link Options#COLLATOR}, by using
 * {@link KeyBuilder#newInstance()} or another factory method that does not
 * enable Unicode support, or by using one of the {@link KeyBuilder}
 * constructors that does not support Unicode.
 * 
 * <h2>Multi-field keys with variable length fields</h2>
 * 
 * Multi-field keys in which variable length fields are embedded within the key
 * present a special problem. Any run of fixed length fields can be compared as
 * unsigned byte[]s. Likewise, any key with a fixed length prefix (including
 * zero) but a variable length field in its tail can also be compared directly
 * as unsigned byte[]s. However, the introduction of a variable length field
 * into any non-terminal position in a multi-field key must be handled specially
 * since simple concatenation of the field keys will NOT produce the correct
 * total ordering. (This is why SQL requires that text fields compare as if they
 * were padded out with ASCII blanks (0x20) to some maximum length for the
 * field.) A utility method exists specifically for this purpose - see
 * {@link #appendText(String, boolean, boolean)}.
 * 
 * 
 * @see KeyBuilder#newInstance()
 * @see KeyBuilder#newUnicodeInstance()
 * @see KeyBuilder#newUnicodeInstance(Properties)
 * @see SuccessorUtil
 * 
 * @author Bryan Thompson
 * @version $Id$
 */
public interface IKeyBuilder extends ISortKeyBuilder