com.hp.autonomy.aci.content.database.Databases Maven / Gradle / Ivy
/*
* Copyright 2009-2015 Hewlett-Packard Development Company, L.P.
* Licensed under the MIT License (the "License"); you may not use this file except in compliance with the License.
*/
package com.hp.autonomy.aci.content.database;
import com.hp.autonomy.aci.content.identifier.QueryIdentifiers;
import org.apache.commons.lang.StringUtils;
import org.apache.commons.lang.Validate;
import java.util.Arrays;
import java.util.Collections;
import java.util.Iterator;
import java.util.LinkedHashSet;
import java.util.Set;
import java.util.regex.Pattern;
/**
* Helper class for building database restrictions, such as those used in the databasematch parameter of a
* query. Individual database names are represented as Strings and deduplicated where possible.
*
*
Some of the characteristics of the {@code append} methods of this class might be considered inconsistent with the
* behaviour of IDOL's databasematch parameter. This has been done to make those methods behave as a logical
* OR operations in all circumstances. The IDOL behaviour which is not honoured is:
*
*
* - An empty databasematch will match all non-internal databases, whereas * will match all
* databases.
*
- If the first non-blank database in the databasematch is a * then it will match everything. If
* the * appears later in the databasematch it is ignored.
*
*
* Instead, {@code Databases} exhibits the following behaviour:
*
*
* - If * is added to an instance then all other values will be discarded.
*
- If an instance is empty then its string representation will be a nonsense string intended to match no
* databases.
*
- An instance cannot be created that has an empty string representation.
*
- {@link #parse(String)} treats an empty string as equivalent to *.
*
*
* This class makes no attempt at internal synchronization and an instance is not safe to be used by multiple threads
* without external synchronization.
*/
public class Databases implements Iterable, QueryIdentifiers {
private static final String MATCH_NOTHING = "MATCH_NOTHING_9be3e331-8046-4182-9e2d-ebbcf12f6e4c";
private static final Pattern SEPARATORS = Pattern.compile("[,\\+ ]");
private static final Pattern INVALID = Pattern.compile(".*[,\\+ ].*");
private static final Pattern SPACES = Pattern.compile(" *");
private final Set values = new LinkedHashSet();
/**
* An instance of {@code Databases} that corresponds to all databases, i.e. *
*
*
This instance is immutable, attempting to append further databases will only validate their names, it will not
* actually append them.
*/
public static final Databases ALL = new Databases("*");
/**
* Create a new instance using the database names provided.
*
* @param databases The names of the databases
*/
public Databases(final Iterable databases) {
doAppend(databases);
}
/**
* Create a new instance using the database names provided.
*
* @param databases The names of the databases
*/
public Databases(final String... databases) {
doAppend(Arrays.asList(databases));
}
/**
* Appends the given database names to this instance.
*
* @param values The names of the databases
* @return {@code this}
*/
public Databases append(final Iterable values) {
return doAppend(values);
}
/**
* Appends the given database names to this instance.
*
* @param values The names of the databases
* @return {@code this}
*/
public Databases append(final String... values) {
return doAppend(Arrays.asList(values));
}
private Databases doAppend(final Iterable databases) {
Validate.notNull(databases, "Databases must not be null");
// In case of nulls, build a new Set and then add them all
final Set newDatabases = new LinkedHashSet();
for (final String database : databases) {
Validate.isTrue(StringUtils.isNotEmpty(database), "One of the database names provided was empty");
Validate.isTrue(!INVALID.matcher(database).matches(), "A database name cannot contain a plus, comma or whitespace: [" + database + ']');
// Split on comma, plus and space
newDatabases.add(database);
}
// Here we use contains rather than just this.equals(ALL) to avoid using an overridable method from a
// constructor. Once the use of 'final' is sorted out for this class we might change it back to the more obvious
// version.
if (!this.values.contains("*")) {
if (newDatabases.contains("*")) {
this.values.clear();
this.values.add("*");
}
else {
this.values.addAll(newDatabases);
}
}
return this;
}
/**
* {@link Iterator} for the database names. Removing elements is not currently supported.
*
* @return A suitable iterator
*/
@Override
public Iterator iterator() {
// For now we disable removal
return Collections.unmodifiableSet(values).iterator();
}
/**
* The number of database names currently in this instance.
*
* @return Number of databases
*/
public int size() {
return values.size();
}
/**
* Whether or not size is 0. Note that, for consistency reasons, empty corresponds to matching no databases rather
* than all databases and the implementations of {@link #toString()} and {@link #toIndexingString()} takes this into
* account.
*
* @return {@code true} if and only if {@code size() == 0}
*/
@Override
public boolean isEmpty() {
return values.isEmpty();
}
/**
* Two {@code Databases} objects are considered equal if they contain the same set of database names. Equality is
* order invariant.
*
* @param obj A object to test for equality
* @return {@code true} if the {@code obj} is equal to {@code this}
*/
@Override
public boolean equals(final Object obj) {
return this == obj || obj instanceof Databases && this.values.equals(((Databases) obj).values);
}
/**
* A suitable hashcode implementation.
*
* @return The hashcode
*/
@Override
public int hashCode() {
return values.hashCode();
}
/**
* A {@code String} representation of the databases, suitable for use in a query or getcontent
* action.
*
*
If this object is empty then this method will return a nonsense value that will not match any database. This
* makes appending databases consistently an OR operation and also closes a common security hole. Note that
* when building a query it is generally preferred to explicitly check {@link #isEmpty()} rather than proceeding to
* execute a query that matches no documents.
*
* @return A string representation of the databases
*/
@Override
public String toString() {
final StringBuilder builder = new StringBuilder();
for(final String value : this) {
// Oddly, this doesn't need URL encoding
builder.append(value).append('+');
}
if(builder.length() == 0) {
return MATCH_NOTHING;
}
builder.deleteCharAt(builder.length() - 1);
return builder.toString();
}
/**
*
* @return {@code "databasematch"} or equivalent
*/
@Override
public String getMatchParameterName() {
return DATABASE_MATCH;
}
/**
*
* @return {@code "DREDBNAME"} or equivalent
*/
@Override
public String getIndexingIdentifierName() {
return DREDBNAME;
}
/**
*
A {@code String} representation of the databases, suitable for use in a DREREPLACE index command.
*
*
If this object is empty then current behaviour is to return a nonsense value. Note that this behaviour should
* not be relied upon and an explicit check using {@link #isEmpty()} should be used instead.
*
* @return A string representation of the databases
*/
@Override
public String toIndexingString() {
return toString();
}
/**
* Converts an iterable of strings into a {@code Databases}. This method can be more efficient than using the
* equivalent constructor but the returned object might be backed by the object provided.
*
* @param databases The references to convert
* @return An equivalent instance of {@code Databases}
*/
public static Databases from(final Iterable databases) {
return (databases instanceof Databases) ? (Databases)databases : new Databases(databases);
}
/**
* Parses a {@code String} of database names in the format used in a query or getcontent action.
* This includes parsing the output of {@link #toString()}. An empty string will be treated as equivalent to
* *, even though technically there is a slight difference when working with internal databases.
*
* @param databases The string representation to parse
* @return A {@code Databases} object
*/
public static Databases parse(final String databases) {
Validate.notNull(databases, "Databases must not be null");
if (SPACES.matcher(databases).matches()) {
return Databases.ALL;
}
final Set databasesSet = new LinkedHashSet(Arrays.asList(SEPARATORS.split(databases)));
databasesSet.remove("");
if (databasesSet.isEmpty()) {
return new Databases();
}
if ("*".equals(databasesSet.iterator().next())) {
return ALL;
}
databasesSet.remove("*");
databasesSet.remove(MATCH_NOTHING);
return new Databases(databasesSet);
}
}